neighbour.h 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535
  1. #ifndef _NET_NEIGHBOUR_H
  2. #define _NET_NEIGHBOUR_H
  3. #include <linux/neighbour.h>
  4. /*
  5. * Generic neighbour manipulation
  6. *
  7. * Authors:
  8. * Pedro Roque <[email protected]>
  9. * Alexey Kuznetsov <[email protected]>
  10. *
  11. * Changes:
  12. *
  13. * Harald Welte: <[email protected]>
  14. * - Add neighbour cache statistics like rtstat
  15. */
  16. #include <linux/atomic.h>
  17. #include <linux/netdevice.h>
  18. #include <linux/skbuff.h>
  19. #include <linux/rcupdate.h>
  20. #include <linux/seq_file.h>
  21. #include <linux/bitmap.h>
  22. #include <linux/err.h>
  23. #include <linux/sysctl.h>
  24. #include <linux/workqueue.h>
  25. #include <net/rtnetlink.h>
  26. /*
  27. * NUD stands for "neighbor unreachability detection"
  28. */
  29. #define NUD_IN_TIMER (NUD_INCOMPLETE|NUD_REACHABLE|NUD_DELAY|NUD_PROBE)
  30. #define NUD_VALID (NUD_PERMANENT|NUD_NOARP|NUD_REACHABLE|NUD_PROBE|NUD_STALE|NUD_DELAY)
  31. #define NUD_CONNECTED (NUD_PERMANENT|NUD_NOARP|NUD_REACHABLE)
  32. struct neighbour;
  33. enum {
  34. NEIGH_VAR_MCAST_PROBES,
  35. NEIGH_VAR_UCAST_PROBES,
  36. NEIGH_VAR_APP_PROBES,
  37. NEIGH_VAR_MCAST_REPROBES,
  38. NEIGH_VAR_RETRANS_TIME,
  39. NEIGH_VAR_BASE_REACHABLE_TIME,
  40. NEIGH_VAR_DELAY_PROBE_TIME,
  41. NEIGH_VAR_GC_STALETIME,
  42. NEIGH_VAR_QUEUE_LEN_BYTES,
  43. NEIGH_VAR_PROXY_QLEN,
  44. NEIGH_VAR_ANYCAST_DELAY,
  45. NEIGH_VAR_PROXY_DELAY,
  46. NEIGH_VAR_LOCKTIME,
  47. #define NEIGH_VAR_DATA_MAX (NEIGH_VAR_LOCKTIME + 1)
  48. /* Following are used as a second way to access one of the above */
  49. NEIGH_VAR_QUEUE_LEN, /* same data as NEIGH_VAR_QUEUE_LEN_BYTES */
  50. NEIGH_VAR_RETRANS_TIME_MS, /* same data as NEIGH_VAR_RETRANS_TIME */
  51. NEIGH_VAR_BASE_REACHABLE_TIME_MS, /* same data as NEIGH_VAR_BASE_REACHABLE_TIME */
  52. /* Following are used by "default" only */
  53. NEIGH_VAR_GC_INTERVAL,
  54. NEIGH_VAR_GC_THRESH1,
  55. NEIGH_VAR_GC_THRESH2,
  56. NEIGH_VAR_GC_THRESH3,
  57. NEIGH_VAR_PROBE,
  58. NEIGH_VAR_MAX
  59. };
  60. struct neigh_parms {
  61. possible_net_t net;
  62. struct net_device *dev;
  63. struct list_head list;
  64. int (*neigh_setup)(struct neighbour *);
  65. void (*neigh_cleanup)(struct neighbour *);
  66. struct neigh_table *tbl;
  67. void *sysctl_table;
  68. int dead;
  69. atomic_t refcnt;
  70. struct rcu_head rcu_head;
  71. int reachable_time;
  72. int data[NEIGH_VAR_DATA_MAX];
  73. DECLARE_BITMAP(data_state, NEIGH_VAR_DATA_MAX);
  74. };
  75. static inline void neigh_var_set(struct neigh_parms *p, int index, int val)
  76. {
  77. set_bit(index, p->data_state);
  78. p->data[index] = val;
  79. }
  80. #define NEIGH_VAR(p, attr) ((p)->data[NEIGH_VAR_ ## attr])
  81. /* In ndo_neigh_setup, NEIGH_VAR_INIT should be used.
  82. * In other cases, NEIGH_VAR_SET should be used.
  83. */
  84. #define NEIGH_VAR_INIT(p, attr, val) (NEIGH_VAR(p, attr) = val)
  85. #define NEIGH_VAR_SET(p, attr, val) neigh_var_set(p, NEIGH_VAR_ ## attr, val)
  86. static inline void neigh_parms_data_state_setall(struct neigh_parms *p)
  87. {
  88. bitmap_fill(p->data_state, NEIGH_VAR_DATA_MAX);
  89. }
  90. static inline void neigh_parms_data_state_cleanall(struct neigh_parms *p)
  91. {
  92. bitmap_zero(p->data_state, NEIGH_VAR_DATA_MAX);
  93. }
  94. struct neigh_statistics {
  95. unsigned long allocs; /* number of allocated neighs */
  96. unsigned long destroys; /* number of destroyed neighs */
  97. unsigned long hash_grows; /* number of hash resizes */
  98. unsigned long res_failed; /* number of failed resolutions */
  99. unsigned long lookups; /* number of lookups */
  100. unsigned long hits; /* number of hits (among lookups) */
  101. unsigned long rcv_probes_mcast; /* number of received mcast ipv6 */
  102. unsigned long rcv_probes_ucast; /* number of received ucast ipv6 */
  103. unsigned long periodic_gc_runs; /* number of periodic GC runs */
  104. unsigned long forced_gc_runs; /* number of forced GC runs */
  105. unsigned long unres_discards; /* number of unresolved drops */
  106. unsigned long table_fulls; /* times even gc couldn't help */
  107. };
  108. #define NEIGH_CACHE_STAT_INC(tbl, field) this_cpu_inc((tbl)->stats->field)
  109. struct neighbour {
  110. struct neighbour __rcu *next;
  111. struct neigh_table *tbl;
  112. struct neigh_parms *parms;
  113. unsigned long confirmed;
  114. unsigned long updated;
  115. rwlock_t lock;
  116. atomic_t refcnt;
  117. struct sk_buff_head arp_queue;
  118. unsigned int arp_queue_len_bytes;
  119. struct timer_list timer;
  120. unsigned long used;
  121. atomic_t probes;
  122. __u8 flags;
  123. __u8 nud_state;
  124. __u8 type;
  125. __u8 dead;
  126. seqlock_t ha_lock;
  127. unsigned char ha[ALIGN(MAX_ADDR_LEN, sizeof(unsigned long))];
  128. struct hh_cache hh;
  129. int (*output)(struct neighbour *, struct sk_buff *);
  130. const struct neigh_ops *ops;
  131. struct rcu_head rcu;
  132. struct net_device *dev;
  133. u8 primary_key[0];
  134. };
  135. struct neigh_ops {
  136. int family;
  137. void (*solicit)(struct neighbour *, struct sk_buff *);
  138. void (*error_report)(struct neighbour *, struct sk_buff *);
  139. int (*output)(struct neighbour *, struct sk_buff *);
  140. int (*connected_output)(struct neighbour *, struct sk_buff *);
  141. };
  142. struct pneigh_entry {
  143. struct pneigh_entry *next;
  144. possible_net_t net;
  145. struct net_device *dev;
  146. u8 flags;
  147. u8 key[0];
  148. };
  149. /*
  150. * neighbour table manipulation
  151. */
  152. #define NEIGH_NUM_HASH_RND 4
  153. struct neigh_hash_table {
  154. struct neighbour __rcu **hash_buckets;
  155. unsigned int hash_shift;
  156. __u32 hash_rnd[NEIGH_NUM_HASH_RND];
  157. struct rcu_head rcu;
  158. };
  159. struct neigh_table {
  160. int family;
  161. int entry_size;
  162. int key_len;
  163. __be16 protocol;
  164. __u32 (*hash)(const void *pkey,
  165. const struct net_device *dev,
  166. __u32 *hash_rnd);
  167. bool (*key_eq)(const struct neighbour *, const void *pkey);
  168. int (*constructor)(struct neighbour *);
  169. int (*pconstructor)(struct pneigh_entry *);
  170. void (*pdestructor)(struct pneigh_entry *);
  171. void (*proxy_redo)(struct sk_buff *skb);
  172. char *id;
  173. struct neigh_parms parms;
  174. struct list_head parms_list;
  175. int gc_interval;
  176. int gc_thresh1;
  177. int gc_thresh2;
  178. int gc_thresh3;
  179. unsigned long last_flush;
  180. struct delayed_work gc_work;
  181. struct timer_list proxy_timer;
  182. struct sk_buff_head proxy_queue;
  183. atomic_t entries;
  184. rwlock_t lock;
  185. unsigned long last_rand;
  186. struct neigh_statistics __percpu *stats;
  187. struct neigh_hash_table __rcu *nht;
  188. struct pneigh_entry **phash_buckets;
  189. };
  190. enum {
  191. NEIGH_ARP_TABLE = 0,
  192. NEIGH_ND_TABLE = 1,
  193. NEIGH_DN_TABLE = 2,
  194. NEIGH_NR_TABLES,
  195. NEIGH_LINK_TABLE = NEIGH_NR_TABLES /* Pseudo table for neigh_xmit */
  196. };
  197. static inline int neigh_parms_family(struct neigh_parms *p)
  198. {
  199. return p->tbl->family;
  200. }
  201. #define NEIGH_PRIV_ALIGN sizeof(long long)
  202. #define NEIGH_ENTRY_SIZE(size) ALIGN((size), NEIGH_PRIV_ALIGN)
  203. static inline void *neighbour_priv(const struct neighbour *n)
  204. {
  205. return (char *)n + n->tbl->entry_size;
  206. }
  207. /* flags for neigh_update() */
  208. #define NEIGH_UPDATE_F_OVERRIDE 0x00000001
  209. #define NEIGH_UPDATE_F_WEAK_OVERRIDE 0x00000002
  210. #define NEIGH_UPDATE_F_OVERRIDE_ISROUTER 0x00000004
  211. #define NEIGH_UPDATE_F_ISROUTER 0x40000000
  212. #define NEIGH_UPDATE_F_ADMIN 0x80000000
  213. static inline bool neigh_key_eq16(const struct neighbour *n, const void *pkey)
  214. {
  215. return *(const u16 *)n->primary_key == *(const u16 *)pkey;
  216. }
  217. static inline bool neigh_key_eq32(const struct neighbour *n, const void *pkey)
  218. {
  219. return *(const u32 *)n->primary_key == *(const u32 *)pkey;
  220. }
  221. static inline bool neigh_key_eq128(const struct neighbour *n, const void *pkey)
  222. {
  223. const u32 *n32 = (const u32 *)n->primary_key;
  224. const u32 *p32 = pkey;
  225. return ((n32[0] ^ p32[0]) | (n32[1] ^ p32[1]) |
  226. (n32[2] ^ p32[2]) | (n32[3] ^ p32[3])) == 0;
  227. }
  228. static inline struct neighbour *___neigh_lookup_noref(
  229. struct neigh_table *tbl,
  230. bool (*key_eq)(const struct neighbour *n, const void *pkey),
  231. __u32 (*hash)(const void *pkey,
  232. const struct net_device *dev,
  233. __u32 *hash_rnd),
  234. const void *pkey,
  235. struct net_device *dev)
  236. {
  237. struct neigh_hash_table *nht = rcu_dereference_bh(tbl->nht);
  238. struct neighbour *n;
  239. u32 hash_val;
  240. hash_val = hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
  241. for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
  242. n != NULL;
  243. n = rcu_dereference_bh(n->next)) {
  244. if (n->dev == dev && key_eq(n, pkey))
  245. return n;
  246. }
  247. return NULL;
  248. }
  249. static inline struct neighbour *__neigh_lookup_noref(struct neigh_table *tbl,
  250. const void *pkey,
  251. struct net_device *dev)
  252. {
  253. return ___neigh_lookup_noref(tbl, tbl->key_eq, tbl->hash, pkey, dev);
  254. }
  255. void neigh_table_init(int index, struct neigh_table *tbl);
  256. int neigh_table_clear(int index, struct neigh_table *tbl);
  257. struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
  258. struct net_device *dev);
  259. struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, struct net *net,
  260. const void *pkey);
  261. struct neighbour *__neigh_create(struct neigh_table *tbl, const void *pkey,
  262. struct net_device *dev, bool want_ref);
  263. static inline struct neighbour *neigh_create(struct neigh_table *tbl,
  264. const void *pkey,
  265. struct net_device *dev)
  266. {
  267. return __neigh_create(tbl, pkey, dev, true);
  268. }
  269. void neigh_destroy(struct neighbour *neigh);
  270. int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb);
  271. int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new, u32 flags);
  272. void __neigh_set_probe_once(struct neighbour *neigh);
  273. void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev);
  274. int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
  275. int neigh_resolve_output(struct neighbour *neigh, struct sk_buff *skb);
  276. int neigh_connected_output(struct neighbour *neigh, struct sk_buff *skb);
  277. int neigh_direct_output(struct neighbour *neigh, struct sk_buff *skb);
  278. struct neighbour *neigh_event_ns(struct neigh_table *tbl,
  279. u8 *lladdr, void *saddr,
  280. struct net_device *dev);
  281. struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
  282. struct neigh_table *tbl);
  283. void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms);
  284. static inline
  285. struct net *neigh_parms_net(const struct neigh_parms *parms)
  286. {
  287. return read_pnet(&parms->net);
  288. }
  289. unsigned long neigh_rand_reach_time(unsigned long base);
  290. void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
  291. struct sk_buff *skb);
  292. struct pneigh_entry *pneigh_lookup(struct neigh_table *tbl, struct net *net,
  293. const void *key, struct net_device *dev,
  294. int creat);
  295. struct pneigh_entry *__pneigh_lookup(struct neigh_table *tbl, struct net *net,
  296. const void *key, struct net_device *dev);
  297. int pneigh_delete(struct neigh_table *tbl, struct net *net, const void *key,
  298. struct net_device *dev);
  299. static inline struct net *pneigh_net(const struct pneigh_entry *pneigh)
  300. {
  301. return read_pnet(&pneigh->net);
  302. }
  303. void neigh_app_ns(struct neighbour *n);
  304. void neigh_for_each(struct neigh_table *tbl,
  305. void (*cb)(struct neighbour *, void *), void *cookie);
  306. void __neigh_for_each_release(struct neigh_table *tbl,
  307. int (*cb)(struct neighbour *));
  308. int neigh_xmit(int fam, struct net_device *, const void *, struct sk_buff *);
  309. void pneigh_for_each(struct neigh_table *tbl,
  310. void (*cb)(struct pneigh_entry *));
  311. struct neigh_seq_state {
  312. struct seq_net_private p;
  313. struct neigh_table *tbl;
  314. struct neigh_hash_table *nht;
  315. void *(*neigh_sub_iter)(struct neigh_seq_state *state,
  316. struct neighbour *n, loff_t *pos);
  317. unsigned int bucket;
  318. unsigned int flags;
  319. #define NEIGH_SEQ_NEIGH_ONLY 0x00000001
  320. #define NEIGH_SEQ_IS_PNEIGH 0x00000002
  321. #define NEIGH_SEQ_SKIP_NOARP 0x00000004
  322. };
  323. void *neigh_seq_start(struct seq_file *, loff_t *, struct neigh_table *,
  324. unsigned int);
  325. void *neigh_seq_next(struct seq_file *, void *, loff_t *);
  326. void neigh_seq_stop(struct seq_file *, void *);
  327. int neigh_proc_dointvec(struct ctl_table *ctl, int write,
  328. void __user *buffer, size_t *lenp, loff_t *ppos);
  329. int neigh_proc_dointvec_jiffies(struct ctl_table *ctl, int write,
  330. void __user *buffer,
  331. size_t *lenp, loff_t *ppos);
  332. int neigh_proc_dointvec_ms_jiffies(struct ctl_table *ctl, int write,
  333. void __user *buffer,
  334. size_t *lenp, loff_t *ppos);
  335. int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
  336. proc_handler *proc_handler);
  337. void neigh_sysctl_unregister(struct neigh_parms *p);
  338. static inline void __neigh_parms_put(struct neigh_parms *parms)
  339. {
  340. atomic_dec(&parms->refcnt);
  341. }
  342. static inline struct neigh_parms *neigh_parms_clone(struct neigh_parms *parms)
  343. {
  344. atomic_inc(&parms->refcnt);
  345. return parms;
  346. }
  347. /*
  348. * Neighbour references
  349. */
  350. static inline void neigh_release(struct neighbour *neigh)
  351. {
  352. if (atomic_dec_and_test(&neigh->refcnt))
  353. neigh_destroy(neigh);
  354. }
  355. static inline struct neighbour * neigh_clone(struct neighbour *neigh)
  356. {
  357. if (neigh)
  358. atomic_inc(&neigh->refcnt);
  359. return neigh;
  360. }
  361. #define neigh_hold(n) atomic_inc(&(n)->refcnt)
  362. static inline int neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
  363. {
  364. unsigned long now = jiffies;
  365. if (neigh->used != now)
  366. neigh->used = now;
  367. if (!(neigh->nud_state&(NUD_CONNECTED|NUD_DELAY|NUD_PROBE)))
  368. return __neigh_event_send(neigh, skb);
  369. return 0;
  370. }
  371. #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER)
  372. static inline int neigh_hh_bridge(struct hh_cache *hh, struct sk_buff *skb)
  373. {
  374. unsigned int seq, hh_alen;
  375. do {
  376. seq = read_seqbegin(&hh->hh_lock);
  377. hh_alen = HH_DATA_ALIGN(ETH_HLEN);
  378. memcpy(skb->data - hh_alen, hh->hh_data, ETH_ALEN + hh_alen - ETH_HLEN);
  379. } while (read_seqretry(&hh->hh_lock, seq));
  380. return 0;
  381. }
  382. #endif
  383. static inline int neigh_hh_output(const struct hh_cache *hh, struct sk_buff *skb)
  384. {
  385. unsigned int hh_alen = 0;
  386. unsigned int seq;
  387. int hh_len;
  388. do {
  389. seq = read_seqbegin(&hh->hh_lock);
  390. hh_len = hh->hh_len;
  391. if (likely(hh_len <= HH_DATA_MOD)) {
  392. hh_alen = HH_DATA_MOD;
  393. /* skb_push() would proceed silently if we have room for
  394. * the unaligned size but not for the aligned size:
  395. * check headroom explicitly.
  396. */
  397. if (likely(skb_headroom(skb) >= HH_DATA_MOD)) {
  398. /* this is inlined by gcc */
  399. memcpy(skb->data - HH_DATA_MOD, hh->hh_data,
  400. HH_DATA_MOD);
  401. }
  402. } else {
  403. hh_alen = HH_DATA_ALIGN(hh_len);
  404. if (likely(skb_headroom(skb) >= hh_alen)) {
  405. memcpy(skb->data - hh_alen, hh->hh_data,
  406. hh_alen);
  407. }
  408. }
  409. } while (read_seqretry(&hh->hh_lock, seq));
  410. if (WARN_ON_ONCE(skb_headroom(skb) < hh_alen)) {
  411. kfree_skb(skb);
  412. return NET_XMIT_DROP;
  413. }
  414. __skb_push(skb, hh_len);
  415. return dev_queue_xmit(skb);
  416. }
  417. static inline struct neighbour *
  418. __neigh_lookup(struct neigh_table *tbl, const void *pkey, struct net_device *dev, int creat)
  419. {
  420. struct neighbour *n = neigh_lookup(tbl, pkey, dev);
  421. if (n || !creat)
  422. return n;
  423. n = neigh_create(tbl, pkey, dev);
  424. return IS_ERR(n) ? NULL : n;
  425. }
  426. static inline struct neighbour *
  427. __neigh_lookup_errno(struct neigh_table *tbl, const void *pkey,
  428. struct net_device *dev)
  429. {
  430. struct neighbour *n = neigh_lookup(tbl, pkey, dev);
  431. if (n)
  432. return n;
  433. return neigh_create(tbl, pkey, dev);
  434. }
  435. struct neighbour_cb {
  436. unsigned long sched_next;
  437. unsigned int flags;
  438. };
  439. #define LOCALLY_ENQUEUED 0x1
  440. #define NEIGH_CB(skb) ((struct neighbour_cb *)(skb)->cb)
  441. static inline void neigh_ha_snapshot(char *dst, const struct neighbour *n,
  442. const struct net_device *dev)
  443. {
  444. unsigned int seq;
  445. do {
  446. seq = read_seqbegin(&n->ha_lock);
  447. memcpy(dst, n->ha, dev->addr_len);
  448. } while (read_seqretry(&n->ha_lock, seq));
  449. }
  450. #endif