xfrm_state.c 55 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
722782279228022812282228322842285228622872288228922902291229222932294
  1. /*
  2. * xfrm_state.c
  3. *
  4. * Changes:
  5. * Mitsuru KANDA @USAGI
  6. * Kazunori MIYAZAWA @USAGI
  7. * Kunihiro Ishiguro <kunihiro@ipinfusion.com>
  8. * IPv6 support
  9. * YOSHIFUJI Hideaki @USAGI
  10. * Split up af-specific functions
  11. * Derek Atkins <derek@ihtfp.com>
  12. * Add UDP Encapsulation
  13. *
  14. */
  15. #include <linux/workqueue.h>
  16. #include <net/xfrm.h>
  17. #include <linux/pfkeyv2.h>
  18. #include <linux/ipsec.h>
  19. #include <linux/module.h>
  20. #include <linux/cache.h>
  21. #include <linux/audit.h>
  22. #include <asm/uaccess.h>
  23. #include <linux/ktime.h>
  24. #include <linux/slab.h>
  25. #include <linux/interrupt.h>
  26. #include <linux/kernel.h>
  27. #include "xfrm_hash.h"
  /* Each xfrm_state may be linked to three hash tables:
     1. Hash table by (daddr,spi,proto,family) to find SA by SPI. (input,ctl)
     2. Hash table by (daddr,saddr,reqid,family) to find what SAs exist for
        given destination/tunnel endpoint. (output)
     3. Hash table by (daddr,saddr,family) to find SA by its address pair.
   */
  33. static DEFINE_SPINLOCK(xfrm_state_lock);
  34. static unsigned int xfrm_state_hashmax __read_mostly = 1 * 1024 * 1024;
  35. static struct xfrm_state_afinfo *xfrm_state_get_afinfo(unsigned int family);
  36. static void xfrm_state_put_afinfo(struct xfrm_state_afinfo *afinfo);
  37. #ifdef CONFIG_AUDITSYSCALL
  38. static void xfrm_audit_state_replay(struct xfrm_state *x,
  39. struct sk_buff *skb, __be32 net_seq);
  40. #else
  41. #define xfrm_audit_state_replay(x, s, sq) do { ; } while (0)
  42. #endif /* CONFIG_AUDITSYSCALL */
  43. static inline unsigned int xfrm_dst_hash(struct net *net,
  44. xfrm_address_t *daddr,
  45. xfrm_address_t *saddr,
  46. u32 reqid,
  47. unsigned short family)
  48. {
  49. return __xfrm_dst_hash(daddr, saddr, reqid, family, net->xfrm.state_hmask);
  50. }
  51. static inline unsigned int xfrm_src_hash(struct net *net,
  52. xfrm_address_t *daddr,
  53. xfrm_address_t *saddr,
  54. unsigned short family)
  55. {
  56. return __xfrm_src_hash(daddr, saddr, family, net->xfrm.state_hmask);
  57. }
  58. static inline unsigned int
  59. xfrm_spi_hash(struct net *net, xfrm_address_t *daddr, __be32 spi, u8 proto, unsigned short family)
  60. {
  61. return __xfrm_spi_hash(daddr, spi, proto, family, net->xfrm.state_hmask);
  62. }
  63. static void xfrm_hash_transfer(struct hlist_head *list,
  64. struct hlist_head *ndsttable,
  65. struct hlist_head *nsrctable,
  66. struct hlist_head *nspitable,
  67. unsigned int nhashmask)
  68. {
  69. struct hlist_node *entry, *tmp;
  70. struct xfrm_state *x;
  71. hlist_for_each_entry_safe(x, entry, tmp, list, bydst) {
  72. unsigned int h;
  73. h = __xfrm_dst_hash(&x->id.daddr, &x->props.saddr,
  74. x->props.reqid, x->props.family,
  75. nhashmask);
  76. hlist_add_head(&x->bydst, ndsttable+h);
  77. h = __xfrm_src_hash(&x->id.daddr, &x->props.saddr,
  78. x->props.family,
  79. nhashmask);
  80. hlist_add_head(&x->bysrc, nsrctable+h);
  81. if (x->id.spi) {
  82. h = __xfrm_spi_hash(&x->id.daddr, x->id.spi,
  83. x->id.proto, x->props.family,
  84. nhashmask);
  85. hlist_add_head(&x->byspi, nspitable+h);
  86. }
  87. }
  88. }
  89. static unsigned long xfrm_hash_new_size(unsigned int state_hmask)
  90. {
  91. return ((state_hmask + 1) << 1) * sizeof(struct hlist_head);
  92. }
  93. static DEFINE_MUTEX(hash_resize_mutex);
  94. static void xfrm_hash_resize(struct work_struct *work)
  95. {
  96. struct net *net = container_of(work, struct net, xfrm.state_hash_work);
  97. struct hlist_head *ndst, *nsrc, *nspi, *odst, *osrc, *ospi;
  98. unsigned long nsize, osize;
  99. unsigned int nhashmask, ohashmask;
  100. int i;
  101. mutex_lock(&hash_resize_mutex);
  102. nsize = xfrm_hash_new_size(net->xfrm.state_hmask);
  103. ndst = xfrm_hash_alloc(nsize);
  104. if (!ndst)
  105. goto out_unlock;
  106. nsrc = xfrm_hash_alloc(nsize);
  107. if (!nsrc) {
  108. xfrm_hash_free(ndst, nsize);
  109. goto out_unlock;
  110. }
  111. nspi = xfrm_hash_alloc(nsize);
  112. if (!nspi) {
  113. xfrm_hash_free(ndst, nsize);
  114. xfrm_hash_free(nsrc, nsize);
  115. goto out_unlock;
  116. }
  117. spin_lock_bh(&xfrm_state_lock);
  118. nhashmask = (nsize / sizeof(struct hlist_head)) - 1U;
  119. for (i = net->xfrm.state_hmask; i >= 0; i--)
  120. xfrm_hash_transfer(net->xfrm.state_bydst+i, ndst, nsrc, nspi,
  121. nhashmask);
  122. odst = net->xfrm.state_bydst;
  123. osrc = net->xfrm.state_bysrc;
  124. ospi = net->xfrm.state_byspi;
  125. ohashmask = net->xfrm.state_hmask;
  126. net->xfrm.state_bydst = ndst;
  127. net->xfrm.state_bysrc = nsrc;
  128. net->xfrm.state_byspi = nspi;
  129. net->xfrm.state_hmask = nhashmask;
  130. spin_unlock_bh(&xfrm_state_lock);
  131. osize = (ohashmask + 1) * sizeof(struct hlist_head);
  132. xfrm_hash_free(odst, osize);
  133. xfrm_hash_free(osrc, osize);
  134. xfrm_hash_free(ospi, osize);
  135. out_unlock:
  136. mutex_unlock(&hash_resize_mutex);
  137. }
  138. static DEFINE_RWLOCK(xfrm_state_afinfo_lock);
  139. static struct xfrm_state_afinfo *xfrm_state_afinfo[NPROTO];
  140. static DEFINE_SPINLOCK(xfrm_state_gc_lock);
  141. int __xfrm_state_delete(struct xfrm_state *x);
  142. int km_query(struct xfrm_state *x, struct xfrm_tmpl *t, struct xfrm_policy *pol);
  143. void km_state_expired(struct xfrm_state *x, int hard, u32 pid);
  144. static struct xfrm_state_afinfo *xfrm_state_lock_afinfo(unsigned int family)
  145. {
  146. struct xfrm_state_afinfo *afinfo;
  147. if (unlikely(family >= NPROTO))
  148. return NULL;
  149. write_lock_bh(&xfrm_state_afinfo_lock);
  150. afinfo = xfrm_state_afinfo[family];
  151. if (unlikely(!afinfo))
  152. write_unlock_bh(&xfrm_state_afinfo_lock);
  153. return afinfo;
  154. }
  155. static void xfrm_state_unlock_afinfo(struct xfrm_state_afinfo *afinfo)
  156. __releases(xfrm_state_afinfo_lock)
  157. {
  158. write_unlock_bh(&xfrm_state_afinfo_lock);
  159. }
  160. int xfrm_register_type(const struct xfrm_type *type, unsigned short family)
  161. {
  162. struct xfrm_state_afinfo *afinfo = xfrm_state_lock_afinfo(family);
  163. const struct xfrm_type **typemap;
  164. int err = 0;
  165. if (unlikely(afinfo == NULL))
  166. return -EAFNOSUPPORT;
  167. typemap = afinfo->type_map;
  168. if (likely(typemap[type->proto] == NULL))
  169. typemap[type->proto] = type;
  170. else
  171. err = -EEXIST;
  172. xfrm_state_unlock_afinfo(afinfo);
  173. return err;
  174. }
  175. EXPORT_SYMBOL(xfrm_register_type);
  176. int xfrm_unregister_type(const struct xfrm_type *type, unsigned short family)
  177. {
  178. struct xfrm_state_afinfo *afinfo = xfrm_state_lock_afinfo(family);
  179. const struct xfrm_type **typemap;
  180. int err = 0;
  181. if (unlikely(afinfo == NULL))
  182. return -EAFNOSUPPORT;
  183. typemap = afinfo->type_map;
  184. if (unlikely(typemap[type->proto] != type))
  185. err = -ENOENT;
  186. else
  187. typemap[type->proto] = NULL;
  188. xfrm_state_unlock_afinfo(afinfo);
  189. return err;
  190. }
  191. EXPORT_SYMBOL(xfrm_unregister_type);
  192. static const struct xfrm_type *xfrm_get_type(u8 proto, unsigned short family)
  193. {
  194. struct xfrm_state_afinfo *afinfo;
  195. const struct xfrm_type **typemap;
  196. const struct xfrm_type *type;
  197. int modload_attempted = 0;
  198. retry:
  199. afinfo = xfrm_state_get_afinfo(family);
  200. if (unlikely(afinfo == NULL))
  201. return NULL;
  202. typemap = afinfo->type_map;
  203. type = typemap[proto];
  204. if (unlikely(type && !try_module_get(type->owner)))
  205. type = NULL;
  206. if (!type && !modload_attempted) {
  207. xfrm_state_put_afinfo(afinfo);
  208. request_module("xfrm-type-%d-%d", family, proto);
  209. modload_attempted = 1;
  210. goto retry;
  211. }
  212. xfrm_state_put_afinfo(afinfo);
  213. return type;
  214. }
  215. static void xfrm_put_type(const struct xfrm_type *type)
  216. {
  217. module_put(type->owner);
  218. }
  219. int xfrm_register_mode(struct xfrm_mode *mode, int family)
  220. {
  221. struct xfrm_state_afinfo *afinfo;
  222. struct xfrm_mode **modemap;
  223. int err;
  224. if (unlikely(mode->encap >= XFRM_MODE_MAX))
  225. return -EINVAL;
  226. afinfo = xfrm_state_lock_afinfo(family);
  227. if (unlikely(afinfo == NULL))
  228. return -EAFNOSUPPORT;
  229. err = -EEXIST;
  230. modemap = afinfo->mode_map;
  231. if (modemap[mode->encap])
  232. goto out;
  233. err = -ENOENT;
  234. if (!try_module_get(afinfo->owner))
  235. goto out;
  236. mode->afinfo = afinfo;
  237. modemap[mode->encap] = mode;
  238. err = 0;
  239. out:
  240. xfrm_state_unlock_afinfo(afinfo);
  241. return err;
  242. }
  243. EXPORT_SYMBOL(xfrm_register_mode);
  244. int xfrm_unregister_mode(struct xfrm_mode *mode, int family)
  245. {
  246. struct xfrm_state_afinfo *afinfo;
  247. struct xfrm_mode **modemap;
  248. int err;
  249. if (unlikely(mode->encap >= XFRM_MODE_MAX))
  250. return -EINVAL;
  251. afinfo = xfrm_state_lock_afinfo(family);
  252. if (unlikely(afinfo == NULL))
  253. return -EAFNOSUPPORT;
  254. err = -ENOENT;
  255. modemap = afinfo->mode_map;
  256. if (likely(modemap[mode->encap] == mode)) {
  257. modemap[mode->encap] = NULL;
  258. module_put(mode->afinfo->owner);
  259. err = 0;
  260. }
  261. xfrm_state_unlock_afinfo(afinfo);
  262. return err;
  263. }
  264. EXPORT_SYMBOL(xfrm_unregister_mode);
  265. static struct xfrm_mode *xfrm_get_mode(unsigned int encap, int family)
  266. {
  267. struct xfrm_state_afinfo *afinfo;
  268. struct xfrm_mode *mode;
  269. int modload_attempted = 0;
  270. if (unlikely(encap >= XFRM_MODE_MAX))
  271. return NULL;
  272. retry:
  273. afinfo = xfrm_state_get_afinfo(family);
  274. if (unlikely(afinfo == NULL))
  275. return NULL;
  276. mode = afinfo->mode_map[encap];
  277. if (unlikely(mode && !try_module_get(mode->owner)))
  278. mode = NULL;
  279. if (!mode && !modload_attempted) {
  280. xfrm_state_put_afinfo(afinfo);
  281. request_module("xfrm-mode-%d-%d", family, encap);
  282. modload_attempted = 1;
  283. goto retry;
  284. }
  285. xfrm_state_put_afinfo(afinfo);
  286. return mode;
  287. }
  288. static void xfrm_put_mode(struct xfrm_mode *mode)
  289. {
  290. module_put(mode->owner);
  291. }
  292. static void xfrm_state_gc_destroy(struct xfrm_state *x)
  293. {
  294. tasklet_hrtimer_cancel(&x->mtimer);
  295. del_timer_sync(&x->rtimer);
  296. kfree(x->aalg);
  297. kfree(x->ealg);
  298. kfree(x->calg);
  299. kfree(x->encap);
  300. kfree(x->coaddr);
  301. if (x->inner_mode)
  302. xfrm_put_mode(x->inner_mode);
  303. if (x->inner_mode_iaf)
  304. xfrm_put_mode(x->inner_mode_iaf);
  305. if (x->outer_mode)
  306. xfrm_put_mode(x->outer_mode);
  307. if (x->type) {
  308. x->type->destructor(x);
  309. xfrm_put_type(x->type);
  310. }
  311. security_xfrm_state_free(x);
  312. kfree(x);
  313. }
  314. static void xfrm_state_gc_task(struct work_struct *work)
  315. {
  316. struct net *net = container_of(work, struct net, xfrm.state_gc_work);
  317. struct xfrm_state *x;
  318. struct hlist_node *entry, *tmp;
  319. struct hlist_head gc_list;
  320. spin_lock_bh(&xfrm_state_gc_lock);
  321. hlist_move_list(&net->xfrm.state_gc_list, &gc_list);
  322. spin_unlock_bh(&xfrm_state_gc_lock);
  323. hlist_for_each_entry_safe(x, entry, tmp, &gc_list, gclist)
  324. xfrm_state_gc_destroy(x);
  325. wake_up(&net->xfrm.km_waitq);
  326. }
  327. static inline unsigned long make_jiffies(long secs)
  328. {
  329. if (secs >= (MAX_SCHEDULE_TIMEOUT-1)/HZ)
  330. return MAX_SCHEDULE_TIMEOUT-1;
  331. else
  332. return secs*HZ;
  333. }
  334. static enum hrtimer_restart xfrm_timer_handler(struct hrtimer * me)
  335. {
  336. struct tasklet_hrtimer *thr = container_of(me, struct tasklet_hrtimer, timer);
  337. struct xfrm_state *x = container_of(thr, struct xfrm_state, mtimer);
  338. struct net *net = xs_net(x);
  339. unsigned long now = get_seconds();
  340. long next = LONG_MAX;
  341. int warn = 0;
  342. int err = 0;
  343. spin_lock(&x->lock);
  344. if (x->km.state == XFRM_STATE_DEAD)
  345. goto out;
  346. if (x->km.state == XFRM_STATE_EXPIRED)
  347. goto expired;
  348. if (x->lft.hard_add_expires_seconds) {
  349. long tmo = x->lft.hard_add_expires_seconds +
  350. x->curlft.add_time - now;
  351. if (tmo <= 0)
  352. goto expired;
  353. if (tmo < next)
  354. next = tmo;
  355. }
  356. if (x->lft.hard_use_expires_seconds) {
  357. long tmo = x->lft.hard_use_expires_seconds +
  358. (x->curlft.use_time ? : now) - now;
  359. if (tmo <= 0)
  360. goto expired;
  361. if (tmo < next)
  362. next = tmo;
  363. }
  364. if (x->km.dying)
  365. goto resched;
  366. if (x->lft.soft_add_expires_seconds) {
  367. long tmo = x->lft.soft_add_expires_seconds +
  368. x->curlft.add_time - now;
  369. if (tmo <= 0)
  370. warn = 1;
  371. else if (tmo < next)
  372. next = tmo;
  373. }
  374. if (x->lft.soft_use_expires_seconds) {
  375. long tmo = x->lft.soft_use_expires_seconds +
  376. (x->curlft.use_time ? : now) - now;
  377. if (tmo <= 0)
  378. warn = 1;
  379. else if (tmo < next)
  380. next = tmo;
  381. }
  382. x->km.dying = warn;
  383. if (warn)
  384. km_state_expired(x, 0, 0);
  385. resched:
  386. if (next != LONG_MAX){
  387. tasklet_hrtimer_start(&x->mtimer, ktime_set(next, 0), HRTIMER_MODE_REL);
  388. }
  389. goto out;
  390. expired:
  391. if (x->km.state == XFRM_STATE_ACQ && x->id.spi == 0) {
  392. x->km.state = XFRM_STATE_EXPIRED;
  393. wake_up(&net->xfrm.km_waitq);
  394. next = 2;
  395. goto resched;
  396. }
  397. err = __xfrm_state_delete(x);
  398. if (!err && x->id.spi)
  399. km_state_expired(x, 1, 0);
  400. xfrm_audit_state_delete(x, err ? 0 : 1,
  401. audit_get_loginuid(current),
  402. audit_get_sessionid(current), 0);
  403. out:
  404. spin_unlock(&x->lock);
  405. return HRTIMER_NORESTART;
  406. }
  407. static void xfrm_replay_timer_handler(unsigned long data);
  408. struct xfrm_state *xfrm_state_alloc(struct net *net)
  409. {
  410. struct xfrm_state *x;
  411. x = kzalloc(sizeof(struct xfrm_state), GFP_ATOMIC);
  412. if (x) {
  413. write_pnet(&x->xs_net, net);
  414. atomic_set(&x->refcnt, 1);
  415. atomic_set(&x->tunnel_users, 0);
  416. INIT_LIST_HEAD(&x->km.all);
  417. INIT_HLIST_NODE(&x->bydst);
  418. INIT_HLIST_NODE(&x->bysrc);
  419. INIT_HLIST_NODE(&x->byspi);
  420. tasklet_hrtimer_init(&x->mtimer, xfrm_timer_handler, CLOCK_REALTIME, HRTIMER_MODE_ABS);
  421. setup_timer(&x->rtimer, xfrm_replay_timer_handler,
  422. (unsigned long)x);
  423. x->curlft.add_time = get_seconds();
  424. x->lft.soft_byte_limit = XFRM_INF;
  425. x->lft.soft_packet_limit = XFRM_INF;
  426. x->lft.hard_byte_limit = XFRM_INF;
  427. x->lft.hard_packet_limit = XFRM_INF;
  428. x->replay_maxage = 0;
  429. x->replay_maxdiff = 0;
  430. x->inner_mode = NULL;
  431. x->inner_mode_iaf = NULL;
  432. spin_lock_init(&x->lock);
  433. }
  434. return x;
  435. }
  436. EXPORT_SYMBOL(xfrm_state_alloc);
  437. void __xfrm_state_destroy(struct xfrm_state *x)
  438. {
  439. struct net *net = xs_net(x);
  440. WARN_ON(x->km.state != XFRM_STATE_DEAD);
  441. spin_lock_bh(&xfrm_state_gc_lock);
  442. hlist_add_head(&x->gclist, &net->xfrm.state_gc_list);
  443. spin_unlock_bh(&xfrm_state_gc_lock);
  444. schedule_work(&net->xfrm.state_gc_work);
  445. }
  446. EXPORT_SYMBOL(__xfrm_state_destroy);
  447. int __xfrm_state_delete(struct xfrm_state *x)
  448. {
  449. struct net *net = xs_net(x);
  450. int err = -ESRCH;
  451. if (x->km.state != XFRM_STATE_DEAD) {
  452. x->km.state = XFRM_STATE_DEAD;
  453. spin_lock(&xfrm_state_lock);
  454. list_del(&x->km.all);
  455. hlist_del(&x->bydst);
  456. hlist_del(&x->bysrc);
  457. if (x->id.spi)
  458. hlist_del(&x->byspi);
  459. net->xfrm.state_num--;
  460. spin_unlock(&xfrm_state_lock);
  461. /* All xfrm_state objects are created by xfrm_state_alloc.
  462. * The xfrm_state_alloc call gives a reference, and that
  463. * is what we are dropping here.
  464. */
  465. xfrm_state_put(x);
  466. err = 0;
  467. }
  468. return err;
  469. }
  470. EXPORT_SYMBOL(__xfrm_state_delete);
  471. int xfrm_state_delete(struct xfrm_state *x)
  472. {
  473. int err;
  474. spin_lock_bh(&x->lock);
  475. err = __xfrm_state_delete(x);
  476. spin_unlock_bh(&x->lock);
  477. return err;
  478. }
  479. EXPORT_SYMBOL(xfrm_state_delete);
  480. #ifdef CONFIG_SECURITY_NETWORK_XFRM
  481. static inline int
  482. xfrm_state_flush_secctx_check(struct net *net, u8 proto, struct xfrm_audit *audit_info)
  483. {
  484. int i, err = 0;
  485. for (i = 0; i <= net->xfrm.state_hmask; i++) {
  486. struct hlist_node *entry;
  487. struct xfrm_state *x;
  488. hlist_for_each_entry(x, entry, net->xfrm.state_bydst+i, bydst) {
  489. if (xfrm_id_proto_match(x->id.proto, proto) &&
  490. (err = security_xfrm_state_delete(x)) != 0) {
  491. xfrm_audit_state_delete(x, 0,
  492. audit_info->loginuid,
  493. audit_info->sessionid,
  494. audit_info->secid);
  495. return err;
  496. }
  497. }
  498. }
  499. return err;
  500. }
  501. #else
  502. static inline int
  503. xfrm_state_flush_secctx_check(struct net *net, u8 proto, struct xfrm_audit *audit_info)
  504. {
  505. return 0;
  506. }
  507. #endif
  508. int xfrm_state_flush(struct net *net, u8 proto, struct xfrm_audit *audit_info)
  509. {
  510. int i, err = 0, cnt = 0;
  511. spin_lock_bh(&xfrm_state_lock);
  512. err = xfrm_state_flush_secctx_check(net, proto, audit_info);
  513. if (err)
  514. goto out;
  515. err = -ESRCH;
  516. for (i = 0; i <= net->xfrm.state_hmask; i++) {
  517. struct hlist_node *entry;
  518. struct xfrm_state *x;
  519. restart:
  520. hlist_for_each_entry(x, entry, net->xfrm.state_bydst+i, bydst) {
  521. if (!xfrm_state_kern(x) &&
  522. xfrm_id_proto_match(x->id.proto, proto)) {
  523. xfrm_state_hold(x);
  524. spin_unlock_bh(&xfrm_state_lock);
  525. err = xfrm_state_delete(x);
  526. xfrm_audit_state_delete(x, err ? 0 : 1,
  527. audit_info->loginuid,
  528. audit_info->sessionid,
  529. audit_info->secid);
  530. xfrm_state_put(x);
  531. if (!err)
  532. cnt++;
  533. spin_lock_bh(&xfrm_state_lock);
  534. goto restart;
  535. }
  536. }
  537. }
  538. if (cnt)
  539. err = 0;
  540. out:
  541. spin_unlock_bh(&xfrm_state_lock);
  542. wake_up(&net->xfrm.km_waitq);
  543. return err;
  544. }
  545. EXPORT_SYMBOL(xfrm_state_flush);
  546. void xfrm_sad_getinfo(struct net *net, struct xfrmk_sadinfo *si)
  547. {
  548. spin_lock_bh(&xfrm_state_lock);
  549. si->sadcnt = net->xfrm.state_num;
  550. si->sadhcnt = net->xfrm.state_hmask;
  551. si->sadhmcnt = xfrm_state_hashmax;
  552. spin_unlock_bh(&xfrm_state_lock);
  553. }
  554. EXPORT_SYMBOL(xfrm_sad_getinfo);
  555. static int
  556. xfrm_init_tempsel(struct xfrm_state *x, struct flowi *fl,
  557. struct xfrm_tmpl *tmpl,
  558. xfrm_address_t *daddr, xfrm_address_t *saddr,
  559. unsigned short family)
  560. {
  561. struct xfrm_state_afinfo *afinfo = xfrm_state_get_afinfo(family);
  562. if (!afinfo)
  563. return -1;
  564. afinfo->init_tempsel(x, fl, tmpl, daddr, saddr);
  565. xfrm_state_put_afinfo(afinfo);
  566. return 0;
  567. }
  568. static struct xfrm_state *__xfrm_state_lookup(struct net *net, u32 mark, xfrm_address_t *daddr, __be32 spi, u8 proto, unsigned short family)
  569. {
  570. unsigned int h = xfrm_spi_hash(net, daddr, spi, proto, family);
  571. struct xfrm_state *x;
  572. struct hlist_node *entry;
  573. hlist_for_each_entry(x, entry, net->xfrm.state_byspi+h, byspi) {
  574. if (x->props.family != family ||
  575. x->id.spi != spi ||
  576. x->id.proto != proto ||
  577. xfrm_addr_cmp(&x->id.daddr, daddr, family))
  578. continue;
  579. if ((mark & x->mark.m) != x->mark.v)
  580. continue;
  581. xfrm_state_hold(x);
  582. return x;
  583. }
  584. return NULL;
  585. }
  586. static struct xfrm_state *__xfrm_state_lookup_byaddr(struct net *net, u32 mark, xfrm_address_t *daddr, xfrm_address_t *saddr, u8 proto, unsigned short family)
  587. {
  588. unsigned int h = xfrm_src_hash(net, daddr, saddr, family);
  589. struct xfrm_state *x;
  590. struct hlist_node *entry;
  591. hlist_for_each_entry(x, entry, net->xfrm.state_bysrc+h, bysrc) {
  592. if (x->props.family != family ||
  593. x->id.proto != proto ||
  594. xfrm_addr_cmp(&x->id.daddr, daddr, family) ||
  595. xfrm_addr_cmp(&x->props.saddr, saddr, family))
  596. continue;
  597. if ((mark & x->mark.m) != x->mark.v)
  598. continue;
  599. xfrm_state_hold(x);
  600. return x;
  601. }
  602. return NULL;
  603. }
  604. static inline struct xfrm_state *
  605. __xfrm_state_locate(struct xfrm_state *x, int use_spi, int family)
  606. {
  607. struct net *net = xs_net(x);
  608. u32 mark = x->mark.v & x->mark.m;
  609. if (use_spi)
  610. return __xfrm_state_lookup(net, mark, &x->id.daddr,
  611. x->id.spi, x->id.proto, family);
  612. else
  613. return __xfrm_state_lookup_byaddr(net, mark,
  614. &x->id.daddr,
  615. &x->props.saddr,
  616. x->id.proto, family);
  617. }
  618. static void xfrm_hash_grow_check(struct net *net, int have_hash_collision)
  619. {
  620. if (have_hash_collision &&
  621. (net->xfrm.state_hmask + 1) < xfrm_state_hashmax &&
  622. net->xfrm.state_num > net->xfrm.state_hmask)
  623. schedule_work(&net->xfrm.state_hash_work);
  624. }
  625. static void xfrm_state_look_at(struct xfrm_policy *pol, struct xfrm_state *x,
  626. struct flowi *fl, unsigned short family,
  627. xfrm_address_t *daddr, xfrm_address_t *saddr,
  628. struct xfrm_state **best, int *acq_in_progress,
  629. int *error)
  630. {
  631. /* Resolution logic:
  632. * 1. There is a valid state with matching selector. Done.
  633. * 2. Valid state with inappropriate selector. Skip.
  634. *
  635. * Entering area of "sysdeps".
  636. *
  637. * 3. If state is not valid, selector is temporary, it selects
  638. * only session which triggered previous resolution. Key
  639. * manager will do something to install a state with proper
  640. * selector.
  641. */
  642. if (x->km.state == XFRM_STATE_VALID) {
  643. if ((x->sel.family &&
  644. !xfrm_selector_match(&x->sel, fl, x->sel.family)) ||
  645. !security_xfrm_state_pol_flow_match(x, pol, fl))
  646. return;
  647. if (!*best ||
  648. (*best)->km.dying > x->km.dying ||
  649. ((*best)->km.dying == x->km.dying &&
  650. (*best)->curlft.add_time < x->curlft.add_time))
  651. *best = x;
  652. } else if (x->km.state == XFRM_STATE_ACQ) {
  653. *acq_in_progress = 1;
  654. } else if (x->km.state == XFRM_STATE_ERROR ||
  655. x->km.state == XFRM_STATE_EXPIRED) {
  656. if (xfrm_selector_match(&x->sel, fl, x->sel.family) &&
  657. security_xfrm_state_pol_flow_match(x, pol, fl))
  658. *error = -ESRCH;
  659. }
  660. }
/*
 * Resolve template @tmpl of policy @pol to a state for flow @fl.
 *
 * The by-destination hash bucket for (@daddr, @saddr, reqid, family) is
 * scanned first; if that yields no usable state, the bucket for the same
 * key with an all-zero source address is scanned as well.  Every entry that
 * matches the template is passed to xfrm_state_look_at(), which records the
 * best candidate, whether an acquire is already in progress, and any error.
 *
 * If nothing was found, no error was recorded and no acquire is pending, a
 * temporary state is allocated and offered to the key managers through
 * km_query().  On success it is linked into the state tables in
 * XFRM_STATE_ACQ with a timer of sysctl_acq_expires seconds.
 *
 * Returns the selected (or newly created acquire) state with a reference
 * taken via xfrm_state_hold(), or NULL with *@err set: -EAGAIN when an
 * acquire is in progress, otherwise the recorded error.  *@err is not
 * written when a state is returned.
 */
struct xfrm_state *
xfrm_state_find(xfrm_address_t *daddr, xfrm_address_t *saddr,
		struct flowi *fl, struct xfrm_tmpl *tmpl,
		struct xfrm_policy *pol, int *err,
		unsigned short family)
{
	static xfrm_address_t saddr_wildcard = { };
	struct net *net = xp_net(pol);
	unsigned int h, h_wildcard;
	struct hlist_node *entry;
	struct xfrm_state *x, *x0, *to_put;
	int acquire_in_progress = 0;
	int error = 0;
	struct xfrm_state *best = NULL;
	u32 mark = pol->mark.v & pol->mark.m;

	/* State whose reference must be dropped once the lock is released. */
	to_put = NULL;

	spin_lock_bh(&xfrm_state_lock);
	/* First pass: bucket keyed on the real source address. */
	h = xfrm_dst_hash(net, daddr, saddr, tmpl->reqid, family);
	hlist_for_each_entry(x, entry, net->xfrm.state_bydst+h, bydst) {
		if (x->props.family == family &&
		    x->props.reqid == tmpl->reqid &&
		    (mark & x->mark.m) == x->mark.v &&
		    !(x->props.flags & XFRM_STATE_WILDRECV) &&
		    xfrm_state_addr_check(x, daddr, saddr, family) &&
		    tmpl->mode == x->props.mode &&
		    tmpl->id.proto == x->id.proto &&
		    (tmpl->id.spi == x->id.spi || !tmpl->id.spi))
			xfrm_state_look_at(pol, x, fl, family, daddr, saddr,
					   &best, &acquire_in_progress, &error);
	}
	if (best)
		goto found;

	/* Second pass: bucket keyed on the zeroed (wildcard) source address. */
	h_wildcard = xfrm_dst_hash(net, daddr, &saddr_wildcard, tmpl->reqid, family);
	hlist_for_each_entry(x, entry, net->xfrm.state_bydst+h_wildcard, bydst) {
		if (x->props.family == family &&
		    x->props.reqid == tmpl->reqid &&
		    (mark & x->mark.m) == x->mark.v &&
		    !(x->props.flags & XFRM_STATE_WILDRECV) &&
		    xfrm_state_addr_check(x, daddr, saddr, family) &&
		    tmpl->mode == x->props.mode &&
		    tmpl->id.proto == x->id.proto &&
		    (tmpl->id.spi == x->id.spi || !tmpl->id.spi))
			xfrm_state_look_at(pol, x, fl, family, daddr, saddr,
					   &best, &acquire_in_progress, &error);
	}

found:
	x = best;
	if (!x && !error && !acquire_in_progress) {
		/*
		 * The template names an SPI and a state with that SPI is
		 * already present: report -EEXIST instead of acquiring.
		 */
		if (tmpl->id.spi &&
		    (x0 = __xfrm_state_lookup(net, mark, daddr, tmpl->id.spi,
					      tmpl->id.proto, family)) != NULL) {
			to_put = x0;
			error = -EEXIST;
			goto out;
		}
		x = xfrm_state_alloc(net);
		if (x == NULL) {
			error = -ENOMEM;
			goto out;
		}
		/* Initialize temporary selector matching only
		 * to current session. */
		xfrm_init_tempsel(x, fl, tmpl, daddr, saddr, family);
		memcpy(&x->mark, &pol->mark, sizeof(x->mark));

		error = security_xfrm_state_alloc_acquire(x, pol->security, fl->secid);
		if (error) {
			/* Never inserted: mark dead and release after unlock. */
			x->km.state = XFRM_STATE_DEAD;
			to_put = x;
			x = NULL;
			goto out;
		}

		if (km_query(x, tmpl, pol) == 0) {
			/* A key manager took the request: publish the larval state. */
			x->km.state = XFRM_STATE_ACQ;
			list_add(&x->km.all, &net->xfrm.state_all);
			hlist_add_head(&x->bydst, net->xfrm.state_bydst+h);
			h = xfrm_src_hash(net, daddr, saddr, family);
			hlist_add_head(&x->bysrc, net->xfrm.state_bysrc+h);
			if (x->id.spi) {
				h = xfrm_spi_hash(net, &x->id.daddr, x->id.spi, x->id.proto, family);
				hlist_add_head(&x->byspi, net->xfrm.state_byspi+h);
			}
			x->lft.hard_add_expires_seconds = net->xfrm.sysctl_acq_expires;
			tasklet_hrtimer_start(&x->mtimer, ktime_set(net->xfrm.sysctl_acq_expires, 0), HRTIMER_MODE_REL);
			net->xfrm.state_num++;
			xfrm_hash_grow_check(net, x->bydst.next != NULL);
		} else {
			/* No key manager accepted the acquire. */
			x->km.state = XFRM_STATE_DEAD;
			to_put = x;
			x = NULL;
			error = -ESRCH;
		}
	}
out:
	if (x)
		xfrm_state_hold(x);
	else
		*err = acquire_in_progress ? -EAGAIN : error;
	spin_unlock_bh(&xfrm_state_lock);
	if (to_put)
		xfrm_state_put(to_put);
	return x;
}
  763. struct xfrm_state *
  764. xfrm_stateonly_find(struct net *net, u32 mark,
  765. xfrm_address_t *daddr, xfrm_address_t *saddr,
  766. unsigned short family, u8 mode, u8 proto, u32 reqid)
  767. {
  768. unsigned int h;
  769. struct xfrm_state *rx = NULL, *x = NULL;
  770. struct hlist_node *entry;
  771. spin_lock(&xfrm_state_lock);
  772. h = xfrm_dst_hash(net, daddr, saddr, reqid, family);
  773. hlist_for_each_entry(x, entry, net->xfrm.state_bydst+h, bydst) {
  774. if (x->props.family == family &&
  775. x->props.reqid == reqid &&
  776. (mark & x->mark.m) == x->mark.v &&
  777. !(x->props.flags & XFRM_STATE_WILDRECV) &&
  778. xfrm_state_addr_check(x, daddr, saddr, family) &&
  779. mode == x->props.mode &&
  780. proto == x->id.proto &&
  781. x->km.state == XFRM_STATE_VALID) {
  782. rx = x;
  783. break;
  784. }
  785. }
  786. if (rx)
  787. xfrm_state_hold(rx);
  788. spin_unlock(&xfrm_state_lock);
  789. return rx;
  790. }
  791. EXPORT_SYMBOL(xfrm_stateonly_find);
  792. static void __xfrm_state_insert(struct xfrm_state *x)
  793. {
  794. struct net *net = xs_net(x);
  795. unsigned int h;
  796. list_add(&x->km.all, &net->xfrm.state_all);
  797. h = xfrm_dst_hash(net, &x->id.daddr, &x->props.saddr,
  798. x->props.reqid, x->props.family);
  799. hlist_add_head(&x->bydst, net->xfrm.state_bydst+h);
  800. h = xfrm_src_hash(net, &x->id.daddr, &x->props.saddr, x->props.family);
  801. hlist_add_head(&x->bysrc, net->xfrm.state_bysrc+h);
  802. if (x->id.spi) {
  803. h = xfrm_spi_hash(net, &x->id.daddr, x->id.spi, x->id.proto,
  804. x->props.family);
  805. hlist_add_head(&x->byspi, net->xfrm.state_byspi+h);
  806. }
  807. tasklet_hrtimer_start(&x->mtimer, ktime_set(1, 0), HRTIMER_MODE_REL);
  808. if (x->replay_maxage)
  809. mod_timer(&x->rtimer, jiffies + x->replay_maxage);
  810. wake_up(&net->xfrm.km_waitq);
  811. net->xfrm.state_num++;
  812. xfrm_hash_grow_check(net, x->bydst.next != NULL);
  813. }
  814. /* xfrm_state_lock is held */
  815. static void __xfrm_state_bump_genids(struct xfrm_state *xnew)
  816. {
  817. struct net *net = xs_net(xnew);
  818. unsigned short family = xnew->props.family;
  819. u32 reqid = xnew->props.reqid;
  820. struct xfrm_state *x;
  821. struct hlist_node *entry;
  822. unsigned int h;
  823. u32 mark = xnew->mark.v & xnew->mark.m;
  824. h = xfrm_dst_hash(net, &xnew->id.daddr, &xnew->props.saddr, reqid, family);
  825. hlist_for_each_entry(x, entry, net->xfrm.state_bydst+h, bydst) {
  826. if (x->props.family == family &&
  827. x->props.reqid == reqid &&
  828. (mark & x->mark.m) == x->mark.v &&
  829. !xfrm_addr_cmp(&x->id.daddr, &xnew->id.daddr, family) &&
  830. !xfrm_addr_cmp(&x->props.saddr, &xnew->props.saddr, family))
  831. x->genid++;
  832. }
  833. }
  834. void xfrm_state_insert(struct xfrm_state *x)
  835. {
  836. spin_lock_bh(&xfrm_state_lock);
  837. __xfrm_state_bump_genids(x);
  838. __xfrm_state_insert(x);
  839. spin_unlock_bh(&xfrm_state_lock);
  840. }
  841. EXPORT_SYMBOL(xfrm_state_insert);
  842. /* xfrm_state_lock is held */
  843. static struct xfrm_state *__find_acq_core(struct net *net, struct xfrm_mark *m, unsigned short family, u8 mode, u32 reqid, u8 proto, xfrm_address_t *daddr, xfrm_address_t *saddr, int create)
  844. {
  845. unsigned int h = xfrm_dst_hash(net, daddr, saddr, reqid, family);
  846. struct hlist_node *entry;
  847. struct xfrm_state *x;
  848. u32 mark = m->v & m->m;
  849. hlist_for_each_entry(x, entry, net->xfrm.state_bydst+h, bydst) {
  850. if (x->props.reqid != reqid ||
  851. x->props.mode != mode ||
  852. x->props.family != family ||
  853. x->km.state != XFRM_STATE_ACQ ||
  854. x->id.spi != 0 ||
  855. x->id.proto != proto ||
  856. (mark & x->mark.m) != x->mark.v ||
  857. xfrm_addr_cmp(&x->id.daddr, daddr, family) ||
  858. xfrm_addr_cmp(&x->props.saddr, saddr, family))
  859. continue;
  860. xfrm_state_hold(x);
  861. return x;
  862. }
  863. if (!create)
  864. return NULL;
  865. x = xfrm_state_alloc(net);
  866. if (likely(x)) {
  867. switch (family) {
  868. case AF_INET:
  869. x->sel.daddr.a4 = daddr->a4;
  870. x->sel.saddr.a4 = saddr->a4;
  871. x->sel.prefixlen_d = 32;
  872. x->sel.prefixlen_s = 32;
  873. x->props.saddr.a4 = saddr->a4;
  874. x->id.daddr.a4 = daddr->a4;
  875. break;
  876. case AF_INET6:
  877. ipv6_addr_copy((struct in6_addr *)x->sel.daddr.a6,
  878. (struct in6_addr *)daddr);
  879. ipv6_addr_copy((struct in6_addr *)x->sel.saddr.a6,
  880. (struct in6_addr *)saddr);
  881. x->sel.prefixlen_d = 128;
  882. x->sel.prefixlen_s = 128;
  883. ipv6_addr_copy((struct in6_addr *)x->props.saddr.a6,
  884. (struct in6_addr *)saddr);
  885. ipv6_addr_copy((struct in6_addr *)x->id.daddr.a6,
  886. (struct in6_addr *)daddr);
  887. break;
  888. }
  889. x->km.state = XFRM_STATE_ACQ;
  890. x->id.proto = proto;
  891. x->props.family = family;
  892. x->props.mode = mode;
  893. x->props.reqid = reqid;
  894. x->mark.v = m->v;
  895. x->mark.m = m->m;
  896. x->lft.hard_add_expires_seconds = net->xfrm.sysctl_acq_expires;
  897. xfrm_state_hold(x);
  898. tasklet_hrtimer_start(&x->mtimer, ktime_set(net->xfrm.sysctl_acq_expires, 0), HRTIMER_MODE_REL);
  899. list_add(&x->km.all, &net->xfrm.state_all);
  900. hlist_add_head(&x->bydst, net->xfrm.state_bydst+h);
  901. h = xfrm_src_hash(net, daddr, saddr, family);
  902. hlist_add_head(&x->bysrc, net->xfrm.state_bysrc+h);
  903. net->xfrm.state_num++;
  904. xfrm_hash_grow_check(net, x->bydst.next != NULL);
  905. }
  906. return x;
  907. }
  908. static struct xfrm_state *__xfrm_find_acq_byseq(struct net *net, u32 mark, u32 seq);
/*
 * Add the new state @x to the state tables.
 *
 * Fails with -EEXIST if __xfrm_state_locate() already finds a state for @x.
 * Otherwise, for protocols matching IPSEC_PROTO_ANY, a pending acquire
 * state is searched for (first by km.seq, then by address/reqid/mode/proto)
 * and, if found, deleted once @x has been inserted.
 *
 * Returns 0 on success or -EEXIST.
 */
int xfrm_state_add(struct xfrm_state *x)
{
	struct net *net = xs_net(x);
	struct xfrm_state *x1, *to_put;
	int family;
	int err;
	u32 mark = x->mark.v & x->mark.m;
	int use_spi = xfrm_id_proto_match(x->id.proto, IPSEC_PROTO_ANY);

	family = x->props.family;

	/* State whose reference is dropped only after the lock is released. */
	to_put = NULL;

	spin_lock_bh(&xfrm_state_lock);

	x1 = __xfrm_state_locate(x, use_spi, family);
	if (x1) {
		to_put = x1;
		x1 = NULL;
		err = -EEXIST;
		goto out;
	}

	if (use_spi && x->km.seq) {
		x1 = __xfrm_find_acq_byseq(net, mark, x->km.seq);
		/*
		 * An acquire with the same sequence number but a different
		 * protocol or destination is not ours: just drop the
		 * reference the lookup took.
		 */
		if (x1 && ((x1->id.proto != x->id.proto) ||
		    xfrm_addr_cmp(&x1->id.daddr, &x->id.daddr, family))) {
			to_put = x1;
			x1 = NULL;
		}
	}

	/* Fall back to an address-based acquire lookup; never create one. */
	if (use_spi && !x1)
		x1 = __find_acq_core(net, &x->mark, family, x->props.mode,
				     x->props.reqid, x->id.proto,
				     &x->id.daddr, &x->props.saddr, 0);

	__xfrm_state_bump_genids(x);
	__xfrm_state_insert(x);
	err = 0;

out:
	spin_unlock_bh(&xfrm_state_lock);

	/* The acquire state that @x replaces is removed outside the lock. */
	if (x1) {
		xfrm_state_delete(x1);
		xfrm_state_put(x1);
	}

	if (to_put)
		xfrm_state_put(to_put);

	return err;
}
EXPORT_SYMBOL(xfrm_state_add);
  953. #ifdef CONFIG_XFRM_MIGRATE
  954. static struct xfrm_state *xfrm_state_clone(struct xfrm_state *orig, int *errp)
  955. {
  956. struct net *net = xs_net(orig);
  957. int err = -ENOMEM;
  958. struct xfrm_state *x = xfrm_state_alloc(net);
  959. if (!x)
  960. goto out;
  961. memcpy(&x->id, &orig->id, sizeof(x->id));
  962. memcpy(&x->sel, &orig->sel, sizeof(x->sel));
  963. memcpy(&x->lft, &orig->lft, sizeof(x->lft));
  964. x->props.mode = orig->props.mode;
  965. x->props.replay_window = orig->props.replay_window;
  966. x->props.reqid = orig->props.reqid;
  967. x->props.family = orig->props.family;
  968. x->props.saddr = orig->props.saddr;
  969. if (orig->aalg) {
  970. x->aalg = xfrm_algo_auth_clone(orig->aalg);
  971. if (!x->aalg)
  972. goto error;
  973. }
  974. x->props.aalgo = orig->props.aalgo;
  975. if (orig->ealg) {
  976. x->ealg = xfrm_algo_clone(orig->ealg);
  977. if (!x->ealg)
  978. goto error;
  979. }
  980. x->props.ealgo = orig->props.ealgo;
  981. if (orig->calg) {
  982. x->calg = xfrm_algo_clone(orig->calg);
  983. if (!x->calg)
  984. goto error;
  985. }
  986. x->props.calgo = orig->props.calgo;
  987. if (orig->encap) {
  988. x->encap = kmemdup(orig->encap, sizeof(*x->encap), GFP_KERNEL);
  989. if (!x->encap)
  990. goto error;
  991. }
  992. if (orig->coaddr) {
  993. x->coaddr = kmemdup(orig->coaddr, sizeof(*x->coaddr),
  994. GFP_KERNEL);
  995. if (!x->coaddr)
  996. goto error;
  997. }
  998. memcpy(&x->mark, &orig->mark, sizeof(x->mark));
  999. err = xfrm_init_state(x);
  1000. if (err)
  1001. goto error;
  1002. x->props.flags = orig->props.flags;
  1003. x->curlft.add_time = orig->curlft.add_time;
  1004. x->km.state = orig->km.state;
  1005. x->km.seq = orig->km.seq;
  1006. return x;
  1007. error:
  1008. xfrm_state_put(x);
  1009. out:
  1010. if (errp)
  1011. *errp = err;
  1012. return NULL;
  1013. }
  1014. /* xfrm_state_lock is held */
  1015. struct xfrm_state * xfrm_migrate_state_find(struct xfrm_migrate *m)
  1016. {
  1017. unsigned int h;
  1018. struct xfrm_state *x;
  1019. struct hlist_node *entry;
  1020. if (m->reqid) {
  1021. h = xfrm_dst_hash(&init_net, &m->old_daddr, &m->old_saddr,
  1022. m->reqid, m->old_family);
  1023. hlist_for_each_entry(x, entry, init_net.xfrm.state_bydst+h, bydst) {
  1024. if (x->props.mode != m->mode ||
  1025. x->id.proto != m->proto)
  1026. continue;
  1027. if (m->reqid && x->props.reqid != m->reqid)
  1028. continue;
  1029. if (xfrm_addr_cmp(&x->id.daddr, &m->old_daddr,
  1030. m->old_family) ||
  1031. xfrm_addr_cmp(&x->props.saddr, &m->old_saddr,
  1032. m->old_family))
  1033. continue;
  1034. xfrm_state_hold(x);
  1035. return x;
  1036. }
  1037. } else {
  1038. h = xfrm_src_hash(&init_net, &m->old_daddr, &m->old_saddr,
  1039. m->old_family);
  1040. hlist_for_each_entry(x, entry, init_net.xfrm.state_bysrc+h, bysrc) {
  1041. if (x->props.mode != m->mode ||
  1042. x->id.proto != m->proto)
  1043. continue;
  1044. if (xfrm_addr_cmp(&x->id.daddr, &m->old_daddr,
  1045. m->old_family) ||
  1046. xfrm_addr_cmp(&x->props.saddr, &m->old_saddr,
  1047. m->old_family))
  1048. continue;
  1049. xfrm_state_hold(x);
  1050. return x;
  1051. }
  1052. }
  1053. return NULL;
  1054. }
  1055. EXPORT_SYMBOL(xfrm_migrate_state_find);
  1056. struct xfrm_state * xfrm_state_migrate(struct xfrm_state *x,
  1057. struct xfrm_migrate *m)
  1058. {
  1059. struct xfrm_state *xc;
  1060. int err;
  1061. xc = xfrm_state_clone(x, &err);
  1062. if (!xc)
  1063. return NULL;
  1064. memcpy(&xc->id.daddr, &m->new_daddr, sizeof(xc->id.daddr));
  1065. memcpy(&xc->props.saddr, &m->new_saddr, sizeof(xc->props.saddr));
  1066. /* add state */
  1067. if (!xfrm_addr_cmp(&x->id.daddr, &m->new_daddr, m->new_family)) {
  1068. /* a care is needed when the destination address of the
  1069. state is to be updated as it is a part of triplet */
  1070. xfrm_state_insert(xc);
  1071. } else {
  1072. if ((err = xfrm_state_add(xc)) < 0)
  1073. goto error;
  1074. }
  1075. return xc;
  1076. error:
  1077. kfree(xc);
  1078. return NULL;
  1079. }
  1080. EXPORT_SYMBOL(xfrm_state_migrate);
  1081. #endif
/*
 * Update the existing state that corresponds to @x.
 *
 * The existing state x1 is found with __xfrm_state_locate().  If x1 is
 * still XFRM_STATE_ACQ, @x is inserted in its place and x1 is deleted.
 * Otherwise, if x1 is XFRM_STATE_VALID, the encapsulation data, care-of
 * address, (for non-SPI protocols) selector and lifetime configuration are
 * copied from @x into x1 and x1's timer is restarted.
 *
 * Returns 0 on success, -ESRCH if no existing state was located, -EEXIST if
 * xfrm_state_kern() is true for it, or -EINVAL if it is neither ACQ nor
 * VALID.
 */
int xfrm_state_update(struct xfrm_state *x)
{
	struct xfrm_state *x1, *to_put;
	int err;
	int use_spi = xfrm_id_proto_match(x->id.proto, IPSEC_PROTO_ANY);

	/* State whose reference is dropped only after the lock is released. */
	to_put = NULL;

	spin_lock_bh(&xfrm_state_lock);
	x1 = __xfrm_state_locate(x, use_spi, x->props.family);

	err = -ESRCH;
	if (!x1)
		goto out;

	if (xfrm_state_kern(x1)) {
		to_put = x1;
		err = -EEXIST;
		goto out;
	}

	if (x1->km.state == XFRM_STATE_ACQ) {
		__xfrm_state_insert(x);
		/* x == NULL tells the code below that @x replaced x1. */
		x = NULL;
	}
	err = 0;

out:
	spin_unlock_bh(&xfrm_state_lock);

	if (to_put)
		xfrm_state_put(to_put);

	if (err)
		return err;

	if (!x) {
		/* The acquire state has been superseded; remove it. */
		xfrm_state_delete(x1);
		xfrm_state_put(x1);
		return 0;
	}

	err = -EINVAL;
	spin_lock_bh(&x1->lock);
	if (likely(x1->km.state == XFRM_STATE_VALID)) {
		/* Optional blobs are only refreshed when both sides have one. */
		if (x->encap && x1->encap)
			memcpy(x1->encap, x->encap, sizeof(*x1->encap));
		if (x->coaddr && x1->coaddr) {
			memcpy(x1->coaddr, x->coaddr, sizeof(*x1->coaddr));
		}
		if (!use_spi && memcmp(&x1->sel, &x->sel, sizeof(x1->sel)))
			memcpy(&x1->sel, &x->sel, sizeof(x1->sel));
		memcpy(&x1->lft, &x->lft, sizeof(x1->lft));
		x1->km.dying = 0;

		tasklet_hrtimer_start(&x1->mtimer, ktime_set(1, 0), HRTIMER_MODE_REL);
		/* Re-evaluate the new limits if the state has already been used. */
		if (x1->curlft.use_time)
			xfrm_state_check_expire(x1);

		err = 0;
	}
	spin_unlock_bh(&x1->lock);

	xfrm_state_put(x1);

	return err;
}
EXPORT_SYMBOL(xfrm_state_update);
  1136. int xfrm_state_check_expire(struct xfrm_state *x)
  1137. {
  1138. if (!x->curlft.use_time)
  1139. x->curlft.use_time = get_seconds();
  1140. if (x->km.state != XFRM_STATE_VALID)
  1141. return -EINVAL;
  1142. if (x->curlft.bytes >= x->lft.hard_byte_limit ||
  1143. x->curlft.packets >= x->lft.hard_packet_limit) {
  1144. x->km.state = XFRM_STATE_EXPIRED;
  1145. tasklet_hrtimer_start(&x->mtimer, ktime_set(0,0), HRTIMER_MODE_REL);
  1146. return -EINVAL;
  1147. }
  1148. if (!x->km.dying &&
  1149. (x->curlft.bytes >= x->lft.soft_byte_limit ||
  1150. x->curlft.packets >= x->lft.soft_packet_limit)) {
  1151. x->km.dying = 1;
  1152. km_state_expired(x, 0, 0);
  1153. }
  1154. return 0;
  1155. }
  1156. EXPORT_SYMBOL(xfrm_state_check_expire);
  1157. struct xfrm_state *
  1158. xfrm_state_lookup(struct net *net, u32 mark, xfrm_address_t *daddr, __be32 spi,
  1159. u8 proto, unsigned short family)
  1160. {
  1161. struct xfrm_state *x;
  1162. spin_lock_bh(&xfrm_state_lock);
  1163. x = __xfrm_state_lookup(net, mark, daddr, spi, proto, family);
  1164. spin_unlock_bh(&xfrm_state_lock);
  1165. return x;
  1166. }
  1167. EXPORT_SYMBOL(xfrm_state_lookup);
  1168. struct xfrm_state *
  1169. xfrm_state_lookup_byaddr(struct net *net, u32 mark,
  1170. xfrm_address_t *daddr, xfrm_address_t *saddr,
  1171. u8 proto, unsigned short family)
  1172. {
  1173. struct xfrm_state *x;
  1174. spin_lock_bh(&xfrm_state_lock);
  1175. x = __xfrm_state_lookup_byaddr(net, mark, daddr, saddr, proto, family);
  1176. spin_unlock_bh(&xfrm_state_lock);
  1177. return x;
  1178. }
  1179. EXPORT_SYMBOL(xfrm_state_lookup_byaddr);
  1180. struct xfrm_state *
  1181. xfrm_find_acq(struct net *net, struct xfrm_mark *mark, u8 mode, u32 reqid, u8 proto,
  1182. xfrm_address_t *daddr, xfrm_address_t *saddr,
  1183. int create, unsigned short family)
  1184. {
  1185. struct xfrm_state *x;
  1186. spin_lock_bh(&xfrm_state_lock);
  1187. x = __find_acq_core(net, mark, family, mode, reqid, proto, daddr, saddr, create);
  1188. spin_unlock_bh(&xfrm_state_lock);
  1189. return x;
  1190. }
  1191. EXPORT_SYMBOL(xfrm_find_acq);
  1192. #ifdef CONFIG_XFRM_SUB_POLICY
  1193. int
  1194. xfrm_tmpl_sort(struct xfrm_tmpl **dst, struct xfrm_tmpl **src, int n,
  1195. unsigned short family)
  1196. {
  1197. int err = 0;
  1198. struct xfrm_state_afinfo *afinfo = xfrm_state_get_afinfo(family);
  1199. if (!afinfo)
  1200. return -EAFNOSUPPORT;
  1201. spin_lock_bh(&xfrm_state_lock);
  1202. if (afinfo->tmpl_sort)
  1203. err = afinfo->tmpl_sort(dst, src, n);
  1204. spin_unlock_bh(&xfrm_state_lock);
  1205. xfrm_state_put_afinfo(afinfo);
  1206. return err;
  1207. }
  1208. EXPORT_SYMBOL(xfrm_tmpl_sort);
  1209. int
  1210. xfrm_state_sort(struct xfrm_state **dst, struct xfrm_state **src, int n,
  1211. unsigned short family)
  1212. {
  1213. int err = 0;
  1214. struct xfrm_state_afinfo *afinfo = xfrm_state_get_afinfo(family);
  1215. if (!afinfo)
  1216. return -EAFNOSUPPORT;
  1217. spin_lock_bh(&xfrm_state_lock);
  1218. if (afinfo->state_sort)
  1219. err = afinfo->state_sort(dst, src, n);
  1220. spin_unlock_bh(&xfrm_state_lock);
  1221. xfrm_state_put_afinfo(afinfo);
  1222. return err;
  1223. }
  1224. EXPORT_SYMBOL(xfrm_state_sort);
  1225. #endif
  1226. /* Silly enough, but I'm lazy to build resolution list */
  1227. static struct xfrm_state *__xfrm_find_acq_byseq(struct net *net, u32 mark, u32 seq)
  1228. {
  1229. int i;
  1230. for (i = 0; i <= net->xfrm.state_hmask; i++) {
  1231. struct hlist_node *entry;
  1232. struct xfrm_state *x;
  1233. hlist_for_each_entry(x, entry, net->xfrm.state_bydst+i, bydst) {
  1234. if (x->km.seq == seq &&
  1235. (mark & x->mark.m) == x->mark.v &&
  1236. x->km.state == XFRM_STATE_ACQ) {
  1237. xfrm_state_hold(x);
  1238. return x;
  1239. }
  1240. }
  1241. }
  1242. return NULL;
  1243. }
  1244. struct xfrm_state *xfrm_find_acq_byseq(struct net *net, u32 mark, u32 seq)
  1245. {
  1246. struct xfrm_state *x;
  1247. spin_lock_bh(&xfrm_state_lock);
  1248. x = __xfrm_find_acq_byseq(net, mark, seq);
  1249. spin_unlock_bh(&xfrm_state_lock);
  1250. return x;
  1251. }
  1252. EXPORT_SYMBOL(xfrm_find_acq_byseq);
  1253. u32 xfrm_get_acqseq(void)
  1254. {
  1255. u32 res;
  1256. static atomic_t acqseq;
  1257. do {
  1258. res = atomic_inc_return(&acqseq);
  1259. } while (!res);
  1260. return res;
  1261. }
  1262. EXPORT_SYMBOL(xfrm_get_acqseq);
/*
 * Assign an SPI in the range [@low, @high] to @x and hash the state by SPI.
 *
 * @low and @high are converted with htonl() before being compared or
 * stored.  When both are equal that single SPI is used if
 * xfrm_state_lookup() finds no state with it; otherwise up to
 * high - low + 1 random candidates from the range are probed.
 *
 * Runs under x->lock; xfrm_state_lock is taken for the hash insertion.
 *
 * Returns 0 if @x already had an SPI or one was assigned, -ENOENT if @x is
 * XFRM_STATE_DEAD or no free SPI was found.
 */
int xfrm_alloc_spi(struct xfrm_state *x, u32 low, u32 high)
{
	struct net *net = xs_net(x);
	unsigned int h;
	struct xfrm_state *x0;
	int err = -ENOENT;
	__be32 minspi = htonl(low);
	__be32 maxspi = htonl(high);
	u32 mark = x->mark.v & x->mark.m;

	spin_lock_bh(&x->lock);
	if (x->km.state == XFRM_STATE_DEAD)
		goto unlock;

	/* An SPI that is already set is reported as success. */
	err = 0;
	if (x->id.spi)
		goto unlock;

	err = -ENOENT;

	if (minspi == maxspi) {
		/* Single-value range: usable only if nobody else has it. */
		x0 = xfrm_state_lookup(net, mark, &x->id.daddr, minspi, x->id.proto, x->props.family);
		if (x0) {
			xfrm_state_put(x0);
			goto unlock;
		}
		x->id.spi = minspi;
	} else {
		u32 spi = 0;
		/* Probe random candidates; give up after range-size attempts. */
		for (h=0; h<high-low+1; h++) {
			spi = low + net_random()%(high-low+1);
			x0 = xfrm_state_lookup(net, mark, &x->id.daddr, htonl(spi), x->id.proto, x->props.family);
			if (x0 == NULL) {
				x->id.spi = htonl(spi);
				break;
			}
			xfrm_state_put(x0);
		}
	}
	if (x->id.spi) {
		/* Make the state reachable through the SPI hash. */
		spin_lock_bh(&xfrm_state_lock);
		h = xfrm_spi_hash(net, &x->id.daddr, x->id.spi, x->id.proto, x->props.family);
		hlist_add_head(&x->byspi, net->xfrm.state_byspi+h);
		spin_unlock_bh(&xfrm_state_lock);

		err = 0;
	}

unlock:
	spin_unlock_bh(&x->lock);

	return err;
}
EXPORT_SYMBOL(xfrm_alloc_spi);
/*
 * Iterate over the states of @net, calling @func(state, walk->seq, @data)
 * for each live state whose protocol matches walk->proto.
 *
 * The walk is resumable: when @func returns non-zero, @walk's own list node
 * is moved into net->xfrm.state_all just before the current entry so that a
 * later call continues from there.  Entries whose state is XFRM_STATE_DEAD
 * are skipped.
 *
 * Returns 0 when the walk has completed (or had already completed on an
 * earlier call), the non-zero value returned by @func when it stopped the
 * walk, or -ENOENT if the list was exhausted without @func succeeding for
 * any entry (walk->seq is still 0).
 */
int xfrm_state_walk(struct net *net, struct xfrm_state_walk *walk,
		    int (*func)(struct xfrm_state *, int, void*),
		    void *data)
{
	struct xfrm_state *state;
	struct xfrm_state_walk *x;
	int err = 0;

	/* A started walk whose node is no longer linked has already finished. */
	if (walk->seq != 0 && list_empty(&walk->all))
		return 0;

	spin_lock_bh(&xfrm_state_lock);
	if (list_empty(&walk->all))
		x = list_first_entry(&net->xfrm.state_all, struct xfrm_state_walk, all);
	else
		/* Resume from the walker's own placeholder node. */
		x = list_entry(&walk->all, struct xfrm_state_walk, all);
	list_for_each_entry_from(x, &net->xfrm.state_all, all) {
		if (x->state == XFRM_STATE_DEAD)
			continue;
		state = container_of(x, struct xfrm_state, km);
		if (!xfrm_id_proto_match(state->id.proto, walk->proto))
			continue;
		err = func(state, walk->seq, data);
		if (err) {
			/* Remember the position: park the walker before this entry. */
			list_move_tail(&walk->all, &x->all);
			goto out;
		}
		walk->seq++;
	}
	if (walk->seq == 0) {
		err = -ENOENT;
		goto out;
	}
	list_del_init(&walk->all);
out:
	spin_unlock_bh(&xfrm_state_lock);
	return err;
}
EXPORT_SYMBOL(xfrm_state_walk);
  1347. void xfrm_state_walk_init(struct xfrm_state_walk *walk, u8 proto)
  1348. {
  1349. INIT_LIST_HEAD(&walk->all);
  1350. walk->proto = proto;
  1351. walk->state = XFRM_STATE_DEAD;
  1352. walk->seq = 0;
  1353. }
  1354. EXPORT_SYMBOL(xfrm_state_walk_init);
  1355. void xfrm_state_walk_done(struct xfrm_state_walk *walk)
  1356. {
  1357. if (list_empty(&walk->all))
  1358. return;
  1359. spin_lock_bh(&xfrm_state_lock);
  1360. list_del(&walk->all);
  1361. spin_unlock_bh(&xfrm_state_lock);
  1362. }
  1363. EXPORT_SYMBOL(xfrm_state_walk_done);
  1364. void xfrm_replay_notify(struct xfrm_state *x, int event)
  1365. {
  1366. struct km_event c;
  1367. /* we send notify messages in case
  1368. * 1. we updated on of the sequence numbers, and the seqno difference
  1369. * is at least x->replay_maxdiff, in this case we also update the
  1370. * timeout of our timer function
  1371. * 2. if x->replay_maxage has elapsed since last update,
  1372. * and there were changes
  1373. *
  1374. * The state structure must be locked!
  1375. */
  1376. switch (event) {
  1377. case XFRM_REPLAY_UPDATE:
  1378. if (x->replay_maxdiff &&
  1379. (x->replay.seq - x->preplay.seq < x->replay_maxdiff) &&
  1380. (x->replay.oseq - x->preplay.oseq < x->replay_maxdiff)) {
  1381. if (x->xflags & XFRM_TIME_DEFER)
  1382. event = XFRM_REPLAY_TIMEOUT;
  1383. else
  1384. return;
  1385. }
  1386. break;
  1387. case XFRM_REPLAY_TIMEOUT:
  1388. if ((x->replay.seq == x->preplay.seq) &&
  1389. (x->replay.bitmap == x->preplay.bitmap) &&
  1390. (x->replay.oseq == x->preplay.oseq)) {
  1391. x->xflags |= XFRM_TIME_DEFER;
  1392. return;
  1393. }
  1394. break;
  1395. }
  1396. memcpy(&x->preplay, &x->replay, sizeof(struct xfrm_replay_state));
  1397. c.event = XFRM_MSG_NEWAE;
  1398. c.data.aevent = event;
  1399. km_state_notify(x, &c);
  1400. if (x->replay_maxage &&
  1401. !mod_timer(&x->rtimer, jiffies + x->replay_maxage))
  1402. x->xflags &= ~XFRM_TIME_DEFER;
  1403. }
  1404. static void xfrm_replay_timer_handler(unsigned long data)
  1405. {
  1406. struct xfrm_state *x = (struct xfrm_state*)data;
  1407. spin_lock(&x->lock);
  1408. if (x->km.state == XFRM_STATE_VALID) {
  1409. if (xfrm_aevent_is_on(xs_net(x)))
  1410. xfrm_replay_notify(x, XFRM_REPLAY_TIMEOUT);
  1411. else
  1412. x->xflags |= XFRM_TIME_DEFER;
  1413. }
  1414. spin_unlock(&x->lock);
  1415. }
  1416. int xfrm_replay_check(struct xfrm_state *x,
  1417. struct sk_buff *skb, __be32 net_seq)
  1418. {
  1419. u32 diff;
  1420. u32 seq = ntohl(net_seq);
  1421. if (unlikely(seq == 0))
  1422. goto err;
  1423. if (likely(seq > x->replay.seq))
  1424. return 0;
  1425. diff = x->replay.seq - seq;
  1426. if (diff >= min_t(unsigned int, x->props.replay_window,
  1427. sizeof(x->replay.bitmap) * 8)) {
  1428. x->stats.replay_window++;
  1429. goto err;
  1430. }
  1431. if (x->replay.bitmap & (1U << diff)) {
  1432. x->stats.replay++;
  1433. goto err;
  1434. }
  1435. return 0;
  1436. err:
  1437. xfrm_audit_state_replay(x, skb, net_seq);
  1438. return -EINVAL;
  1439. }
  1440. void xfrm_replay_advance(struct xfrm_state *x, __be32 net_seq)
  1441. {
  1442. u32 diff;
  1443. u32 seq = ntohl(net_seq);
  1444. if (seq > x->replay.seq) {
  1445. diff = seq - x->replay.seq;
  1446. if (diff < x->props.replay_window)
  1447. x->replay.bitmap = ((x->replay.bitmap) << diff) | 1;
  1448. else
  1449. x->replay.bitmap = 1;
  1450. x->replay.seq = seq;
  1451. } else {
  1452. diff = x->replay.seq - seq;
  1453. x->replay.bitmap |= (1U << diff);
  1454. }
  1455. if (xfrm_aevent_is_on(xs_net(x)))
  1456. xfrm_replay_notify(x, XFRM_REPLAY_UPDATE);
  1457. }
  1458. static LIST_HEAD(xfrm_km_list);
  1459. static DEFINE_RWLOCK(xfrm_km_lock);
  1460. void km_policy_notify(struct xfrm_policy *xp, int dir, struct km_event *c)
  1461. {
  1462. struct xfrm_mgr *km;
  1463. read_lock(&xfrm_km_lock);
  1464. list_for_each_entry(km, &xfrm_km_list, list)
  1465. if (km->notify_policy)
  1466. km->notify_policy(xp, dir, c);
  1467. read_unlock(&xfrm_km_lock);
  1468. }
  1469. void km_state_notify(struct xfrm_state *x, struct km_event *c)
  1470. {
  1471. struct xfrm_mgr *km;
  1472. read_lock(&xfrm_km_lock);
  1473. list_for_each_entry(km, &xfrm_km_list, list)
  1474. if (km->notify)
  1475. km->notify(x, c);
  1476. read_unlock(&xfrm_km_lock);
  1477. }
  1478. EXPORT_SYMBOL(km_policy_notify);
  1479. EXPORT_SYMBOL(km_state_notify);
  1480. void km_state_expired(struct xfrm_state *x, int hard, u32 pid)
  1481. {
  1482. struct net *net = xs_net(x);
  1483. struct km_event c;
  1484. c.data.hard = hard;
  1485. c.pid = pid;
  1486. c.event = XFRM_MSG_EXPIRE;
  1487. km_state_notify(x, &c);
  1488. if (hard)
  1489. wake_up(&net->xfrm.km_waitq);
  1490. }
  1491. EXPORT_SYMBOL(km_state_expired);
  1492. /*
  1493. * We send to all registered managers regardless of failure
  1494. * We are happy with one success
  1495. */
  1496. int km_query(struct xfrm_state *x, struct xfrm_tmpl *t, struct xfrm_policy *pol)
  1497. {
  1498. int err = -EINVAL, acqret;
  1499. struct xfrm_mgr *km;
  1500. read_lock(&xfrm_km_lock);
  1501. list_for_each_entry(km, &xfrm_km_list, list) {
  1502. acqret = km->acquire(x, t, pol, XFRM_POLICY_OUT);
  1503. if (!acqret)
  1504. err = acqret;
  1505. }
  1506. read_unlock(&xfrm_km_lock);
  1507. return err;
  1508. }
  1509. EXPORT_SYMBOL(km_query);
  1510. int km_new_mapping(struct xfrm_state *x, xfrm_address_t *ipaddr, __be16 sport)
  1511. {
  1512. int err = -EINVAL;
  1513. struct xfrm_mgr *km;
  1514. read_lock(&xfrm_km_lock);
  1515. list_for_each_entry(km, &xfrm_km_list, list) {
  1516. if (km->new_mapping)
  1517. err = km->new_mapping(x, ipaddr, sport);
  1518. if (!err)
  1519. break;
  1520. }
  1521. read_unlock(&xfrm_km_lock);
  1522. return err;
  1523. }
  1524. EXPORT_SYMBOL(km_new_mapping);
  1525. void km_policy_expired(struct xfrm_policy *pol, int dir, int hard, u32 pid)
  1526. {
  1527. struct net *net = xp_net(pol);
  1528. struct km_event c;
  1529. c.data.hard = hard;
  1530. c.pid = pid;
  1531. c.event = XFRM_MSG_POLEXPIRE;
  1532. km_policy_notify(pol, dir, &c);
  1533. if (hard)
  1534. wake_up(&net->xfrm.km_waitq);
  1535. }
  1536. EXPORT_SYMBOL(km_policy_expired);
  1537. #ifdef CONFIG_XFRM_MIGRATE
  1538. int km_migrate(struct xfrm_selector *sel, u8 dir, u8 type,
  1539. struct xfrm_migrate *m, int num_migrate,
  1540. struct xfrm_kmaddress *k)
  1541. {
  1542. int err = -EINVAL;
  1543. int ret;
  1544. struct xfrm_mgr *km;
  1545. read_lock(&xfrm_km_lock);
  1546. list_for_each_entry(km, &xfrm_km_list, list) {
  1547. if (km->migrate) {
  1548. ret = km->migrate(sel, dir, type, m, num_migrate, k);
  1549. if (!ret)
  1550. err = ret;
  1551. }
  1552. }
  1553. read_unlock(&xfrm_km_lock);
  1554. return err;
  1555. }
  1556. EXPORT_SYMBOL(km_migrate);
  1557. #endif
  1558. int km_report(struct net *net, u8 proto, struct xfrm_selector *sel, xfrm_address_t *addr)
  1559. {
  1560. int err = -EINVAL;
  1561. int ret;
  1562. struct xfrm_mgr *km;
  1563. read_lock(&xfrm_km_lock);
  1564. list_for_each_entry(km, &xfrm_km_list, list) {
  1565. if (km->report) {
  1566. ret = km->report(net, proto, sel, addr);
  1567. if (!ret)
  1568. err = ret;
  1569. }
  1570. }
  1571. read_unlock(&xfrm_km_lock);
  1572. return err;
  1573. }
  1574. EXPORT_SYMBOL(km_report);
  1575. int xfrm_user_policy(struct sock *sk, int optname, u8 __user *optval, int optlen)
  1576. {
  1577. int err;
  1578. u8 *data;
  1579. struct xfrm_mgr *km;
  1580. struct xfrm_policy *pol = NULL;
  1581. if (optlen <= 0 || optlen > PAGE_SIZE)
  1582. return -EMSGSIZE;
  1583. data = kmalloc(optlen, GFP_KERNEL);
  1584. if (!data)
  1585. return -ENOMEM;
  1586. err = -EFAULT;
  1587. if (copy_from_user(data, optval, optlen))
  1588. goto out;
  1589. err = -EINVAL;
  1590. read_lock(&xfrm_km_lock);
  1591. list_for_each_entry(km, &xfrm_km_list, list) {
  1592. pol = km->compile_policy(sk, optname, data,
  1593. optlen, &err);
  1594. if (err >= 0)
  1595. break;
  1596. }
  1597. read_unlock(&xfrm_km_lock);
  1598. if (err >= 0) {
  1599. xfrm_sk_policy_insert(sk, err, pol);
  1600. xfrm_pol_put(pol);
  1601. err = 0;
  1602. }
  1603. out:
  1604. kfree(data);
  1605. return err;
  1606. }
  1607. EXPORT_SYMBOL(xfrm_user_policy);
  1608. int xfrm_register_km(struct xfrm_mgr *km)
  1609. {
  1610. write_lock_bh(&xfrm_km_lock);
  1611. list_add_tail(&km->list, &xfrm_km_list);
  1612. write_unlock_bh(&xfrm_km_lock);
  1613. return 0;
  1614. }
  1615. EXPORT_SYMBOL(xfrm_register_km);
  1616. int xfrm_unregister_km(struct xfrm_mgr *km)
  1617. {
  1618. write_lock_bh(&xfrm_km_lock);
  1619. list_del(&km->list);
  1620. write_unlock_bh(&xfrm_km_lock);
  1621. return 0;
  1622. }
  1623. EXPORT_SYMBOL(xfrm_unregister_km);
  1624. int xfrm_state_register_afinfo(struct xfrm_state_afinfo *afinfo)
  1625. {
  1626. int err = 0;
  1627. if (unlikely(afinfo == NULL))
  1628. return -EINVAL;
  1629. if (unlikely(afinfo->family >= NPROTO))
  1630. return -EAFNOSUPPORT;
  1631. write_lock_bh(&xfrm_state_afinfo_lock);
  1632. if (unlikely(xfrm_state_afinfo[afinfo->family] != NULL))
  1633. err = -ENOBUFS;
  1634. else
  1635. xfrm_state_afinfo[afinfo->family] = afinfo;
  1636. write_unlock_bh(&xfrm_state_afinfo_lock);
  1637. return err;
  1638. }
  1639. EXPORT_SYMBOL(xfrm_state_register_afinfo);
  1640. int xfrm_state_unregister_afinfo(struct xfrm_state_afinfo *afinfo)
  1641. {
  1642. int err = 0;
  1643. if (unlikely(afinfo == NULL))
  1644. return -EINVAL;
  1645. if (unlikely(afinfo->family >= NPROTO))
  1646. return -EAFNOSUPPORT;
  1647. write_lock_bh(&xfrm_state_afinfo_lock);
  1648. if (likely(xfrm_state_afinfo[afinfo->family] != NULL)) {
  1649. if (unlikely(xfrm_state_afinfo[afinfo->family] != afinfo))
  1650. err = -EINVAL;
  1651. else
  1652. xfrm_state_afinfo[afinfo->family] = NULL;
  1653. }
  1654. write_unlock_bh(&xfrm_state_afinfo_lock);
  1655. return err;
  1656. }
  1657. EXPORT_SYMBOL(xfrm_state_unregister_afinfo);
  1658. static struct xfrm_state_afinfo *xfrm_state_get_afinfo(unsigned int family)
  1659. {
  1660. struct xfrm_state_afinfo *afinfo;
  1661. if (unlikely(family >= NPROTO))
  1662. return NULL;
  1663. read_lock(&xfrm_state_afinfo_lock);
  1664. afinfo = xfrm_state_afinfo[family];
  1665. if (unlikely(!afinfo))
  1666. read_unlock(&xfrm_state_afinfo_lock);
  1667. return afinfo;
  1668. }
  1669. static void xfrm_state_put_afinfo(struct xfrm_state_afinfo *afinfo)
  1670. __releases(xfrm_state_afinfo_lock)
  1671. {
  1672. read_unlock(&xfrm_state_afinfo_lock);
  1673. }
  1674. /* Temporarily located here until net/xfrm/xfrm_tunnel.c is created */
  1675. void xfrm_state_delete_tunnel(struct xfrm_state *x)
  1676. {
  1677. if (x->tunnel) {
  1678. struct xfrm_state *t = x->tunnel;
  1679. if (atomic_read(&t->tunnel_users) == 2)
  1680. xfrm_state_delete(t);
  1681. atomic_dec(&t->tunnel_users);
  1682. xfrm_state_put(t);
  1683. x->tunnel = NULL;
  1684. }
  1685. }
  1686. EXPORT_SYMBOL(xfrm_state_delete_tunnel);
  1687. int xfrm_state_mtu(struct xfrm_state *x, int mtu)
  1688. {
  1689. int res;
  1690. spin_lock_bh(&x->lock);
  1691. if (x->km.state == XFRM_STATE_VALID &&
  1692. x->type && x->type->get_mtu)
  1693. res = x->type->get_mtu(x, mtu);
  1694. else
  1695. res = mtu - x->props.header_len;
  1696. spin_unlock_bh(&x->lock);
  1697. return res;
  1698. }
  1699. int xfrm_init_state(struct xfrm_state *x)
  1700. {
  1701. struct xfrm_state_afinfo *afinfo;
  1702. struct xfrm_mode *inner_mode;
  1703. int family = x->props.family;
  1704. int err;
  1705. err = -EAFNOSUPPORT;
  1706. afinfo = xfrm_state_get_afinfo(family);
  1707. if (!afinfo)
  1708. goto error;
  1709. err = 0;
  1710. if (afinfo->init_flags)
  1711. err = afinfo->init_flags(x);
  1712. xfrm_state_put_afinfo(afinfo);
  1713. if (err)
  1714. goto error;
  1715. err = -EPROTONOSUPPORT;
  1716. if (x->sel.family != AF_UNSPEC) {
  1717. inner_mode = xfrm_get_mode(x->props.mode, x->sel.family);
  1718. if (inner_mode == NULL)
  1719. goto error;
  1720. if (!(inner_mode->flags & XFRM_MODE_FLAG_TUNNEL) &&
  1721. family != x->sel.family) {
  1722. xfrm_put_mode(inner_mode);
  1723. goto error;
  1724. }
  1725. x->inner_mode = inner_mode;
  1726. } else {
  1727. struct xfrm_mode *inner_mode_iaf;
  1728. int iafamily = AF_INET;
  1729. inner_mode = xfrm_get_mode(x->props.mode, x->props.family);
  1730. if (inner_mode == NULL)
  1731. goto error;
  1732. if (!(inner_mode->flags & XFRM_MODE_FLAG_TUNNEL)) {
  1733. xfrm_put_mode(inner_mode);
  1734. goto error;
  1735. }
  1736. x->inner_mode = inner_mode;
  1737. if (x->props.family == AF_INET)
  1738. iafamily = AF_INET6;
  1739. inner_mode_iaf = xfrm_get_mode(x->props.mode, iafamily);
  1740. if (inner_mode_iaf) {
  1741. if (inner_mode_iaf->flags & XFRM_MODE_FLAG_TUNNEL)
  1742. x->inner_mode_iaf = inner_mode_iaf;
  1743. else
  1744. xfrm_put_mode(inner_mode_iaf);
  1745. }
  1746. }
  1747. x->type = xfrm_get_type(x->id.proto, family);
  1748. if (x->type == NULL)
  1749. goto error;
  1750. err = x->type->init_state(x);
  1751. if (err)
  1752. goto error;
  1753. x->outer_mode = xfrm_get_mode(x->props.mode, family);
  1754. if (x->outer_mode == NULL)
  1755. goto error;
  1756. x->km.state = XFRM_STATE_VALID;
  1757. error:
  1758. return err;
  1759. }
  1760. EXPORT_SYMBOL(xfrm_init_state);
  1761. int __net_init xfrm_state_init(struct net *net)
  1762. {
  1763. unsigned int sz;
  1764. INIT_LIST_HEAD(&net->xfrm.state_all);
  1765. sz = sizeof(struct hlist_head) * 8;
  1766. net->xfrm.state_bydst = xfrm_hash_alloc(sz);
  1767. if (!net->xfrm.state_bydst)
  1768. goto out_bydst;
  1769. net->xfrm.state_bysrc = xfrm_hash_alloc(sz);
  1770. if (!net->xfrm.state_bysrc)
  1771. goto out_bysrc;
  1772. net->xfrm.state_byspi = xfrm_hash_alloc(sz);
  1773. if (!net->xfrm.state_byspi)
  1774. goto out_byspi;
  1775. net->xfrm.state_hmask = ((sz / sizeof(struct hlist_head)) - 1);
  1776. net->xfrm.state_num = 0;
  1777. INIT_WORK(&net->xfrm.state_hash_work, xfrm_hash_resize);
  1778. INIT_HLIST_HEAD(&net->xfrm.state_gc_list);
  1779. INIT_WORK(&net->xfrm.state_gc_work, xfrm_state_gc_task);
  1780. init_waitqueue_head(&net->xfrm.km_waitq);
  1781. return 0;
  1782. out_byspi:
  1783. xfrm_hash_free(net->xfrm.state_bysrc, sz);
  1784. out_bysrc:
  1785. xfrm_hash_free(net->xfrm.state_bydst, sz);
  1786. out_bydst:
  1787. return -ENOMEM;
  1788. }
  1789. void xfrm_state_fini(struct net *net)
  1790. {
  1791. struct xfrm_audit audit_info;
  1792. unsigned int sz;
  1793. flush_work(&net->xfrm.state_hash_work);
  1794. audit_info.loginuid = -1;
  1795. audit_info.sessionid = -1;
  1796. audit_info.secid = 0;
  1797. xfrm_state_flush(net, IPSEC_PROTO_ANY, &audit_info);
  1798. flush_work(&net->xfrm.state_gc_work);
  1799. WARN_ON(!list_empty(&net->xfrm.state_all));
  1800. sz = (net->xfrm.state_hmask + 1) * sizeof(struct hlist_head);
  1801. WARN_ON(!hlist_empty(net->xfrm.state_byspi));
  1802. xfrm_hash_free(net->xfrm.state_byspi, sz);
  1803. WARN_ON(!hlist_empty(net->xfrm.state_bysrc));
  1804. xfrm_hash_free(net->xfrm.state_bysrc, sz);
  1805. WARN_ON(!hlist_empty(net->xfrm.state_bydst));
  1806. xfrm_hash_free(net->xfrm.state_bydst, sz);
  1807. }
  1808. #ifdef CONFIG_AUDITSYSCALL
  1809. static void xfrm_audit_helper_sainfo(struct xfrm_state *x,
  1810. struct audit_buffer *audit_buf)
  1811. {
  1812. struct xfrm_sec_ctx *ctx = x->security;
  1813. u32 spi = ntohl(x->id.spi);
  1814. if (ctx)
  1815. audit_log_format(audit_buf, " sec_alg=%u sec_doi=%u sec_obj=%s",
  1816. ctx->ctx_alg, ctx->ctx_doi, ctx->ctx_str);
  1817. switch(x->props.family) {
  1818. case AF_INET:
  1819. audit_log_format(audit_buf, " src=%pI4 dst=%pI4",
  1820. &x->props.saddr.a4, &x->id.daddr.a4);
  1821. break;
  1822. case AF_INET6:
  1823. audit_log_format(audit_buf, " src=%pI6 dst=%pI6",
  1824. x->props.saddr.a6, x->id.daddr.a6);
  1825. break;
  1826. }
  1827. audit_log_format(audit_buf, " spi=%u(0x%x)", spi, spi);
  1828. }
  1829. static void xfrm_audit_helper_pktinfo(struct sk_buff *skb, u16 family,
  1830. struct audit_buffer *audit_buf)
  1831. {
  1832. struct iphdr *iph4;
  1833. struct ipv6hdr *iph6;
  1834. switch (family) {
  1835. case AF_INET:
  1836. iph4 = ip_hdr(skb);
  1837. audit_log_format(audit_buf, " src=%pI4 dst=%pI4",
  1838. &iph4->saddr, &iph4->daddr);
  1839. break;
  1840. case AF_INET6:
  1841. iph6 = ipv6_hdr(skb);
  1842. audit_log_format(audit_buf,
  1843. " src=%pI6 dst=%pI6 flowlbl=0x%x%02x%02x",
  1844. &iph6->saddr,&iph6->daddr,
  1845. iph6->flow_lbl[0] & 0x0f,
  1846. iph6->flow_lbl[1],
  1847. iph6->flow_lbl[2]);
  1848. break;
  1849. }
  1850. }
  1851. void xfrm_audit_state_add(struct xfrm_state *x, int result,
  1852. uid_t auid, u32 sessionid, u32 secid)
  1853. {
  1854. struct audit_buffer *audit_buf;
  1855. audit_buf = xfrm_audit_start("SAD-add");
  1856. if (audit_buf == NULL)
  1857. return;
  1858. xfrm_audit_helper_usrinfo(auid, sessionid, secid, audit_buf);
  1859. xfrm_audit_helper_sainfo(x, audit_buf);
  1860. audit_log_format(audit_buf, " res=%u", result);
  1861. audit_log_end(audit_buf);
  1862. }
  1863. EXPORT_SYMBOL_GPL(xfrm_audit_state_add);
  1864. void xfrm_audit_state_delete(struct xfrm_state *x, int result,
  1865. uid_t auid, u32 sessionid, u32 secid)
  1866. {
  1867. struct audit_buffer *audit_buf;
  1868. audit_buf = xfrm_audit_start("SAD-delete");
  1869. if (audit_buf == NULL)
  1870. return;
  1871. xfrm_audit_helper_usrinfo(auid, sessionid, secid, audit_buf);
  1872. xfrm_audit_helper_sainfo(x, audit_buf);
  1873. audit_log_format(audit_buf, " res=%u", result);
  1874. audit_log_end(audit_buf);
  1875. }
  1876. EXPORT_SYMBOL_GPL(xfrm_audit_state_delete);
  1877. void xfrm_audit_state_replay_overflow(struct xfrm_state *x,
  1878. struct sk_buff *skb)
  1879. {
  1880. struct audit_buffer *audit_buf;
  1881. u32 spi;
  1882. audit_buf = xfrm_audit_start("SA-replay-overflow");
  1883. if (audit_buf == NULL)
  1884. return;
  1885. xfrm_audit_helper_pktinfo(skb, x->props.family, audit_buf);
  1886. /* don't record the sequence number because it's inherent in this kind
  1887. * of audit message */
  1888. spi = ntohl(x->id.spi);
  1889. audit_log_format(audit_buf, " spi=%u(0x%x)", spi, spi);
  1890. audit_log_end(audit_buf);
  1891. }
  1892. EXPORT_SYMBOL_GPL(xfrm_audit_state_replay_overflow);
  1893. static void xfrm_audit_state_replay(struct xfrm_state *x,
  1894. struct sk_buff *skb, __be32 net_seq)
  1895. {
  1896. struct audit_buffer *audit_buf;
  1897. u32 spi;
  1898. audit_buf = xfrm_audit_start("SA-replayed-pkt");
  1899. if (audit_buf == NULL)
  1900. return;
  1901. xfrm_audit_helper_pktinfo(skb, x->props.family, audit_buf);
  1902. spi = ntohl(x->id.spi);
  1903. audit_log_format(audit_buf, " spi=%u(0x%x) seqno=%u",
  1904. spi, spi, ntohl(net_seq));
  1905. audit_log_end(audit_buf);
  1906. }
  1907. void xfrm_audit_state_notfound_simple(struct sk_buff *skb, u16 family)
  1908. {
  1909. struct audit_buffer *audit_buf;
  1910. audit_buf = xfrm_audit_start("SA-notfound");
  1911. if (audit_buf == NULL)
  1912. return;
  1913. xfrm_audit_helper_pktinfo(skb, family, audit_buf);
  1914. audit_log_end(audit_buf);
  1915. }
  1916. EXPORT_SYMBOL_GPL(xfrm_audit_state_notfound_simple);
  1917. void xfrm_audit_state_notfound(struct sk_buff *skb, u16 family,
  1918. __be32 net_spi, __be32 net_seq)
  1919. {
  1920. struct audit_buffer *audit_buf;
  1921. u32 spi;
  1922. audit_buf = xfrm_audit_start("SA-notfound");
  1923. if (audit_buf == NULL)
  1924. return;
  1925. xfrm_audit_helper_pktinfo(skb, family, audit_buf);
  1926. spi = ntohl(net_spi);
  1927. audit_log_format(audit_buf, " spi=%u(0x%x) seqno=%u",
  1928. spi, spi, ntohl(net_seq));
  1929. audit_log_end(audit_buf);
  1930. }
  1931. EXPORT_SYMBOL_GPL(xfrm_audit_state_notfound);
  1932. void xfrm_audit_state_icvfail(struct xfrm_state *x,
  1933. struct sk_buff *skb, u8 proto)
  1934. {
  1935. struct audit_buffer *audit_buf;
  1936. __be32 net_spi;
  1937. __be32 net_seq;
  1938. audit_buf = xfrm_audit_start("SA-icv-failure");
  1939. if (audit_buf == NULL)
  1940. return;
  1941. xfrm_audit_helper_pktinfo(skb, x->props.family, audit_buf);
  1942. if (xfrm_parse_spi(skb, proto, &net_spi, &net_seq) == 0) {
  1943. u32 spi = ntohl(net_spi);
  1944. audit_log_format(audit_buf, " spi=%u(0x%x) seqno=%u",
  1945. spi, spi, ntohl(net_seq));
  1946. }
  1947. audit_log_end(audit_buf);
  1948. }
  1949. EXPORT_SYMBOL_GPL(xfrm_audit_state_icvfail);
  1950. #endif /* CONFIG_AUDITSYSCALL */