early_res.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590
  1. /*
  2. * early_res, could be used to replace bootmem
  3. */
  4. #include <linux/kernel.h>
  5. #include <linux/types.h>
  6. #include <linux/init.h>
  7. #include <linux/bootmem.h>
  8. #include <linux/mm.h>
  9. #include <linux/early_res.h>
  10. #include <linux/slab.h>
  11. #include <linux/kmemleak.h>
  12. /*
  13. * Early reserved memory areas.
  14. */
  15. /*
 * This table must be big enough to hold every reservation made before
 * find_fw_memmap_area() can be used.
  18. */
  19. #define MAX_EARLY_RES_X 32
  20. struct early_res {
  21. u64 start, end;
  22. char name[15];
  23. char overlap_ok;
  24. };
  25. static struct early_res early_res_x[MAX_EARLY_RES_X] __initdata;
  26. static int max_early_res __initdata = MAX_EARLY_RES_X;
  27. static struct early_res *early_res __initdata = &early_res_x[0];
  28. static int early_res_count __initdata;
  29. static int __init find_overlapped_early(u64 start, u64 end)
  30. {
  31. int i;
  32. struct early_res *r;
  33. for (i = 0; i < max_early_res && early_res[i].end; i++) {
  34. r = &early_res[i];
  35. if (end > r->start && start < r->end)
  36. break;
  37. }
  38. return i;
  39. }
  40. /*
  41. * Drop the i-th range from the early reservation map,
  42. * by copying any higher ranges down one over it, and
  43. * clearing what had been the last slot.
  44. */
  45. static void __init drop_range(int i)
  46. {
  47. int j;
  48. for (j = i + 1; j < max_early_res && early_res[j].end; j++)
  49. ;
  50. memmove(&early_res[i], &early_res[i + 1],
  51. (j - 1 - i) * sizeof(struct early_res));
  52. early_res[j - 1].end = 0;
  53. early_res_count--;
  54. }
  55. static void __init drop_range_partial(int i, u64 start, u64 end)
  56. {
  57. u64 common_start, common_end;
  58. u64 old_start, old_end;
  59. old_start = early_res[i].start;
  60. old_end = early_res[i].end;
  61. common_start = max(old_start, start);
  62. common_end = min(old_end, end);
  63. /* no overlap ? */
  64. if (common_start >= common_end)
  65. return;
  66. if (old_start < common_start) {
  67. /* make head segment */
  68. early_res[i].end = common_start;
  69. if (old_end > common_end) {
  70. char name[15];
  71. /*
  72. * Save a local copy of the name, since the
  73. * early_res array could get resized inside
  74. * reserve_early_without_check() ->
  75. * __check_and_double_early_res(), which would
  76. * make the current name pointer invalid.
  77. */
  78. strncpy(name, early_res[i].name,
  79. sizeof(early_res[i].name) - 1);
  80. /* add another for left over on tail */
  81. reserve_early_without_check(common_end, old_end, name);
  82. }
  83. return;
  84. } else {
  85. if (old_end > common_end) {
  86. /* reuse the entry for tail left */
  87. early_res[i].start = common_end;
  88. return;
  89. }
  90. /* all covered */
  91. drop_range(i);
  92. }
  93. }
  94. /*
  95. * Split any existing ranges that:
  96. * 1) are marked 'overlap_ok', and
  97. * 2) overlap with the stated range [start, end)
  98. * into whatever portion (if any) of the existing range is entirely
  99. * below or entirely above the stated range. Drop the portion
  100. * of the existing range that overlaps with the stated range,
  101. * which will allow the caller of this routine to then add that
  102. * stated range without conflicting with any existing range.
  103. */
  104. static void __init drop_overlaps_that_are_ok(u64 start, u64 end)
  105. {
  106. int i;
  107. struct early_res *r;
  108. u64 lower_start, lower_end;
  109. u64 upper_start, upper_end;
  110. char name[15];
  111. for (i = 0; i < max_early_res && early_res[i].end; i++) {
  112. r = &early_res[i];
  113. /* Continue past non-overlapping ranges */
  114. if (end <= r->start || start >= r->end)
  115. continue;
  116. /*
  117. * Leave non-ok overlaps as is; let caller
  118. * panic "Overlapping early reservations"
  119. * when it hits this overlap.
  120. */
  121. if (!r->overlap_ok)
  122. return;
  123. /*
  124. * We have an ok overlap. We will drop it from the early
  125. * reservation map, and add back in any non-overlapping
  126. * portions (lower or upper) as separate, overlap_ok,
  127. * non-overlapping ranges.
  128. */
  129. /* 1. Note any non-overlapping (lower or upper) ranges. */
  130. strncpy(name, r->name, sizeof(name) - 1);
  131. lower_start = lower_end = 0;
  132. upper_start = upper_end = 0;
  133. if (r->start < start) {
  134. lower_start = r->start;
  135. lower_end = start;
  136. }
  137. if (r->end > end) {
  138. upper_start = end;
  139. upper_end = r->end;
  140. }
  141. /* 2. Drop the original ok overlapping range */
  142. drop_range(i);
  143. i--; /* resume for-loop on copied down entry */
  144. /* 3. Add back in any non-overlapping ranges. */
  145. if (lower_end)
  146. reserve_early_overlap_ok(lower_start, lower_end, name);
  147. if (upper_end)
  148. reserve_early_overlap_ok(upper_start, upper_end, name);
  149. }
  150. }
  151. static void __init __reserve_early(u64 start, u64 end, char *name,
  152. int overlap_ok)
  153. {
  154. int i;
  155. struct early_res *r;
  156. i = find_overlapped_early(start, end);
  157. if (i >= max_early_res)
  158. panic("Too many early reservations");
  159. r = &early_res[i];
  160. if (r->end)
  161. panic("Overlapping early reservations "
  162. "%llx-%llx %s to %llx-%llx %s\n",
  163. start, end - 1, name ? name : "", r->start,
  164. r->end - 1, r->name);
  165. r->start = start;
  166. r->end = end;
  167. r->overlap_ok = overlap_ok;
  168. if (name)
  169. strncpy(r->name, name, sizeof(r->name) - 1);
  170. early_res_count++;
  171. }
  172. /*
 * A few early reservations come here.
  174. *
  175. * The 'overlap_ok' in the name of this routine does -not- mean it
  176. * is ok for these reservations to overlap an earlier reservation.
  177. * Rather it means that it is ok for subsequent reservations to
  178. * overlap this one.
  179. *
  180. * Use this entry point to reserve early ranges when you are doing
  181. * so out of "Paranoia", reserving perhaps more memory than you need,
  182. * just in case, and don't mind a subsequent overlapping reservation
  183. * that is known to be needed.
  184. *
  185. * The drop_overlaps_that_are_ok() call here isn't really needed.
  186. * It would be needed if we had two colliding 'overlap_ok'
  187. * reservations, so that the second such would not panic on the
  188. * overlap with the first. We don't have any such as of this
  189. * writing, but might as well tolerate such if it happens in
  190. * the future.
  191. */
  192. void __init reserve_early_overlap_ok(u64 start, u64 end, char *name)
  193. {
  194. drop_overlaps_that_are_ok(start, end);
  195. __reserve_early(start, end, name, 1);
  196. }
  197. static void __init __check_and_double_early_res(u64 ex_start, u64 ex_end)
  198. {
  199. u64 start, end, size, mem;
  200. struct early_res *new;
  201. /* do we have enough slots left ? */
  202. if ((max_early_res - early_res_count) > max(max_early_res/8, 2))
  203. return;
  204. /* double it */
  205. mem = -1ULL;
  206. size = sizeof(struct early_res) * max_early_res * 2;
  207. if (early_res == early_res_x)
  208. start = 0;
  209. else
  210. start = early_res[0].end;
  211. end = ex_start;
  212. if (start + size < end)
  213. mem = find_fw_memmap_area(start, end, size,
  214. sizeof(struct early_res));
  215. if (mem == -1ULL) {
  216. start = ex_end;
  217. end = get_max_mapped();
  218. if (start + size < end)
  219. mem = find_fw_memmap_area(start, end, size,
  220. sizeof(struct early_res));
  221. }
  222. if (mem == -1ULL)
  223. panic("can not find more space for early_res array");
  224. new = __va(mem);
  225. /* save the first one for own */
  226. new[0].start = mem;
  227. new[0].end = mem + size;
  228. new[0].overlap_ok = 0;
  229. /* copy old to new */
  230. if (early_res == early_res_x) {
  231. memcpy(&new[1], &early_res[0],
  232. sizeof(struct early_res) * max_early_res);
  233. memset(&new[max_early_res+1], 0,
  234. sizeof(struct early_res) * (max_early_res - 1));
  235. early_res_count++;
  236. } else {
  237. memcpy(&new[1], &early_res[1],
  238. sizeof(struct early_res) * (max_early_res - 1));
  239. memset(&new[max_early_res], 0,
  240. sizeof(struct early_res) * max_early_res);
  241. }
  242. memset(&early_res[0], 0, sizeof(struct early_res) * max_early_res);
  243. early_res = new;
  244. max_early_res *= 2;
  245. printk(KERN_DEBUG "early_res array is doubled to %d at [%llx - %llx]\n",
  246. max_early_res, mem, mem + size - 1);
  247. }
  248. /*
  249. * Most early reservations come here.
  250. *
  251. * We first have drop_overlaps_that_are_ok() drop any pre-existing
  252. * 'overlap_ok' ranges, so that we can then reserve this memory
  253. * range without risk of panic'ing on an overlapping overlap_ok
  254. * early reservation.
  255. */
  256. void __init reserve_early(u64 start, u64 end, char *name)
  257. {
  258. if (start >= end)
  259. return;
  260. __check_and_double_early_res(start, end);
  261. drop_overlaps_that_are_ok(start, end);
  262. __reserve_early(start, end, name, 0);
  263. }
  264. void __init reserve_early_without_check(u64 start, u64 end, char *name)
  265. {
  266. struct early_res *r;
  267. if (start >= end)
  268. return;
  269. __check_and_double_early_res(start, end);
  270. r = &early_res[early_res_count];
  271. r->start = start;
  272. r->end = end;
  273. r->overlap_ok = 0;
  274. if (name)
  275. strncpy(r->name, name, sizeof(r->name) - 1);
  276. early_res_count++;
  277. }
  278. void __init free_early(u64 start, u64 end)
  279. {
  280. struct early_res *r;
  281. int i;
  282. kmemleak_free_part(__va(start), end - start);
  283. i = find_overlapped_early(start, end);
  284. r = &early_res[i];
  285. if (i >= max_early_res || r->end != end || r->start != start)
  286. panic("free_early on not reserved area: %llx-%llx!",
  287. start, end - 1);
  288. drop_range(i);
  289. }
  290. void __init free_early_partial(u64 start, u64 end)
  291. {
  292. struct early_res *r;
  293. int i;
  294. kmemleak_free_part(__va(start), end - start);
  295. if (start == end)
  296. return;
  297. if (WARN_ONCE(start > end, " wrong range [%#llx, %#llx]\n", start, end))
  298. return;
  299. try_next:
  300. i = find_overlapped_early(start, end);
  301. if (i >= max_early_res)
  302. return;
  303. r = &early_res[i];
  304. /* hole ? */
  305. if (r->end >= end && r->start <= start) {
  306. drop_range_partial(i, start, end);
  307. return;
  308. }
  309. drop_range_partial(i, start, end);
  310. goto try_next;
  311. }
  312. #ifdef CONFIG_NO_BOOTMEM
  313. static void __init subtract_early_res(struct range *range, int az)
  314. {
  315. int i, count;
  316. u64 final_start, final_end;
  317. int idx = 0;
  318. count = 0;
  319. for (i = 0; i < max_early_res && early_res[i].end; i++)
  320. count++;
  321. /* need to skip first one ?*/
  322. if (early_res != early_res_x)
  323. idx = 1;
  324. #define DEBUG_PRINT_EARLY_RES 1
  325. #if DEBUG_PRINT_EARLY_RES
  326. printk(KERN_INFO "Subtract (%d early reservations)\n", count);
  327. #endif
  328. for (i = idx; i < count; i++) {
  329. struct early_res *r = &early_res[i];
  330. #if DEBUG_PRINT_EARLY_RES
  331. printk(KERN_INFO " #%d [%010llx - %010llx] %15s\n", i,
  332. r->start, r->end, r->name);
  333. #endif
  334. final_start = PFN_DOWN(r->start);
  335. final_end = PFN_UP(r->end);
  336. if (final_start >= final_end)
  337. continue;
  338. subtract_range(range, az, final_start, final_end);
  339. }
  340. }
  341. int __init get_free_all_memory_range(struct range **rangep, int nodeid)
  342. {
  343. int i, count;
  344. u64 start = 0, end;
  345. u64 size;
  346. u64 mem;
  347. struct range *range;
  348. int nr_range;
  349. count = 0;
  350. for (i = 0; i < max_early_res && early_res[i].end; i++)
  351. count++;
  352. count *= 2;
  353. size = sizeof(struct range) * count;
  354. end = get_max_mapped();
  355. #ifdef MAX_DMA32_PFN
  356. if (end > (MAX_DMA32_PFN << PAGE_SHIFT))
  357. start = MAX_DMA32_PFN << PAGE_SHIFT;
  358. #endif
  359. mem = find_fw_memmap_area(start, end, size, sizeof(struct range));
  360. if (mem == -1ULL)
  361. panic("can not find more space for range free");
  362. range = __va(mem);
  363. /* use early_node_map[] and early_res to get range array at first */
  364. memset(range, 0, size);
  365. nr_range = 0;
  366. /* need to go over early_node_map to find out good range for node */
  367. nr_range = add_from_early_node_map(range, count, nr_range, nodeid);
  368. #ifdef CONFIG_X86_32
  369. subtract_range(range, count, max_low_pfn, -1ULL);
  370. #endif
  371. subtract_early_res(range, count);
  372. nr_range = clean_sort_range(range, count);
  373. /* need to clear it ? */
  374. if (nodeid == MAX_NUMNODES) {
  375. memset(&early_res[0], 0,
  376. sizeof(struct early_res) * max_early_res);
  377. early_res = NULL;
  378. max_early_res = 0;
  379. }
  380. *rangep = range;
  381. return nr_range;
  382. }
  383. #else
  384. void __init early_res_to_bootmem(u64 start, u64 end)
  385. {
  386. int i, count;
  387. u64 final_start, final_end;
  388. int idx = 0;
  389. count = 0;
  390. for (i = 0; i < max_early_res && early_res[i].end; i++)
  391. count++;
  392. /* need to skip first one ?*/
  393. if (early_res != early_res_x)
  394. idx = 1;
  395. printk(KERN_INFO "(%d/%d early reservations) ==> bootmem [%010llx - %010llx]\n",
  396. count - idx, max_early_res, start, end);
  397. for (i = idx; i < count; i++) {
  398. struct early_res *r = &early_res[i];
  399. printk(KERN_INFO " #%d [%010llx - %010llx] %16s", i,
  400. r->start, r->end, r->name);
  401. final_start = max(start, r->start);
  402. final_end = min(end, r->end);
  403. if (final_start >= final_end) {
  404. printk(KERN_CONT "\n");
  405. continue;
  406. }
  407. printk(KERN_CONT " ==> [%010llx - %010llx]\n",
  408. final_start, final_end);
  409. reserve_bootmem_generic(final_start, final_end - final_start,
  410. BOOTMEM_DEFAULT);
  411. }
  412. /* clear them */
  413. memset(&early_res[0], 0, sizeof(struct early_res) * max_early_res);
  414. early_res = NULL;
  415. max_early_res = 0;
  416. early_res_count = 0;
  417. }
  418. #endif
  419. /* Check for already reserved areas */
  420. static inline int __init bad_addr(u64 *addrp, u64 size, u64 align)
  421. {
  422. int i;
  423. u64 addr = *addrp;
  424. int changed = 0;
  425. struct early_res *r;
  426. again:
  427. i = find_overlapped_early(addr, addr + size);
  428. r = &early_res[i];
  429. if (i < max_early_res && r->end) {
  430. *addrp = addr = round_up(r->end, align);
  431. changed = 1;
  432. goto again;
  433. }
  434. return changed;
  435. }
  436. /* Check for already reserved areas */
  437. static inline int __init bad_addr_size(u64 *addrp, u64 *sizep, u64 align)
  438. {
  439. int i;
  440. u64 addr = *addrp, last;
  441. u64 size = *sizep;
  442. int changed = 0;
  443. again:
  444. last = addr + size;
  445. for (i = 0; i < max_early_res && early_res[i].end; i++) {
  446. struct early_res *r = &early_res[i];
  447. if (last > r->start && addr < r->start) {
  448. size = r->start - addr;
  449. changed = 1;
  450. goto again;
  451. }
  452. if (last > r->end && addr < r->end) {
  453. addr = round_up(r->end, align);
  454. size = last - addr;
  455. changed = 1;
  456. goto again;
  457. }
  458. if (last <= r->end && addr >= r->start) {
  459. (*sizep)++;
  460. return 0;
  461. }
  462. }
  463. if (changed) {
  464. *addrp = addr;
  465. *sizep = size;
  466. }
  467. return changed;
  468. }
  469. /*
  470. * Find a free area with specified alignment in a specific range.
  471. * only with the area.between start to end is active range from early_node_map
  472. * so they are good as RAM
  473. */
  474. u64 __init find_early_area(u64 ei_start, u64 ei_last, u64 start, u64 end,
  475. u64 size, u64 align)
  476. {
  477. u64 addr, last;
  478. addr = round_up(ei_start, align);
  479. if (addr < start)
  480. addr = round_up(start, align);
  481. if (addr >= ei_last)
  482. goto out;
  483. while (bad_addr(&addr, size, align) && addr+size <= ei_last)
  484. ;
  485. last = addr + size;
  486. if (last > ei_last)
  487. goto out;
  488. if (last > end)
  489. goto out;
  490. return addr;
  491. out:
  492. return -1ULL;
  493. }
  494. u64 __init find_early_area_size(u64 ei_start, u64 ei_last, u64 start,
  495. u64 *sizep, u64 align)
  496. {
  497. u64 addr, last;
  498. addr = round_up(ei_start, align);
  499. if (addr < start)
  500. addr = round_up(start, align);
  501. if (addr >= ei_last)
  502. goto out;
  503. *sizep = ei_last - addr;
  504. while (bad_addr_size(&addr, sizep, align) && addr + *sizep <= ei_last)
  505. ;
  506. last = addr + *sizep;
  507. if (last > ei_last)
  508. goto out;
  509. return addr;
  510. out:
  511. return -1ULL;
  512. }