/* binfmt_elf_fdpic.c (46 KB) */
  1. /* binfmt_elf_fdpic.c: FDPIC ELF binary format
  2. *
  3. * Copyright (C) 2003, 2004, 2006 Red Hat, Inc. All Rights Reserved.
  4. * Written by David Howells (dhowells@redhat.com)
  5. * Derived from binfmt_elf.c
  6. *
  7. * This program is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU General Public License
  9. * as published by the Free Software Foundation; either version
  10. * 2 of the License, or (at your option) any later version.
  11. */
  12. #include <linux/module.h>
  13. #include <linux/fs.h>
  14. #include <linux/stat.h>
  15. #include <linux/sched.h>
  16. #include <linux/mm.h>
  17. #include <linux/mman.h>
  18. #include <linux/errno.h>
  19. #include <linux/signal.h>
  20. #include <linux/binfmts.h>
  21. #include <linux/string.h>
  22. #include <linux/file.h>
  23. #include <linux/fcntl.h>
  24. #include <linux/slab.h>
  25. #include <linux/pagemap.h>
  26. #include <linux/highmem.h>
  27. #include <linux/highuid.h>
  28. #include <linux/personality.h>
  29. #include <linux/ptrace.h>
  30. #include <linux/init.h>
  31. #include <linux/smp_lock.h>
  32. #include <linux/elf.h>
  33. #include <linux/elf-fdpic.h>
  34. #include <linux/elfcore.h>
  35. #include <asm/uaccess.h>
  36. #include <asm/param.h>
  37. #include <asm/pgalloc.h>
  38. typedef char *elf_caddr_t;
  39. #if 0
  40. #define kdebug(fmt, ...) printk("FDPIC "fmt"\n" ,##__VA_ARGS__ )
  41. #else
  42. #define kdebug(fmt, ...) do {} while(0)
  43. #endif
  44. #if 0
  45. #define kdcore(fmt, ...) printk("FDPIC "fmt"\n" ,##__VA_ARGS__ )
  46. #else
  47. #define kdcore(fmt, ...) do {} while(0)
  48. #endif
  49. MODULE_LICENSE("GPL");
  50. static int load_elf_fdpic_binary(struct linux_binprm *, struct pt_regs *);
  51. static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *, struct file *);
  52. static int elf_fdpic_map_file(struct elf_fdpic_params *, struct file *,
  53. struct mm_struct *, const char *);
  54. static int create_elf_fdpic_tables(struct linux_binprm *, struct mm_struct *,
  55. struct elf_fdpic_params *,
  56. struct elf_fdpic_params *);
  57. #ifndef CONFIG_MMU
  58. static int elf_fdpic_transfer_args_to_stack(struct linux_binprm *,
  59. unsigned long *);
  60. static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *,
  61. struct file *,
  62. struct mm_struct *);
  63. #endif
  64. static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *,
  65. struct file *, struct mm_struct *);
  66. #if defined(USE_ELF_CORE_DUMP) && defined(CONFIG_ELF_CORE)
  67. static int elf_fdpic_core_dump(long, struct pt_regs *, struct file *);
  68. #endif
  69. static struct linux_binfmt elf_fdpic_format = {
  70. .module = THIS_MODULE,
  71. .load_binary = load_elf_fdpic_binary,
  72. #if defined(USE_ELF_CORE_DUMP) && defined(CONFIG_ELF_CORE)
  73. .core_dump = elf_fdpic_core_dump,
  74. #endif
  75. .min_coredump = ELF_EXEC_PAGESIZE,
  76. };
  77. static int __init init_elf_fdpic_binfmt(void)
  78. {
  79. return register_binfmt(&elf_fdpic_format);
  80. }
  81. static void __exit exit_elf_fdpic_binfmt(void)
  82. {
  83. unregister_binfmt(&elf_fdpic_format);
  84. }
  85. core_initcall(init_elf_fdpic_binfmt);
  86. module_exit(exit_elf_fdpic_binfmt);
  87. static int is_elf_fdpic(struct elfhdr *hdr, struct file *file)
  88. {
  89. if (memcmp(hdr->e_ident, ELFMAG, SELFMAG) != 0)
  90. return 0;
  91. if (hdr->e_type != ET_EXEC && hdr->e_type != ET_DYN)
  92. return 0;
  93. if (!elf_check_arch(hdr) || !elf_check_fdpic(hdr))
  94. return 0;
  95. if (!file->f_op || !file->f_op->mmap)
  96. return 0;
  97. return 1;
  98. }
  99. /*****************************************************************************/
  100. /*
  101. * read the program headers table into memory
  102. */
  103. static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *params,
  104. struct file *file)
  105. {
  106. struct elf32_phdr *phdr;
  107. unsigned long size;
  108. int retval, loop;
  109. if (params->hdr.e_phentsize != sizeof(struct elf_phdr))
  110. return -ENOMEM;
  111. if (params->hdr.e_phnum > 65536U / sizeof(struct elf_phdr))
  112. return -ENOMEM;
  113. size = params->hdr.e_phnum * sizeof(struct elf_phdr);
  114. params->phdrs = kmalloc(size, GFP_KERNEL);
  115. if (!params->phdrs)
  116. return -ENOMEM;
  117. retval = kernel_read(file, params->hdr.e_phoff,
  118. (char *) params->phdrs, size);
  119. if (retval < 0)
  120. return retval;
  121. /* determine stack size for this binary */
  122. phdr = params->phdrs;
  123. for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) {
  124. if (phdr->p_type != PT_GNU_STACK)
  125. continue;
  126. if (phdr->p_flags & PF_X)
  127. params->flags |= ELF_FDPIC_FLAG_EXEC_STACK;
  128. else
  129. params->flags |= ELF_FDPIC_FLAG_NOEXEC_STACK;
  130. params->stack_size = phdr->p_memsz;
  131. break;
  132. }
  133. return 0;
  134. }
  135. /*****************************************************************************/
  136. /*
  137. * load an fdpic binary into various bits of memory
  138. */
  139. static int load_elf_fdpic_binary(struct linux_binprm *bprm,
  140. struct pt_regs *regs)
  141. {
  142. struct elf_fdpic_params exec_params, interp_params;
  143. struct elf_phdr *phdr;
  144. unsigned long stack_size, entryaddr;
  145. #ifndef CONFIG_MMU
  146. unsigned long fullsize;
  147. #endif
  148. #ifdef ELF_FDPIC_PLAT_INIT
  149. unsigned long dynaddr;
  150. #endif
  151. struct file *interpreter = NULL; /* to shut gcc up */
  152. char *interpreter_name = NULL;
  153. int executable_stack;
  154. int retval, i;
  155. memset(&exec_params, 0, sizeof(exec_params));
  156. memset(&interp_params, 0, sizeof(interp_params));
  157. exec_params.hdr = *(struct elfhdr *) bprm->buf;
  158. exec_params.flags = ELF_FDPIC_FLAG_PRESENT | ELF_FDPIC_FLAG_EXECUTABLE;
  159. /* check that this is a binary we know how to deal with */
  160. retval = -ENOEXEC;
  161. if (!is_elf_fdpic(&exec_params.hdr, bprm->file))
  162. goto error;
  163. /* read the program header table */
  164. retval = elf_fdpic_fetch_phdrs(&exec_params, bprm->file);
  165. if (retval < 0)
  166. goto error;
  167. /* scan for a program header that specifies an interpreter */
  168. phdr = exec_params.phdrs;
  169. for (i = 0; i < exec_params.hdr.e_phnum; i++, phdr++) {
  170. switch (phdr->p_type) {
  171. case PT_INTERP:
  172. retval = -ENOMEM;
  173. if (phdr->p_filesz > PATH_MAX)
  174. goto error;
  175. retval = -ENOENT;
  176. if (phdr->p_filesz < 2)
  177. goto error;
  178. /* read the name of the interpreter into memory */
  179. interpreter_name = kmalloc(phdr->p_filesz, GFP_KERNEL);
  180. if (!interpreter_name)
  181. goto error;
  182. retval = kernel_read(bprm->file,
  183. phdr->p_offset,
  184. interpreter_name,
  185. phdr->p_filesz);
  186. if (retval < 0)
  187. goto error;
  188. retval = -ENOENT;
  189. if (interpreter_name[phdr->p_filesz - 1] != '\0')
  190. goto error;
  191. kdebug("Using ELF interpreter %s", interpreter_name);
  192. /* replace the program with the interpreter */
  193. interpreter = open_exec(interpreter_name);
  194. retval = PTR_ERR(interpreter);
  195. if (IS_ERR(interpreter)) {
  196. interpreter = NULL;
  197. goto error;
  198. }
  199. retval = kernel_read(interpreter, 0, bprm->buf,
  200. BINPRM_BUF_SIZE);
  201. if (retval < 0)
  202. goto error;
  203. interp_params.hdr = *((struct elfhdr *) bprm->buf);
  204. break;
  205. case PT_LOAD:
  206. #ifdef CONFIG_MMU
  207. if (exec_params.load_addr == 0)
  208. exec_params.load_addr = phdr->p_vaddr;
  209. #endif
  210. break;
  211. }
  212. }
  213. if (elf_check_const_displacement(&exec_params.hdr))
  214. exec_params.flags |= ELF_FDPIC_FLAG_CONSTDISP;
  215. /* perform insanity checks on the interpreter */
  216. if (interpreter_name) {
  217. retval = -ELIBBAD;
  218. if (!is_elf_fdpic(&interp_params.hdr, interpreter))
  219. goto error;
  220. interp_params.flags = ELF_FDPIC_FLAG_PRESENT;
  221. /* read the interpreter's program header table */
  222. retval = elf_fdpic_fetch_phdrs(&interp_params, interpreter);
  223. if (retval < 0)
  224. goto error;
  225. }
  226. stack_size = exec_params.stack_size;
  227. if (stack_size < interp_params.stack_size)
  228. stack_size = interp_params.stack_size;
  229. if (exec_params.flags & ELF_FDPIC_FLAG_EXEC_STACK)
  230. executable_stack = EXSTACK_ENABLE_X;
  231. else if (exec_params.flags & ELF_FDPIC_FLAG_NOEXEC_STACK)
  232. executable_stack = EXSTACK_DISABLE_X;
  233. else if (interp_params.flags & ELF_FDPIC_FLAG_EXEC_STACK)
  234. executable_stack = EXSTACK_ENABLE_X;
  235. else if (interp_params.flags & ELF_FDPIC_FLAG_NOEXEC_STACK)
  236. executable_stack = EXSTACK_DISABLE_X;
  237. else
  238. executable_stack = EXSTACK_DEFAULT;
  239. retval = -ENOEXEC;
  240. if (stack_size == 0)
  241. goto error;
  242. if (elf_check_const_displacement(&interp_params.hdr))
  243. interp_params.flags |= ELF_FDPIC_FLAG_CONSTDISP;
  244. /* flush all traces of the currently running executable */
  245. retval = flush_old_exec(bprm);
  246. if (retval)
  247. goto error;
  248. /* there's now no turning back... the old userspace image is dead,
  249. * defunct, deceased, etc. after this point we have to exit via
  250. * error_kill */
  251. set_personality(PER_LINUX_FDPIC);
  252. set_binfmt(&elf_fdpic_format);
  253. current->mm->start_code = 0;
  254. current->mm->end_code = 0;
  255. current->mm->start_stack = 0;
  256. current->mm->start_data = 0;
  257. current->mm->end_data = 0;
  258. current->mm->context.exec_fdpic_loadmap = 0;
  259. current->mm->context.interp_fdpic_loadmap = 0;
  260. current->flags &= ~PF_FORKNOEXEC;
  261. #ifdef CONFIG_MMU
  262. elf_fdpic_arch_lay_out_mm(&exec_params,
  263. &interp_params,
  264. &current->mm->start_stack,
  265. &current->mm->start_brk);
  266. retval = setup_arg_pages(bprm, current->mm->start_stack,
  267. executable_stack);
  268. if (retval < 0) {
  269. send_sig(SIGKILL, current, 0);
  270. goto error_kill;
  271. }
  272. #endif
  273. /* load the executable and interpreter into memory */
  274. retval = elf_fdpic_map_file(&exec_params, bprm->file, current->mm,
  275. "executable");
  276. if (retval < 0)
  277. goto error_kill;
  278. if (interpreter_name) {
  279. retval = elf_fdpic_map_file(&interp_params, interpreter,
  280. current->mm, "interpreter");
  281. if (retval < 0) {
  282. printk(KERN_ERR "Unable to load interpreter\n");
  283. goto error_kill;
  284. }
  285. allow_write_access(interpreter);
  286. fput(interpreter);
  287. interpreter = NULL;
  288. }
  289. #ifdef CONFIG_MMU
  290. if (!current->mm->start_brk)
  291. current->mm->start_brk = current->mm->end_data;
  292. current->mm->brk = current->mm->start_brk =
  293. PAGE_ALIGN(current->mm->start_brk);
  294. #else
  295. /* create a stack and brk area big enough for everyone
  296. * - the brk heap starts at the bottom and works up
  297. * - the stack starts at the top and works down
  298. */
  299. stack_size = (stack_size + PAGE_SIZE - 1) & PAGE_MASK;
  300. if (stack_size < PAGE_SIZE * 2)
  301. stack_size = PAGE_SIZE * 2;
  302. down_write(&current->mm->mmap_sem);
  303. current->mm->start_brk = do_mmap(NULL, 0, stack_size,
  304. PROT_READ | PROT_WRITE | PROT_EXEC,
  305. MAP_PRIVATE | MAP_ANON | MAP_GROWSDOWN,
  306. 0);
  307. if (IS_ERR_VALUE(current->mm->start_brk)) {
  308. up_write(&current->mm->mmap_sem);
  309. retval = current->mm->start_brk;
  310. current->mm->start_brk = 0;
  311. goto error_kill;
  312. }
  313. /* expand the stack mapping to use up the entire allocation granule */
  314. fullsize = ksize((char *) current->mm->start_brk);
  315. if (!IS_ERR_VALUE(do_mremap(current->mm->start_brk, stack_size,
  316. fullsize, 0, 0)))
  317. stack_size = fullsize;
  318. up_write(&current->mm->mmap_sem);
  319. current->mm->brk = current->mm->start_brk;
  320. current->mm->context.end_brk = current->mm->start_brk;
  321. current->mm->context.end_brk +=
  322. (stack_size > PAGE_SIZE) ? (stack_size - PAGE_SIZE) : 0;
  323. current->mm->start_stack = current->mm->start_brk + stack_size;
  324. #endif
  325. compute_creds(bprm);
  326. current->flags &= ~PF_FORKNOEXEC;
  327. if (create_elf_fdpic_tables(bprm, current->mm,
  328. &exec_params, &interp_params) < 0)
  329. goto error_kill;
  330. kdebug("- start_code %lx", current->mm->start_code);
  331. kdebug("- end_code %lx", current->mm->end_code);
  332. kdebug("- start_data %lx", current->mm->start_data);
  333. kdebug("- end_data %lx", current->mm->end_data);
  334. kdebug("- start_brk %lx", current->mm->start_brk);
  335. kdebug("- brk %lx", current->mm->brk);
  336. kdebug("- start_stack %lx", current->mm->start_stack);
  337. #ifdef ELF_FDPIC_PLAT_INIT
  338. /*
  339. * The ABI may specify that certain registers be set up in special
  340. * ways (on i386 %edx is the address of a DT_FINI function, for
  341. * example. This macro performs whatever initialization to
  342. * the regs structure is required.
  343. */
  344. dynaddr = interp_params.dynamic_addr ?: exec_params.dynamic_addr;
  345. ELF_FDPIC_PLAT_INIT(regs, exec_params.map_addr, interp_params.map_addr,
  346. dynaddr);
  347. #endif
  348. /* everything is now ready... get the userspace context ready to roll */
  349. entryaddr = interp_params.entry_addr ?: exec_params.entry_addr;
  350. start_thread(regs, entryaddr, current->mm->start_stack);
  351. if (unlikely(current->ptrace & PT_PTRACED)) {
  352. if (current->ptrace & PT_TRACE_EXEC)
  353. ptrace_notify((PTRACE_EVENT_EXEC << 8) | SIGTRAP);
  354. else
  355. send_sig(SIGTRAP, current, 0);
  356. }
  357. retval = 0;
  358. error:
  359. if (interpreter) {
  360. allow_write_access(interpreter);
  361. fput(interpreter);
  362. }
  363. kfree(interpreter_name);
  364. kfree(exec_params.phdrs);
  365. kfree(exec_params.loadmap);
  366. kfree(interp_params.phdrs);
  367. kfree(interp_params.loadmap);
  368. return retval;
  369. /* unrecoverable error - kill the process */
  370. error_kill:
  371. send_sig(SIGSEGV, current, 0);
  372. goto error;
  373. }
  374. /*****************************************************************************/
  375. /*
  376. * present useful information to the program
  377. */
  378. static int create_elf_fdpic_tables(struct linux_binprm *bprm,
  379. struct mm_struct *mm,
  380. struct elf_fdpic_params *exec_params,
  381. struct elf_fdpic_params *interp_params)
  382. {
  383. unsigned long sp, csp, nitems;
  384. elf_caddr_t __user *argv, *envp;
  385. size_t platform_len = 0, len;
  386. char *k_platform;
  387. char __user *u_platform, *p;
  388. long hwcap;
  389. int loop;
  390. /* we're going to shovel a whole load of stuff onto the stack */
  391. #ifdef CONFIG_MMU
  392. sp = bprm->p;
  393. #else
  394. sp = mm->start_stack;
  395. /* stack the program arguments and environment */
  396. if (elf_fdpic_transfer_args_to_stack(bprm, &sp) < 0)
  397. return -EFAULT;
  398. #endif
  399. /* get hold of platform and hardware capabilities masks for the machine
  400. * we are running on. In some cases (Sparc), this info is impossible
  401. * to get, in others (i386) it is merely difficult.
  402. */
  403. hwcap = ELF_HWCAP;
  404. k_platform = ELF_PLATFORM;
  405. u_platform = NULL;
  406. if (k_platform) {
  407. platform_len = strlen(k_platform) + 1;
  408. sp -= platform_len;
  409. u_platform = (char __user *) sp;
  410. if (__copy_to_user(u_platform, k_platform, platform_len) != 0)
  411. return -EFAULT;
  412. }
  413. #if defined(__i386__) && defined(CONFIG_SMP)
  414. /* in some cases (e.g. Hyper-Threading), we want to avoid L1 evictions
  415. * by the processes running on the same package. One thing we can do is
  416. * to shuffle the initial stack for them.
  417. *
  418. * the conditionals here are unneeded, but kept in to make the code
  419. * behaviour the same as pre change unless we have hyperthreaded
  420. * processors. This keeps Mr Marcelo Person happier but should be
  421. * removed for 2.5
  422. */
  423. if (smp_num_siblings > 1)
  424. sp = sp - ((current->pid % 64) << 7);
  425. #endif
  426. sp &= ~7UL;
  427. /* stack the load map(s) */
  428. len = sizeof(struct elf32_fdpic_loadmap);
  429. len += sizeof(struct elf32_fdpic_loadseg) * exec_params->loadmap->nsegs;
  430. sp = (sp - len) & ~7UL;
  431. exec_params->map_addr = sp;
  432. if (copy_to_user((void __user *) sp, exec_params->loadmap, len) != 0)
  433. return -EFAULT;
  434. current->mm->context.exec_fdpic_loadmap = (unsigned long) sp;
  435. if (interp_params->loadmap) {
  436. len = sizeof(struct elf32_fdpic_loadmap);
  437. len += sizeof(struct elf32_fdpic_loadseg) *
  438. interp_params->loadmap->nsegs;
  439. sp = (sp - len) & ~7UL;
  440. interp_params->map_addr = sp;
  441. if (copy_to_user((void __user *) sp, interp_params->loadmap,
  442. len) != 0)
  443. return -EFAULT;
  444. current->mm->context.interp_fdpic_loadmap = (unsigned long) sp;
  445. }
  446. /* force 16 byte _final_ alignment here for generality */
  447. #define DLINFO_ITEMS 13
  448. nitems = 1 + DLINFO_ITEMS + (k_platform ? 1 : 0);
  449. #ifdef DLINFO_ARCH_ITEMS
  450. nitems += DLINFO_ARCH_ITEMS;
  451. #endif
  452. csp = sp;
  453. sp -= nitems * 2 * sizeof(unsigned long);
  454. sp -= (bprm->envc + 1) * sizeof(char *); /* envv[] */
  455. sp -= (bprm->argc + 1) * sizeof(char *); /* argv[] */
  456. sp -= 1 * sizeof(unsigned long); /* argc */
  457. csp -= sp & 15UL;
  458. sp -= sp & 15UL;
  459. /* put the ELF interpreter info on the stack */
  460. #define NEW_AUX_ENT(nr, id, val) \
  461. do { \
  462. struct { unsigned long _id, _val; } __user *ent; \
  463. \
  464. ent = (void __user *) csp; \
  465. __put_user((id), &ent[nr]._id); \
  466. __put_user((val), &ent[nr]._val); \
  467. } while (0)
  468. csp -= 2 * sizeof(unsigned long);
  469. NEW_AUX_ENT(0, AT_NULL, 0);
  470. if (k_platform) {
  471. csp -= 2 * sizeof(unsigned long);
  472. NEW_AUX_ENT(0, AT_PLATFORM,
  473. (elf_addr_t) (unsigned long) u_platform);
  474. }
  475. csp -= DLINFO_ITEMS * 2 * sizeof(unsigned long);
  476. NEW_AUX_ENT( 0, AT_HWCAP, hwcap);
  477. NEW_AUX_ENT( 1, AT_PAGESZ, PAGE_SIZE);
  478. NEW_AUX_ENT( 2, AT_CLKTCK, CLOCKS_PER_SEC);
  479. NEW_AUX_ENT( 3, AT_PHDR, exec_params->ph_addr);
  480. NEW_AUX_ENT( 4, AT_PHENT, sizeof(struct elf_phdr));
  481. NEW_AUX_ENT( 5, AT_PHNUM, exec_params->hdr.e_phnum);
  482. NEW_AUX_ENT( 6, AT_BASE, interp_params->elfhdr_addr);
  483. NEW_AUX_ENT( 7, AT_FLAGS, 0);
  484. NEW_AUX_ENT( 8, AT_ENTRY, exec_params->entry_addr);
  485. NEW_AUX_ENT( 9, AT_UID, (elf_addr_t) current->uid);
  486. NEW_AUX_ENT(10, AT_EUID, (elf_addr_t) current->euid);
  487. NEW_AUX_ENT(11, AT_GID, (elf_addr_t) current->gid);
  488. NEW_AUX_ENT(12, AT_EGID, (elf_addr_t) current->egid);
  489. #ifdef ARCH_DLINFO
  490. /* ARCH_DLINFO must come last so platform specific code can enforce
  491. * special alignment requirements on the AUXV if necessary (eg. PPC).
  492. */
  493. ARCH_DLINFO;
  494. #endif
  495. #undef NEW_AUX_ENT
  496. /* allocate room for argv[] and envv[] */
  497. csp -= (bprm->envc + 1) * sizeof(elf_caddr_t);
  498. envp = (elf_caddr_t __user *) csp;
  499. csp -= (bprm->argc + 1) * sizeof(elf_caddr_t);
  500. argv = (elf_caddr_t __user *) csp;
  501. /* stack argc */
  502. csp -= sizeof(unsigned long);
  503. __put_user(bprm->argc, (unsigned long __user *) csp);
  504. BUG_ON(csp != sp);
  505. /* fill in the argv[] array */
  506. #ifdef CONFIG_MMU
  507. current->mm->arg_start = bprm->p;
  508. #else
  509. current->mm->arg_start = current->mm->start_stack -
  510. (MAX_ARG_PAGES * PAGE_SIZE - bprm->p);
  511. #endif
  512. p = (char __user *) current->mm->arg_start;
  513. for (loop = bprm->argc; loop > 0; loop--) {
  514. __put_user((elf_caddr_t) p, argv++);
  515. len = strnlen_user(p, PAGE_SIZE * MAX_ARG_PAGES);
  516. if (!len || len > PAGE_SIZE * MAX_ARG_PAGES)
  517. return -EINVAL;
  518. p += len;
  519. }
  520. __put_user(NULL, argv);
  521. current->mm->arg_end = (unsigned long) p;
  522. /* fill in the envv[] array */
  523. current->mm->env_start = (unsigned long) p;
  524. for (loop = bprm->envc; loop > 0; loop--) {
  525. __put_user((elf_caddr_t)(unsigned long) p, envp++);
  526. len = strnlen_user(p, PAGE_SIZE * MAX_ARG_PAGES);
  527. if (!len || len > PAGE_SIZE * MAX_ARG_PAGES)
  528. return -EINVAL;
  529. p += len;
  530. }
  531. __put_user(NULL, envp);
  532. current->mm->env_end = (unsigned long) p;
  533. mm->start_stack = (unsigned long) sp;
  534. return 0;
  535. }
  536. /*****************************************************************************/
  537. /*
  538. * transfer the program arguments and environment from the holding pages onto
  539. * the stack
  540. */
  541. #ifndef CONFIG_MMU
  542. static int elf_fdpic_transfer_args_to_stack(struct linux_binprm *bprm,
  543. unsigned long *_sp)
  544. {
  545. unsigned long index, stop, sp;
  546. char *src;
  547. int ret = 0;
  548. stop = bprm->p >> PAGE_SHIFT;
  549. sp = *_sp;
  550. for (index = MAX_ARG_PAGES - 1; index >= stop; index--) {
  551. src = kmap(bprm->page[index]);
  552. sp -= PAGE_SIZE;
  553. if (copy_to_user((void *) sp, src, PAGE_SIZE) != 0)
  554. ret = -EFAULT;
  555. kunmap(bprm->page[index]);
  556. if (ret < 0)
  557. goto out;
  558. }
  559. *_sp = (*_sp - (MAX_ARG_PAGES * PAGE_SIZE - bprm->p)) & ~15;
  560. out:
  561. return ret;
  562. }
  563. #endif
  564. /*****************************************************************************/
  565. /*
  566. * load the appropriate binary image (executable or interpreter) into memory
  567. * - we assume no MMU is available
  568. * - if no other PIC bits are set in params->hdr->e_flags
  569. * - we assume that the LOADable segments in the binary are independently relocatable
  570. * - we assume R/O executable segments are shareable
  571. * - else
  572. * - we assume the loadable parts of the image to require fixed displacement
  573. * - the image is not shareable
  574. */
  575. static int elf_fdpic_map_file(struct elf_fdpic_params *params,
  576. struct file *file,
  577. struct mm_struct *mm,
  578. const char *what)
  579. {
  580. struct elf32_fdpic_loadmap *loadmap;
  581. #ifdef CONFIG_MMU
  582. struct elf32_fdpic_loadseg *mseg;
  583. #endif
  584. struct elf32_fdpic_loadseg *seg;
  585. struct elf32_phdr *phdr;
  586. unsigned long load_addr, stop;
  587. unsigned nloads, tmp;
  588. size_t size;
  589. int loop, ret;
  590. /* allocate a load map table */
  591. nloads = 0;
  592. for (loop = 0; loop < params->hdr.e_phnum; loop++)
  593. if (params->phdrs[loop].p_type == PT_LOAD)
  594. nloads++;
  595. if (nloads == 0)
  596. return -ELIBBAD;
  597. size = sizeof(*loadmap) + nloads * sizeof(*seg);
  598. loadmap = kzalloc(size, GFP_KERNEL);
  599. if (!loadmap)
  600. return -ENOMEM;
  601. params->loadmap = loadmap;
  602. loadmap->version = ELF32_FDPIC_LOADMAP_VERSION;
  603. loadmap->nsegs = nloads;
  604. load_addr = params->load_addr;
  605. seg = loadmap->segs;
  606. /* map the requested LOADs into the memory space */
  607. switch (params->flags & ELF_FDPIC_FLAG_ARRANGEMENT) {
  608. case ELF_FDPIC_FLAG_CONSTDISP:
  609. case ELF_FDPIC_FLAG_CONTIGUOUS:
  610. #ifndef CONFIG_MMU
  611. ret = elf_fdpic_map_file_constdisp_on_uclinux(params, file, mm);
  612. if (ret < 0)
  613. return ret;
  614. break;
  615. #endif
  616. default:
  617. ret = elf_fdpic_map_file_by_direct_mmap(params, file, mm);
  618. if (ret < 0)
  619. return ret;
  620. break;
  621. }
  622. /* map the entry point */
  623. if (params->hdr.e_entry) {
  624. seg = loadmap->segs;
  625. for (loop = loadmap->nsegs; loop > 0; loop--, seg++) {
  626. if (params->hdr.e_entry >= seg->p_vaddr &&
  627. params->hdr.e_entry < seg->p_vaddr + seg->p_memsz) {
  628. params->entry_addr =
  629. (params->hdr.e_entry - seg->p_vaddr) +
  630. seg->addr;
  631. break;
  632. }
  633. }
  634. }
  635. /* determine where the program header table has wound up if mapped */
  636. stop = params->hdr.e_phoff;
  637. stop += params->hdr.e_phnum * sizeof (struct elf_phdr);
  638. phdr = params->phdrs;
  639. for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) {
  640. if (phdr->p_type != PT_LOAD)
  641. continue;
  642. if (phdr->p_offset > params->hdr.e_phoff ||
  643. phdr->p_offset + phdr->p_filesz < stop)
  644. continue;
  645. seg = loadmap->segs;
  646. for (loop = loadmap->nsegs; loop > 0; loop--, seg++) {
  647. if (phdr->p_vaddr >= seg->p_vaddr &&
  648. phdr->p_vaddr + phdr->p_filesz <=
  649. seg->p_vaddr + seg->p_memsz) {
  650. params->ph_addr =
  651. (phdr->p_vaddr - seg->p_vaddr) +
  652. seg->addr +
  653. params->hdr.e_phoff - phdr->p_offset;
  654. break;
  655. }
  656. }
  657. break;
  658. }
  659. /* determine where the dynamic section has wound up if there is one */
  660. phdr = params->phdrs;
  661. for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) {
  662. if (phdr->p_type != PT_DYNAMIC)
  663. continue;
  664. seg = loadmap->segs;
  665. for (loop = loadmap->nsegs; loop > 0; loop--, seg++) {
  666. if (phdr->p_vaddr >= seg->p_vaddr &&
  667. phdr->p_vaddr + phdr->p_memsz <=
  668. seg->p_vaddr + seg->p_memsz) {
  669. params->dynamic_addr =
  670. (phdr->p_vaddr - seg->p_vaddr) +
  671. seg->addr;
  672. /* check the dynamic section contains at least
  673. * one item, and that the last item is a NULL
  674. * entry */
  675. if (phdr->p_memsz == 0 ||
  676. phdr->p_memsz % sizeof(Elf32_Dyn) != 0)
  677. goto dynamic_error;
  678. tmp = phdr->p_memsz / sizeof(Elf32_Dyn);
  679. if (((Elf32_Dyn *)
  680. params->dynamic_addr)[tmp - 1].d_tag != 0)
  681. goto dynamic_error;
  682. break;
  683. }
  684. }
  685. break;
  686. }
  687. /* now elide adjacent segments in the load map on MMU linux
  688. * - on uClinux the holes between may actually be filled with system
  689. * stuff or stuff from other processes
  690. */
  691. #ifdef CONFIG_MMU
  692. nloads = loadmap->nsegs;
  693. mseg = loadmap->segs;
  694. seg = mseg + 1;
  695. for (loop = 1; loop < nloads; loop++) {
  696. /* see if we have a candidate for merging */
  697. if (seg->p_vaddr - mseg->p_vaddr == seg->addr - mseg->addr) {
  698. load_addr = PAGE_ALIGN(mseg->addr + mseg->p_memsz);
  699. if (load_addr == (seg->addr & PAGE_MASK)) {
  700. mseg->p_memsz +=
  701. load_addr -
  702. (mseg->addr + mseg->p_memsz);
  703. mseg->p_memsz += seg->addr & ~PAGE_MASK;
  704. mseg->p_memsz += seg->p_memsz;
  705. loadmap->nsegs--;
  706. continue;
  707. }
  708. }
  709. mseg++;
  710. if (mseg != seg)
  711. *mseg = *seg;
  712. }
  713. #endif
  714. kdebug("Mapped Object [%s]:", what);
  715. kdebug("- elfhdr : %lx", params->elfhdr_addr);
  716. kdebug("- entry : %lx", params->entry_addr);
  717. kdebug("- PHDR[] : %lx", params->ph_addr);
  718. kdebug("- DYNAMIC[]: %lx", params->dynamic_addr);
  719. seg = loadmap->segs;
  720. for (loop = 0; loop < loadmap->nsegs; loop++, seg++)
  721. kdebug("- LOAD[%d] : %08x-%08x [va=%x ms=%x]",
  722. loop,
  723. seg->addr, seg->addr + seg->p_memsz - 1,
  724. seg->p_vaddr, seg->p_memsz);
  725. return 0;
  726. dynamic_error:
  727. printk("ELF FDPIC %s with invalid DYNAMIC section (inode=%lu)\n",
  728. what, file->f_path.dentry->d_inode->i_ino);
  729. return -ELIBBAD;
  730. }
  731. /*****************************************************************************/
  732. /*
  733. * map a file with constant displacement under uClinux
  734. */
  735. #ifndef CONFIG_MMU
  736. static int elf_fdpic_map_file_constdisp_on_uclinux(
  737. struct elf_fdpic_params *params,
  738. struct file *file,
  739. struct mm_struct *mm)
  740. {
  741. struct elf32_fdpic_loadseg *seg;
  742. struct elf32_phdr *phdr;
  743. unsigned long load_addr, base = ULONG_MAX, top = 0, maddr = 0, mflags;
  744. loff_t fpos;
  745. int loop, ret;
  746. load_addr = params->load_addr;
  747. seg = params->loadmap->segs;
  748. /* determine the bounds of the contiguous overall allocation we must
  749. * make */
  750. phdr = params->phdrs;
  751. for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) {
  752. if (params->phdrs[loop].p_type != PT_LOAD)
  753. continue;
  754. if (base > phdr->p_vaddr)
  755. base = phdr->p_vaddr;
  756. if (top < phdr->p_vaddr + phdr->p_memsz)
  757. top = phdr->p_vaddr + phdr->p_memsz;
  758. }
  759. /* allocate one big anon block for everything */
  760. mflags = MAP_PRIVATE;
  761. if (params->flags & ELF_FDPIC_FLAG_EXECUTABLE)
  762. mflags |= MAP_EXECUTABLE;
  763. down_write(&mm->mmap_sem);
  764. maddr = do_mmap(NULL, load_addr, top - base,
  765. PROT_READ | PROT_WRITE | PROT_EXEC, mflags, 0);
  766. up_write(&mm->mmap_sem);
  767. if (IS_ERR_VALUE(maddr))
  768. return (int) maddr;
  769. if (load_addr != 0)
  770. load_addr += PAGE_ALIGN(top - base);
  771. /* and then load the file segments into it */
  772. phdr = params->phdrs;
  773. for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) {
  774. if (params->phdrs[loop].p_type != PT_LOAD)
  775. continue;
  776. fpos = phdr->p_offset;
  777. seg->addr = maddr + (phdr->p_vaddr - base);
  778. seg->p_vaddr = phdr->p_vaddr;
  779. seg->p_memsz = phdr->p_memsz;
  780. ret = file->f_op->read(file, (void *) seg->addr,
  781. phdr->p_filesz, &fpos);
  782. if (ret < 0)
  783. return ret;
  784. /* map the ELF header address if in this segment */
  785. if (phdr->p_offset == 0)
  786. params->elfhdr_addr = seg->addr;
  787. /* clear any space allocated but not loaded */
  788. if (phdr->p_filesz < phdr->p_memsz)
  789. clear_user((void *) (seg->addr + phdr->p_filesz),
  790. phdr->p_memsz - phdr->p_filesz);
  791. if (mm) {
  792. if (phdr->p_flags & PF_X) {
  793. mm->start_code = seg->addr;
  794. mm->end_code = seg->addr + phdr->p_memsz;
  795. } else if (!mm->start_data) {
  796. mm->start_data = seg->addr;
  797. #ifndef CONFIG_MMU
  798. mm->end_data = seg->addr + phdr->p_memsz;
  799. #endif
  800. }
  801. #ifdef CONFIG_MMU
  802. if (seg->addr + phdr->p_memsz > mm->end_data)
  803. mm->end_data = seg->addr + phdr->p_memsz;
  804. #endif
  805. }
  806. seg++;
  807. }
  808. return 0;
  809. }
  810. #endif
  811. /*****************************************************************************/
  812. /*
  813. * map a binary by direct mmap() of the individual PT_LOAD segments
  814. */
  815. static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params,
  816. struct file *file,
  817. struct mm_struct *mm)
  818. {
  819. struct elf32_fdpic_loadseg *seg;
  820. struct elf32_phdr *phdr;
  821. unsigned long load_addr, delta_vaddr;
  822. int loop, dvset;
  823. load_addr = params->load_addr;
  824. delta_vaddr = 0;
  825. dvset = 0;
  826. seg = params->loadmap->segs;
  827. /* deal with each load segment separately */
  828. phdr = params->phdrs;
  829. for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) {
  830. unsigned long maddr, disp, excess, excess1;
  831. int prot = 0, flags;
  832. if (phdr->p_type != PT_LOAD)
  833. continue;
  834. kdebug("[LOAD] va=%lx of=%lx fs=%lx ms=%lx",
  835. (unsigned long) phdr->p_vaddr,
  836. (unsigned long) phdr->p_offset,
  837. (unsigned long) phdr->p_filesz,
  838. (unsigned long) phdr->p_memsz);
  839. /* determine the mapping parameters */
  840. if (phdr->p_flags & PF_R) prot |= PROT_READ;
  841. if (phdr->p_flags & PF_W) prot |= PROT_WRITE;
  842. if (phdr->p_flags & PF_X) prot |= PROT_EXEC;
  843. flags = MAP_PRIVATE | MAP_DENYWRITE;
  844. if (params->flags & ELF_FDPIC_FLAG_EXECUTABLE)
  845. flags |= MAP_EXECUTABLE;
  846. maddr = 0;
  847. switch (params->flags & ELF_FDPIC_FLAG_ARRANGEMENT) {
  848. case ELF_FDPIC_FLAG_INDEPENDENT:
  849. /* PT_LOADs are independently locatable */
  850. break;
  851. case ELF_FDPIC_FLAG_HONOURVADDR:
  852. /* the specified virtual address must be honoured */
  853. maddr = phdr->p_vaddr;
  854. flags |= MAP_FIXED;
  855. break;
  856. case ELF_FDPIC_FLAG_CONSTDISP:
  857. /* constant displacement
  858. * - can be mapped anywhere, but must be mapped as a
  859. * unit
  860. */
  861. if (!dvset) {
  862. maddr = load_addr;
  863. delta_vaddr = phdr->p_vaddr;
  864. dvset = 1;
  865. } else {
  866. maddr = load_addr + phdr->p_vaddr - delta_vaddr;
  867. flags |= MAP_FIXED;
  868. }
  869. break;
  870. case ELF_FDPIC_FLAG_CONTIGUOUS:
  871. /* contiguity handled later */
  872. break;
  873. default:
  874. BUG();
  875. }
  876. maddr &= PAGE_MASK;
  877. /* create the mapping */
  878. disp = phdr->p_vaddr & ~PAGE_MASK;
  879. down_write(&mm->mmap_sem);
  880. maddr = do_mmap(file, maddr, phdr->p_memsz + disp, prot, flags,
  881. phdr->p_offset - disp);
  882. up_write(&mm->mmap_sem);
  883. kdebug("mmap[%d] <file> sz=%lx pr=%x fl=%x of=%lx --> %08lx",
  884. loop, phdr->p_memsz + disp, prot, flags,
  885. phdr->p_offset - disp, maddr);
  886. if (IS_ERR_VALUE(maddr))
  887. return (int) maddr;
  888. if ((params->flags & ELF_FDPIC_FLAG_ARRANGEMENT) ==
  889. ELF_FDPIC_FLAG_CONTIGUOUS)
  890. load_addr += PAGE_ALIGN(phdr->p_memsz + disp);
  891. seg->addr = maddr + disp;
  892. seg->p_vaddr = phdr->p_vaddr;
  893. seg->p_memsz = phdr->p_memsz;
  894. /* map the ELF header address if in this segment */
  895. if (phdr->p_offset == 0)
  896. params->elfhdr_addr = seg->addr;
  897. /* clear the bit between beginning of mapping and beginning of
  898. * PT_LOAD */
  899. if (prot & PROT_WRITE && disp > 0) {
  900. kdebug("clear[%d] ad=%lx sz=%lx", loop, maddr, disp);
  901. clear_user((void __user *) maddr, disp);
  902. maddr += disp;
  903. }
  904. /* clear any space allocated but not loaded
  905. * - on uClinux we can just clear the lot
  906. * - on MMU linux we'll get a SIGBUS beyond the last page
  907. * extant in the file
  908. */
  909. excess = phdr->p_memsz - phdr->p_filesz;
  910. excess1 = PAGE_SIZE - ((maddr + phdr->p_filesz) & ~PAGE_MASK);
  911. #ifdef CONFIG_MMU
  912. if (excess > excess1) {
  913. unsigned long xaddr = maddr + phdr->p_filesz + excess1;
  914. unsigned long xmaddr;
  915. flags |= MAP_FIXED | MAP_ANONYMOUS;
  916. down_write(&mm->mmap_sem);
  917. xmaddr = do_mmap(NULL, xaddr, excess - excess1,
  918. prot, flags, 0);
  919. up_write(&mm->mmap_sem);
  920. kdebug("mmap[%d] <anon>"
  921. " ad=%lx sz=%lx pr=%x fl=%x of=0 --> %08lx",
  922. loop, xaddr, excess - excess1, prot, flags,
  923. xmaddr);
  924. if (xmaddr != xaddr)
  925. return -ENOMEM;
  926. }
  927. if (prot & PROT_WRITE && excess1 > 0) {
  928. kdebug("clear[%d] ad=%lx sz=%lx",
  929. loop, maddr + phdr->p_filesz, excess1);
  930. clear_user((void __user *) maddr + phdr->p_filesz,
  931. excess1);
  932. }
  933. #else
  934. if (excess > 0) {
  935. kdebug("clear[%d] ad=%lx sz=%lx",
  936. loop, maddr + phdr->p_filesz, excess);
  937. clear_user((void *) maddr + phdr->p_filesz, excess);
  938. }
  939. #endif
  940. if (mm) {
  941. if (phdr->p_flags & PF_X) {
  942. mm->start_code = maddr;
  943. mm->end_code = maddr + phdr->p_memsz;
  944. } else if (!mm->start_data) {
  945. mm->start_data = maddr;
  946. mm->end_data = maddr + phdr->p_memsz;
  947. }
  948. }
  949. seg++;
  950. }
  951. return 0;
  952. }
  953. /*****************************************************************************/
  954. /*
  955. * ELF-FDPIC core dumper
  956. *
  957. * Modelled on fs/exec.c:aout_core_dump()
  958. * Jeremy Fitzhardinge <jeremy@sw.oz.au>
  959. *
  960. * Modelled on fs/binfmt_elf.c core dumper
  961. */
  962. #if defined(USE_ELF_CORE_DUMP) && defined(CONFIG_ELF_CORE)
  963. /*
  964. * These are the only things you should do on a core-file: use only these
  965. * functions to write out all the necessary info.
  966. */
  967. static int dump_write(struct file *file, const void *addr, int nr)
  968. {
  969. return file->f_op->write(file, addr, nr, &file->f_pos) == nr;
  970. }
  971. static int dump_seek(struct file *file, loff_t off)
  972. {
  973. if (file->f_op->llseek) {
  974. if (file->f_op->llseek(file, off, SEEK_SET) != off)
  975. return 0;
  976. } else {
  977. file->f_pos = off;
  978. }
  979. return 1;
  980. }
  981. /*
  982. * Decide whether a segment is worth dumping; default is yes to be
  983. * sure (missing info is worse than too much; etc).
  984. * Personally I'd include everything, and use the coredump limit...
  985. *
  986. * I think we should skip something. But I am not sure how. H.J.
  987. */
  988. static int maydump(struct vm_area_struct *vma)
  989. {
  990. /* Do not dump I/O mapped devices or special mappings */
  991. if (vma->vm_flags & (VM_IO | VM_RESERVED)) {
  992. kdcore("%08lx: %08lx: no (IO)", vma->vm_start, vma->vm_flags);
  993. return 0;
  994. }
  995. /* If we may not read the contents, don't allow us to dump
  996. * them either. "dump_write()" can't handle it anyway.
  997. */
  998. if (!(vma->vm_flags & VM_READ)) {
  999. kdcore("%08lx: %08lx: no (!read)", vma->vm_start, vma->vm_flags);
  1000. return 0;
  1001. }
  1002. /* Dump shared memory only if mapped from an anonymous file. */
  1003. if (vma->vm_flags & VM_SHARED) {
  1004. if (vma->vm_file->f_path.dentry->d_inode->i_nlink == 0) {
  1005. kdcore("%08lx: %08lx: no (share)", vma->vm_start, vma->vm_flags);
  1006. return 1;
  1007. }
  1008. kdcore("%08lx: %08lx: no (share)", vma->vm_start, vma->vm_flags);
  1009. return 0;
  1010. }
  1011. #ifdef CONFIG_MMU
  1012. /* If it hasn't been written to, don't write it out */
  1013. if (!vma->anon_vma) {
  1014. kdcore("%08lx: %08lx: no (!anon)", vma->vm_start, vma->vm_flags);
  1015. return 0;
  1016. }
  1017. #endif
  1018. kdcore("%08lx: %08lx: yes", vma->vm_start, vma->vm_flags);
  1019. return 1;
  1020. }
  1021. /* An ELF note in memory */
  struct memelfnote {
      const char *name;       /* note name string */
      int type;               /* note type (NT_xxx) */
      unsigned int datasz;    /* size of the payload in bytes */
      void *data;             /* payload */
  };
  1029. static int notesize(struct memelfnote *en)
  1030. {
  1031. int sz;
  1032. sz = sizeof(struct elf_note);
  1033. sz += roundup(strlen(en->name) + 1, 4);
  1034. sz += roundup(en->datasz, 4);
  1035. return sz;
  1036. }
  1037. /* #define DEBUG */
  1038. #define DUMP_WRITE(addr, nr) \
  1039. do { if (!dump_write(file, (addr), (nr))) return 0; } while(0)
  1040. #define DUMP_SEEK(off) \
  1041. do { if (!dump_seek(file, (off))) return 0; } while(0)
  1042. static int writenote(struct memelfnote *men, struct file *file)
  1043. {
  1044. struct elf_note en;
  1045. en.n_namesz = strlen(men->name) + 1;
  1046. en.n_descsz = men->datasz;
  1047. en.n_type = men->type;
  1048. DUMP_WRITE(&en, sizeof(en));
  1049. DUMP_WRITE(men->name, en.n_namesz);
  1050. /* XXX - cast from long long to long to avoid need for libgcc.a */
  1051. DUMP_SEEK(roundup((unsigned long)file->f_pos, 4)); /* XXX */
  1052. DUMP_WRITE(men->data, men->datasz);
  1053. DUMP_SEEK(roundup((unsigned long)file->f_pos, 4)); /* XXX */
  1054. return 1;
  1055. }
  #undef DUMP_WRITE
  #undef DUMP_SEEK

  /*
   * Core-dump output helpers for the functions below.
   *
   * Both expect `file` and an `end_coredump` label in the enclosing
   * function; DUMP_WRITE additionally expects `size` and `limit` and
   * charges @nr bytes against the limit before writing.
   *
   * They are wrapped in do { } while (0) so each use behaves as a single
   * statement and cannot capture a following `else`.  Callers terminate the
   * invocation with a semicolon.
   */
  #define DUMP_WRITE(addr, nr)                                \
      do {                                                    \
          if ((size += (nr)) > limit ||                       \
              !dump_write(file, (addr), (nr)))                \
              goto end_coredump;                              \
      } while (0)

  #define DUMP_SEEK(off)                                      \
      do {                                                    \
          if (!dump_seek(file, (off)))                        \
              goto end_coredump;                              \
      } while (0)
  1064. static inline void fill_elf_fdpic_header(struct elfhdr *elf, int segs)
  1065. {
  1066. memcpy(elf->e_ident, ELFMAG, SELFMAG);
  1067. elf->e_ident[EI_CLASS] = ELF_CLASS;
  1068. elf->e_ident[EI_DATA] = ELF_DATA;
  1069. elf->e_ident[EI_VERSION] = EV_CURRENT;
  1070. elf->e_ident[EI_OSABI] = ELF_OSABI;
  1071. memset(elf->e_ident+EI_PAD, 0, EI_NIDENT-EI_PAD);
  1072. elf->e_type = ET_CORE;
  1073. elf->e_machine = ELF_ARCH;
  1074. elf->e_version = EV_CURRENT;
  1075. elf->e_entry = 0;
  1076. elf->e_phoff = sizeof(struct elfhdr);
  1077. elf->e_shoff = 0;
  1078. elf->e_flags = ELF_FDPIC_CORE_EFLAGS;
  1079. elf->e_ehsize = sizeof(struct elfhdr);
  1080. elf->e_phentsize = sizeof(struct elf_phdr);
  1081. elf->e_phnum = segs;
  1082. elf->e_shentsize = 0;
  1083. elf->e_shnum = 0;
  1084. elf->e_shstrndx = 0;
  1085. return;
  1086. }
  1087. static inline void fill_elf_note_phdr(struct elf_phdr *phdr, int sz, loff_t offset)
  1088. {
  1089. phdr->p_type = PT_NOTE;
  1090. phdr->p_offset = offset;
  1091. phdr->p_vaddr = 0;
  1092. phdr->p_paddr = 0;
  1093. phdr->p_filesz = sz;
  1094. phdr->p_memsz = 0;
  1095. phdr->p_flags = 0;
  1096. phdr->p_align = 0;
  1097. return;
  1098. }
  1099. static inline void fill_note(struct memelfnote *note, const char *name, int type,
  1100. unsigned int sz, void *data)
  1101. {
  1102. note->name = name;
  1103. note->type = type;
  1104. note->datasz = sz;
  1105. note->data = data;
  1106. return;
  1107. }
  1108. /*
  1109. * fill up all the fields in prstatus from the given task struct, except
  1110. * registers which need to be filled up seperately.
  1111. */
  1112. static void fill_prstatus(struct elf_prstatus *prstatus,
  1113. struct task_struct *p, long signr)
  1114. {
  1115. prstatus->pr_info.si_signo = prstatus->pr_cursig = signr;
  1116. prstatus->pr_sigpend = p->pending.signal.sig[0];
  1117. prstatus->pr_sighold = p->blocked.sig[0];
  1118. prstatus->pr_pid = p->pid;
  1119. prstatus->pr_ppid = p->parent->pid;
  1120. prstatus->pr_pgrp = process_group(p);
  1121. prstatus->pr_sid = process_session(p);
  1122. if (thread_group_leader(p)) {
  1123. /*
  1124. * This is the record for the group leader. Add in the
  1125. * cumulative times of previous dead threads. This total
  1126. * won't include the time of each live thread whose state
  1127. * is included in the core dump. The final total reported
  1128. * to our parent process when it calls wait4 will include
  1129. * those sums as well as the little bit more time it takes
  1130. * this and each other thread to finish dying after the
  1131. * core dump synchronization phase.
  1132. */
  1133. cputime_to_timeval(cputime_add(p->utime, p->signal->utime),
  1134. &prstatus->pr_utime);
  1135. cputime_to_timeval(cputime_add(p->stime, p->signal->stime),
  1136. &prstatus->pr_stime);
  1137. } else {
  1138. cputime_to_timeval(p->utime, &prstatus->pr_utime);
  1139. cputime_to_timeval(p->stime, &prstatus->pr_stime);
  1140. }
  1141. cputime_to_timeval(p->signal->cutime, &prstatus->pr_cutime);
  1142. cputime_to_timeval(p->signal->cstime, &prstatus->pr_cstime);
  1143. prstatus->pr_exec_fdpic_loadmap = p->mm->context.exec_fdpic_loadmap;
  1144. prstatus->pr_interp_fdpic_loadmap = p->mm->context.interp_fdpic_loadmap;
  1145. }
  1146. static int fill_psinfo(struct elf_prpsinfo *psinfo, struct task_struct *p,
  1147. struct mm_struct *mm)
  1148. {
  1149. unsigned int i, len;
  1150. /* first copy the parameters from user space */
  1151. memset(psinfo, 0, sizeof(struct elf_prpsinfo));
  1152. len = mm->arg_end - mm->arg_start;
  1153. if (len >= ELF_PRARGSZ)
  1154. len = ELF_PRARGSZ - 1;
  1155. if (copy_from_user(&psinfo->pr_psargs,
  1156. (const char __user *) mm->arg_start, len))
  1157. return -EFAULT;
  1158. for (i = 0; i < len; i++)
  1159. if (psinfo->pr_psargs[i] == 0)
  1160. psinfo->pr_psargs[i] = ' ';
  1161. psinfo->pr_psargs[len] = 0;
  1162. psinfo->pr_pid = p->pid;
  1163. psinfo->pr_ppid = p->parent->pid;
  1164. psinfo->pr_pgrp = process_group(p);
  1165. psinfo->pr_sid = process_session(p);
  1166. i = p->state ? ffz(~p->state) + 1 : 0;
  1167. psinfo->pr_state = i;
  1168. psinfo->pr_sname = (i > 5) ? '.' : "RSDTZW"[i];
  1169. psinfo->pr_zomb = psinfo->pr_sname == 'Z';
  1170. psinfo->pr_nice = task_nice(p);
  1171. psinfo->pr_flag = p->flags;
  1172. SET_UID(psinfo->pr_uid, p->uid);
  1173. SET_GID(psinfo->pr_gid, p->gid);
  1174. strncpy(psinfo->pr_fname, p->comm, sizeof(psinfo->pr_fname));
  1175. return 0;
  1176. }
  1177. /* Here is the structure in which status of each thread is captured. */
  1178. struct elf_thread_status
  1179. {
  1180. struct list_head list;
  1181. struct elf_prstatus prstatus; /* NT_PRSTATUS */
  1182. elf_fpregset_t fpu; /* NT_PRFPREG */
  1183. struct task_struct *thread;
  1184. #ifdef ELF_CORE_COPY_XFPREGS
  1185. elf_fpxregset_t xfpu; /* NT_PRXFPREG */
  1186. #endif
  1187. struct memelfnote notes[3];
  1188. int num_notes;
  1189. };
  1190. /*
  1191. * In order to add the specific thread information for the elf file format,
  1192. * we need to keep a linked list of every thread's pr_status and then create
  1193. * a single section for them in the final core file.
  1194. */
  1195. static int elf_dump_thread_status(long signr, struct elf_thread_status *t)
  1196. {
  1197. struct task_struct *p = t->thread;
  1198. int sz = 0;
  1199. t->num_notes = 0;
  1200. fill_prstatus(&t->prstatus, p, signr);
  1201. elf_core_copy_task_regs(p, &t->prstatus.pr_reg);
  1202. fill_note(&t->notes[0], "CORE", NT_PRSTATUS, sizeof(t->prstatus),
  1203. &t->prstatus);
  1204. t->num_notes++;
  1205. sz += notesize(&t->notes[0]);
  1206. t->prstatus.pr_fpvalid = elf_core_copy_task_fpregs(p, NULL, &t->fpu);
  1207. if (t->prstatus.pr_fpvalid) {
  1208. fill_note(&t->notes[1], "CORE", NT_PRFPREG, sizeof(t->fpu),
  1209. &t->fpu);
  1210. t->num_notes++;
  1211. sz += notesize(&t->notes[1]);
  1212. }
  1213. #ifdef ELF_CORE_COPY_XFPREGS
  1214. if (elf_core_copy_task_xfpregs(p, &t->xfpu)) {
  1215. fill_note(&t->notes[2], "LINUX", NT_PRXFPREG, sizeof(t->xfpu),
  1216. &t->xfpu);
  1217. t->num_notes++;
  1218. sz += notesize(&t->notes[2]);
  1219. }
  1220. #endif
  1221. return sz;
  1222. }
  1223. /*
  1224. * dump the segments for an MMU process
  1225. */
  1226. #ifdef CONFIG_MMU
  1227. static int elf_fdpic_dump_segments(struct file *file, struct mm_struct *mm,
  1228. size_t *size, unsigned long *limit)
  1229. {
  1230. struct vm_area_struct *vma;
  1231. for (vma = current->mm->mmap; vma; vma = vma->vm_next) {
  1232. unsigned long addr;
  1233. if (!maydump(vma))
  1234. continue;
  1235. for (addr = vma->vm_start;
  1236. addr < vma->vm_end;
  1237. addr += PAGE_SIZE
  1238. ) {
  1239. struct vm_area_struct *vma;
  1240. struct page *page;
  1241. if (get_user_pages(current, current->mm, addr, 1, 0, 1,
  1242. &page, &vma) <= 0) {
  1243. DUMP_SEEK(file->f_pos + PAGE_SIZE);
  1244. }
  1245. else if (page == ZERO_PAGE(addr)) {
  1246. DUMP_SEEK(file->f_pos + PAGE_SIZE);
  1247. page_cache_release(page);
  1248. }
  1249. else {
  1250. void *kaddr;
  1251. flush_cache_page(vma, addr, page_to_pfn(page));
  1252. kaddr = kmap(page);
  1253. if ((*size += PAGE_SIZE) > *limit ||
  1254. !dump_write(file, kaddr, PAGE_SIZE)
  1255. ) {
  1256. kunmap(page);
  1257. page_cache_release(page);
  1258. return -EIO;
  1259. }
  1260. kunmap(page);
  1261. page_cache_release(page);
  1262. }
  1263. }
  1264. }
  1265. return 0;
  1266. end_coredump:
  1267. return -EFBIG;
  1268. }
  1269. #endif
  1270. /*
  1271. * dump the segments for a NOMMU process
  1272. */
  1273. #ifndef CONFIG_MMU
  1274. static int elf_fdpic_dump_segments(struct file *file, struct mm_struct *mm,
  1275. size_t *size, unsigned long *limit)
  1276. {
  1277. struct vm_list_struct *vml;
  1278. for (vml = current->mm->context.vmlist; vml; vml = vml->next) {
  1279. struct vm_area_struct *vma = vml->vma;
  1280. if (!maydump(vma))
  1281. continue;
  1282. if ((*size += PAGE_SIZE) > *limit)
  1283. return -EFBIG;
  1284. if (!dump_write(file, (void *) vma->vm_start,
  1285. vma->vm_end - vma->vm_start))
  1286. return -EIO;
  1287. }
  1288. return 0;
  1289. }
  1290. #endif
  1291. /*
  1292. * Actual dumper
  1293. *
  1294. * This is a two-pass process; first we find the offsets of the bits,
  1295. * and then they are actually written out. If we run out of core limit
  1296. * we just truncate.
  1297. */
  1298. static int elf_fdpic_core_dump(long signr, struct pt_regs *regs,
  1299. struct file *file)
  1300. {
  1301. #define NUM_NOTES 6
  1302. int has_dumped = 0;
  1303. mm_segment_t fs;
  1304. int segs;
  1305. size_t size = 0;
  1306. int i;
  1307. struct vm_area_struct *vma;
  1308. struct elfhdr *elf = NULL;
  1309. loff_t offset = 0, dataoff;
  1310. unsigned long limit = current->signal->rlim[RLIMIT_CORE].rlim_cur;
  1311. int numnote;
  1312. struct memelfnote *notes = NULL;
  1313. struct elf_prstatus *prstatus = NULL; /* NT_PRSTATUS */
  1314. struct elf_prpsinfo *psinfo = NULL; /* NT_PRPSINFO */
  1315. struct task_struct *g, *p;
  1316. LIST_HEAD(thread_list);
  1317. struct list_head *t;
  1318. elf_fpregset_t *fpu = NULL;
  1319. #ifdef ELF_CORE_COPY_XFPREGS
  1320. elf_fpxregset_t *xfpu = NULL;
  1321. #endif
  1322. int thread_status_size = 0;
  1323. #ifndef CONFIG_MMU
  1324. struct vm_list_struct *vml;
  1325. #endif
  1326. elf_addr_t *auxv;
  1327. /*
  1328. * We no longer stop all VM operations.
  1329. *
  1330. * This is because those proceses that could possibly change map_count
  1331. * or the mmap / vma pages are now blocked in do_exit on current
  1332. * finishing this core dump.
  1333. *
  1334. * Only ptrace can touch these memory addresses, but it doesn't change
  1335. * the map_count or the pages allocated. So no possibility of crashing
  1336. * exists while dumping the mm->vm_next areas to the core file.
  1337. */
  1338. /* alloc memory for large data structures: too large to be on stack */
  1339. elf = kmalloc(sizeof(*elf), GFP_KERNEL);
  1340. if (!elf)
  1341. goto cleanup;
  1342. prstatus = kzalloc(sizeof(*prstatus), GFP_KERNEL);
  1343. if (!prstatus)
  1344. goto cleanup;
  1345. psinfo = kmalloc(sizeof(*psinfo), GFP_KERNEL);
  1346. if (!psinfo)
  1347. goto cleanup;
  1348. notes = kmalloc(NUM_NOTES * sizeof(struct memelfnote), GFP_KERNEL);
  1349. if (!notes)
  1350. goto cleanup;
  1351. fpu = kmalloc(sizeof(*fpu), GFP_KERNEL);
  1352. if (!fpu)
  1353. goto cleanup;
  1354. #ifdef ELF_CORE_COPY_XFPREGS
  1355. xfpu = kmalloc(sizeof(*xfpu), GFP_KERNEL);
  1356. if (!xfpu)
  1357. goto cleanup;
  1358. #endif
  1359. if (signr) {
  1360. struct elf_thread_status *tmp;
  1361. rcu_read_lock();
  1362. do_each_thread(g,p)
  1363. if (current->mm == p->mm && current != p) {
  1364. tmp = kzalloc(sizeof(*tmp), GFP_ATOMIC);
  1365. if (!tmp) {
  1366. rcu_read_unlock();
  1367. goto cleanup;
  1368. }
  1369. tmp->thread = p;
  1370. list_add(&tmp->list, &thread_list);
  1371. }
  1372. while_each_thread(g,p);
  1373. rcu_read_unlock();
  1374. list_for_each(t, &thread_list) {
  1375. struct elf_thread_status *tmp;
  1376. int sz;
  1377. tmp = list_entry(t, struct elf_thread_status, list);
  1378. sz = elf_dump_thread_status(signr, tmp);
  1379. thread_status_size += sz;
  1380. }
  1381. }
  1382. /* now collect the dump for the current */
  1383. fill_prstatus(prstatus, current, signr);
  1384. elf_core_copy_regs(&prstatus->pr_reg, regs);
  1385. #ifdef CONFIG_MMU
  1386. segs = current->mm->map_count;
  1387. #else
  1388. segs = 0;
  1389. for (vml = current->mm->context.vmlist; vml; vml = vml->next)
  1390. segs++;
  1391. #endif
  1392. #ifdef ELF_CORE_EXTRA_PHDRS
  1393. segs += ELF_CORE_EXTRA_PHDRS;
  1394. #endif
  1395. /* Set up header */
  1396. fill_elf_fdpic_header(elf, segs + 1); /* including notes section */
  1397. has_dumped = 1;
  1398. current->flags |= PF_DUMPCORE;
  1399. /*
  1400. * Set up the notes in similar form to SVR4 core dumps made
  1401. * with info from their /proc.
  1402. */
  1403. fill_note(notes + 0, "CORE", NT_PRSTATUS, sizeof(*prstatus), prstatus);
  1404. fill_psinfo(psinfo, current->group_leader, current->mm);
  1405. fill_note(notes + 1, "CORE", NT_PRPSINFO, sizeof(*psinfo), psinfo);
  1406. numnote = 2;
  1407. auxv = (elf_addr_t *) current->mm->saved_auxv;
  1408. i = 0;
  1409. do
  1410. i += 2;
  1411. while (auxv[i - 2] != AT_NULL);
  1412. fill_note(&notes[numnote++], "CORE", NT_AUXV,
  1413. i * sizeof(elf_addr_t), auxv);
  1414. /* Try to dump the FPU. */
  1415. if ((prstatus->pr_fpvalid =
  1416. elf_core_copy_task_fpregs(current, regs, fpu)))
  1417. fill_note(notes + numnote++,
  1418. "CORE", NT_PRFPREG, sizeof(*fpu), fpu);
  1419. #ifdef ELF_CORE_COPY_XFPREGS
  1420. if (elf_core_copy_task_xfpregs(current, xfpu))
  1421. fill_note(notes + numnote++,
  1422. "LINUX", NT_PRXFPREG, sizeof(*xfpu), xfpu);
  1423. #endif
  1424. fs = get_fs();
  1425. set_fs(KERNEL_DS);
  1426. DUMP_WRITE(elf, sizeof(*elf));
  1427. offset += sizeof(*elf); /* Elf header */
  1428. offset += (segs+1) * sizeof(struct elf_phdr); /* Program headers */
  1429. /* Write notes phdr entry */
  1430. {
  1431. struct elf_phdr phdr;
  1432. int sz = 0;
  1433. for (i = 0; i < numnote; i++)
  1434. sz += notesize(notes + i);
  1435. sz += thread_status_size;
  1436. fill_elf_note_phdr(&phdr, sz, offset);
  1437. offset += sz;
  1438. DUMP_WRITE(&phdr, sizeof(phdr));
  1439. }
  1440. /* Page-align dumped data */
  1441. dataoff = offset = roundup(offset, ELF_EXEC_PAGESIZE);
  1442. /* write program headers for segments dump */
  1443. for (
  1444. #ifdef CONFIG_MMU
  1445. vma = current->mm->mmap; vma; vma = vma->vm_next
  1446. #else
  1447. vml = current->mm->context.vmlist; vml; vml = vml->next
  1448. #endif
  1449. ) {
  1450. struct elf_phdr phdr;
  1451. size_t sz;
  1452. #ifndef CONFIG_MMU
  1453. vma = vml->vma;
  1454. #endif
  1455. sz = vma->vm_end - vma->vm_start;
  1456. phdr.p_type = PT_LOAD;
  1457. phdr.p_offset = offset;
  1458. phdr.p_vaddr = vma->vm_start;
  1459. phdr.p_paddr = 0;
  1460. phdr.p_filesz = maydump(vma) ? sz : 0;
  1461. phdr.p_memsz = sz;
  1462. offset += phdr.p_filesz;
  1463. phdr.p_flags = vma->vm_flags & VM_READ ? PF_R : 0;
  1464. if (vma->vm_flags & VM_WRITE)
  1465. phdr.p_flags |= PF_W;
  1466. if (vma->vm_flags & VM_EXEC)
  1467. phdr.p_flags |= PF_X;
  1468. phdr.p_align = ELF_EXEC_PAGESIZE;
  1469. DUMP_WRITE(&phdr, sizeof(phdr));
  1470. }
  1471. #ifdef ELF_CORE_WRITE_EXTRA_PHDRS
  1472. ELF_CORE_WRITE_EXTRA_PHDRS;
  1473. #endif
  1474. /* write out the notes section */
  1475. for (i = 0; i < numnote; i++)
  1476. if (!writenote(notes + i, file))
  1477. goto end_coredump;
  1478. /* write out the thread status notes section */
  1479. list_for_each(t, &thread_list) {
  1480. struct elf_thread_status *tmp =
  1481. list_entry(t, struct elf_thread_status, list);
  1482. for (i = 0; i < tmp->num_notes; i++)
  1483. if (!writenote(&tmp->notes[i], file))
  1484. goto end_coredump;
  1485. }
  1486. DUMP_SEEK(dataoff);
  1487. if (elf_fdpic_dump_segments(file, current->mm, &size, &limit) < 0)
  1488. goto end_coredump;
  1489. #ifdef ELF_CORE_WRITE_EXTRA_DATA
  1490. ELF_CORE_WRITE_EXTRA_DATA;
  1491. #endif
  1492. if (file->f_pos != offset) {
  1493. /* Sanity check */
  1494. printk(KERN_WARNING
  1495. "elf_core_dump: file->f_pos (%lld) != offset (%lld)\n",
  1496. file->f_pos, offset);
  1497. }
  1498. end_coredump:
  1499. set_fs(fs);
  1500. cleanup:
  1501. while (!list_empty(&thread_list)) {
  1502. struct list_head *tmp = thread_list.next;
  1503. list_del(tmp);
  1504. kfree(list_entry(tmp, struct elf_thread_status, list));
  1505. }
  1506. kfree(elf);
  1507. kfree(prstatus);
  1508. kfree(psinfo);
  1509. kfree(notes);
  1510. kfree(fpu);
  1511. #ifdef ELF_CORE_COPY_XFPREGS
  1512. kfree(xfpu);
  1513. #endif
  1514. return has_dumped;
  1515. #undef NUM_NOTES
  1516. }
  1517. #endif /* USE_ELF_CORE_DUMP */