elf loader now mostly supports 64b elfs
[akaros.git] / kern / src / elf.c
index 04fd504..0c56d94 100644 (file)
@@ -6,79 +6,94 @@
 #include <syscall.h>
 #include <elf.h>
 #include <pmap.h>
+#include <smp.h>
+#include <arch/arch.h>
 
-typedef struct
-{
-       long entry;
-       long highest_addr;
-       long phdr;
-       int phnum;
-       int dynamic;
-       char interp[256];
-} elf_info_t;
-
-static int
-load_one_elf(struct proc* p, struct file* f, int pgoffset, elf_info_t* ei)
+#ifdef KERN64
+# define elf_field(obj, field) (elf64 ? (obj##64)->field : (obj##32)->field)
+#else
+# define elf_field(obj, field) ((obj##32)->field)
+#endif
+
+static int load_one_elf(struct proc *p, struct file *f, int pgoffset,
+                        elf_info_t *ei)
 {
        int ret = -1;
        ei->phdr = -1;
        ei->dynamic = 0;
        ei->highest_addr = 0;
        off_t f_off = 0;
-       physaddr_t old_cr3 = rcr3();
-
-       /* Load the proc's address space, in case we need to directly write to its
-        * pages (like when we zero some of the BSS) */
-       lcr3(p->env_cr3);
 
-       // assume program headers fit in a page.
-       // if this isn't true, change the code below that maps in program headers
-       char* elf = (char*)kmalloc(PGSIZE,0);
-       if(!elf || f->f_op->read(f, elf, PGSIZE, &f_off) == -1)
+       /* assume program headers fit in a page.  if this isn't true, change the
+        * code below that maps in program headers */
+       char* elf = (char*)kmalloc(PGSIZE, 0);
+       
+       /* When reading on behalf of the kernel, we need to make sure no proc is
+        * "current".  This is a bit ghetto (TODO: KFOP) */
+       struct proc *cur_proc = current;
+       current = 0;
+       if (!elf || f->f_op->read(f, elf, PGSIZE, &f_off) == -1)
                goto fail;
+       current = cur_proc;
 
-       elf_t* elfhdr = (elf_t*)elf;
-       proghdr_t* proghdrs = (proghdr_t*)(elf+elfhdr->e_phoff);
-       if(elfhdr->e_phoff+elfhdr->e_phnum*sizeof(proghdr_t) > PGSIZE)
+       elf32_t* elfhdr32 = (elf32_t*)elf;
+       elf64_t* elfhdr64 = (elf64_t*)elf;
+       bool elf32 = elfhdr32->e_ident[ELF_IDENT_CLASS] == ELFCLASS32;
+       bool elf64 = elfhdr32->e_ident[ELF_IDENT_CLASS] == ELFCLASS64;
+       if (!elf64 && !elf32)
                goto fail;
-       if(elfhdr->e_phentsize != sizeof(proghdr_t))
+       #ifndef KERN64
+       if(elf64)
+               goto fail;
+       #endif
+       
+       proghdr32_t* proghdrs32 = (proghdr32_t*)(elf + elfhdr32->e_phoff);
+       proghdr64_t* proghdrs64 = (proghdr64_t*)(elf + elfhdr64->e_phoff);
+       uintptr_t e_phoff = elf_field(elfhdr, e_phoff);
+       size_t phsz = elf64 ? sizeof(proghdr64_t) : sizeof(proghdr32_t);
+       uint16_t e_phnum = elf_field(elfhdr, e_phnum);
+       // we don't support prog hdrs extending past the first elf page
+       if (e_phoff + e_phnum * phsz > PGSIZE)
                goto fail;
 
-       for(int i = 0; i < elfhdr->e_phnum; i++)
-       {
-               proghdr_t* ph = proghdrs+i;
-               if(ph->p_type == ELF_PROG_PHDR)
-                       ei->phdr = ph->p_va;
-               if(ph->p_type == ELF_PROG_INTERP)
-               {
-                       int maxlen = MIN(PGSIZE-ph->p_offset,sizeof(ei->interp));
-                       int len = strnlen(elf+ph->p_offset,maxlen);
-                       if(len < maxlen)
-                       {
-                               memcpy(ei->interp,elf+ph->p_offset,maxlen+1);
+       for (int i = 0; i < e_phnum; i++) {
+               proghdr32_t* ph32 = proghdrs32+i;
+               proghdr64_t* ph64 = proghdrs64+i;
+               uint16_t p_type = elf_field(ph, p_type);
+               uintptr_t p_va = elf_field(ph, p_va);
+               uintptr_t p_offset = elf_field(ph, p_offset);
+               uintptr_t p_align = elf_field(ph, p_align);
+               uintptr_t p_memsz = elf_field(ph, p_memsz);
+               uintptr_t p_filesz = elf_field(ph, p_filesz);
+
+               if (p_type == ELF_PROG_PHDR)
+                       ei->phdr = elf_field(ph, p_va);
+               if (p_type == ELF_PROG_INTERP) {
+                       int maxlen = MIN(PGSIZE - p_offset, sizeof(ei->interp));
+                       int len = strnlen(elf + p_offset, maxlen);
+                       if (len < maxlen) {
+                               memcpy(ei->interp, elf + p_offset, maxlen + 1);
                                ei->dynamic = 1;
                        }
                        else
                                goto fail;
                }
 
-               if(ph->p_type == ELF_PROG_LOAD && ph->p_memsz)
-               {
-                       if(ph->p_align % PGSIZE)
+               if (p_type == ELF_PROG_LOAD && p_memsz) {
+                       if (p_align % PGSIZE)
                                goto fail;
-                       if(ph->p_offset % PGSIZE != ph->p_va % PGSIZE)
+                       if (p_offset % PGSIZE != p_va % PGSIZE)
                                goto fail;
 
-                       uintptr_t filestart = ROUNDDOWN(ph->p_offset,PGSIZE);
-                       uintptr_t fileend = ph->p_offset+ph->p_filesz;
-                       uintptr_t filesz = fileend-filestart;
+                       uintptr_t filestart = ROUNDDOWN(p_offset, PGSIZE);
+                       uintptr_t fileend = p_offset + p_filesz;
+                       uintptr_t filesz = fileend - filestart;
 
-                       uintptr_t memstart = ROUNDDOWN(ph->p_va,PGSIZE);
-                       uintptr_t memend = ROUNDUP(ph->p_va + ph->p_memsz,PGSIZE);
-                       uintptr_t memsz = memend-memstart;
-                       if(memend > ei->highest_addr)
+                       uintptr_t memstart = ROUNDDOWN(p_va, PGSIZE);
+                       uintptr_t memend = ROUNDUP(p_va + p_memsz, PGSIZE);
+                       uintptr_t memsz = memend - memstart;
+                       if (memend > ei->highest_addr)
                                ei->highest_addr = memend;
-
                        /* This needs to be a PRIVATE mapping, and the stuff after the file
                         * needs to be zeroed. */
                        if (filesz) {
@@ -88,10 +103,15 @@ load_one_elf(struct proc* p, struct file* f, int pgoffset, elf_info_t* ei)
                                           f, filestart) == MAP_FAILED)
                                        goto fail;
                                /* Due to elf-ghetto-ness, we need to zero the first part of the
-                                * BSS from the last page of the data segment */
+                                * BSS from the last page of the data segment.  We translate to
+                                * the KVA so we don't need to worry about using the proc's
+                                * mapping */
                                uintptr_t z_s = memstart + pgoffset * PGSIZE + filesz;
-                               uintptr_t z_e = ROUNDUP(z_s, PGSIZE);
-                               memset((void*)z_s, 0, z_e - z_s);
+                               pte_t *pte = pgdir_walk(p->env_pgdir, (void*)z_s, 0);
+                               assert(pte);
+                               uintptr_t kva_z_s = (uintptr_t)ppn2kva(PTE2PPN(*pte)) + PGOFF(z_s);
+                               uintptr_t kva_z_e = ROUNDUP(kva_z_s, PGSIZE);
+                               memset((void*)kva_z_s, 0, kva_z_e - kva_z_s);
                                filesz = ROUNDUP(filesz, PGSIZE);
                        }
                        /* Any extra pages are mapped anonymously... (a bit weird) */
@@ -102,62 +122,59 @@ load_one_elf(struct proc* p, struct file* f, int pgoffset, elf_info_t* ei)
                                        goto fail;
                }
        }
-
-       // map in program headers anyway if not present in binary.
-       // useful for TLS in static programs.
-       if(ei->phdr == -1)
-       {
+       /* map in program headers anyway if not present in binary.
+        * useful for TLS in static programs. */
+       if (ei->phdr == -1) {
                void *phdr_addr = do_mmap(p, MMAP_LOWEST_VA, PGSIZE, PROT_READ, 0, f,
                                          0);
-               if(phdr_addr == MAP_FAILED)
+               if (phdr_addr == MAP_FAILED)
                        goto fail;
-               ei->phdr = (long)phdr_addr + elfhdr->e_phoff;
+               ei->phdr = (long)phdr_addr + e_phoff;
        }
-
-       ei->entry = elfhdr->e_entry + pgoffset*PGSIZE;
-       ei->phnum = elfhdr->e_phnum;
-
+       ei->entry = elf_field(elfhdr, e_entry) + pgoffset*PGSIZE;
+       ei->phnum = e_phnum;
+       ei->elf64 = elf64;
        ret = 0;
 fail:
        kfree(elf);
-       lcr3(old_cr3);
        return ret;
 }
 
 int load_elf(struct proc* p, struct file* f)
 {
-       elf_info_t ei,interp_ei;
-       if(load_one_elf(p,f,0,&ei))
+       elf_info_t ei, interp_ei;
+       if (load_one_elf(p, f, 0,& ei))
                return -1;
 
-       if(ei.dynamic)
-       {
-               warn("Convert me to use the filesystem!");
-               struct file* interp = file_open(ei.interp,0,0);
-               /* this will probably conflict with the mmap from the TLS up above */
-               if(interp == NULL || load_one_elf(p,interp,1,&interp_ei))
+       if (ei.dynamic) {
+               struct file *interp = do_file_open(ei.interp, 0, 0);
+               if (!interp)
+                       return -1;
+               /* careful, this could conflict with the mmap from the TLS up above */
+               int error = load_one_elf(p, interp, 2, &interp_ei);
+               kref_put(&interp->f_kref);
+               if (error)
                        return -1;
-               file_decref(interp);
        }
 
        // fill in auxiliary info for dynamic linker/runtime
-       elf_aux_t auxp[] = {{ELF_AUX_PHDR,ei.phdr},
-                           {ELF_AUX_PHENT,sizeof(proghdr_t)},
-                           {ELF_AUX_PHNUM,ei.phnum},
-                           {ELF_AUX_ENTRY,ei.entry},
+       elf_aux_t auxp[] = {{ELF_AUX_PHDR, ei.phdr},
+                           {ELF_AUX_PHENT, sizeof(proghdr32_t)},
+                           {ELF_AUX_PHNUM, ei.phnum},
+                           {ELF_AUX_ENTRY, ei.entry},
                            #ifdef __sparc_v8__
-                           {ELF_AUX_HWCAP,ELF_HWCAP_SPARC_FLUSH},
+                           {ELF_AUX_HWCAP, ELF_HWCAP_SPARC_FLUSH},
                            #endif
-                           {0,0}};
+                           {0, 0}};
 
        // put auxp after argv, envp in procinfo
        int auxp_pos = -1;
-       for(int i = 0, zeros = 0; i < PROCINFO_MAX_ARGP; i++)
-               if(p->procinfo->argp[i] == NULL)
-                       if(++zeros == 2)
-                               auxp_pos = i+1;
-       if(auxp_pos == -1 ||
-          auxp_pos+sizeof(auxp)/sizeof(char*) >= PROCINFO_MAX_ARGP)
+       for (int i = 0, zeros = 0; i < PROCINFO_MAX_ARGP; i++)
+               if (p->procinfo->argp[i] == NULL)
+                       if (++zeros == 2)
+                               auxp_pos = i + 1;
+       if (auxp_pos == -1 ||
+           auxp_pos + sizeof(auxp) / sizeof(char*) >= PROCINFO_MAX_ARGP)
                return -1;
        memcpy(p->procinfo->argp+auxp_pos,auxp,sizeof(auxp));
 
@@ -167,8 +184,8 @@ int load_elf(struct proc* p, struct file* f)
 
        // map in stack using POPULATE (because SPARC requires it)
        uintptr_t stacksz = USTACK_NUM_PAGES*PGSIZE;
-       if(do_mmap(p, USTACKTOP-stacksz, stacksz, PROT_READ | PROT_WRITE,
-                  MAP_FIXED | MAP_ANONYMOUS | MAP_POPULATE, NULL, 0) == MAP_FAILED)
+       if (do_mmap(p, USTACKTOP-stacksz, stacksz, PROT_READ | PROT_WRITE,
+                   MAP_FIXED | MAP_ANONYMOUS | MAP_POPULATE, NULL, 0) == MAP_FAILED)
                return -1;
 
        // Set the heap bottom and top to just past where the text