WebSVN – Kolibri OS – Path Comparison – / – /programs/system/os/modules.inc Rev 6766 and /programs/system/os/modules.inc Rev 6767

Regard whitespace Rev 6766 → Rev 6767

 /programs/system/os/modules.inc
 ,0 → 1,610
+; Module management, non-PE-specific code.
+; Works in conjunction with peloader.inc for PE-specific code.
+;  void* dlopen(const char* filename, int mode)
+;  Opens the module named filename and maps it in; returns a handle that can be
+;  passed to dlsym to get symbol values from it.
+;
+;  If filename starts with '/', it is treated as an absolute file name.
+;  Otherwise, dlopen searches for filename in predefined locations:
+;  /rd/1/lib, /kolibrios/lib, directory of the executable file.
+;  The current directory is *not* searched.
+;
+;  If the same module is loaded again with dlopen(), the same
+;  handle is returned.  The loader maintains reference
+;  counts for loaded modules, so a dynamically loaded module is
+;  not deallocated until dlclose() has been called on it as many times
+;  as dlopen() has succeeded on it.  Any initialization functions
+;  are called just once.
+;
+;  If dlopen() fails for any reason, it returns NULL.
+;
+;  mode is reserved and should be zero.
+proc dlopen stdcall uses esi edi, file, mode
+; void* dlopen(const char* filename, int mode)
+; in: file -> zero-terminated module name, mode = 0 (reserved)
+; out: eax = module base address (the handle), or NULL on any failure
+;
+; find_module_by_name and load_module do all the work.
+; We just need to validate the arguments, acquire/release the mutex
+; and adjust input/output.
+;
+; Bad arguments are rejected before the mutex is taken, so the early exit
+; has nothing to unlock. A NULL file name is refused here as well:
+; otherwise find_module_by_name would dereference it while scanning
+; for the base name, and the caller would fault instead of getting NULL.
+        cmp     [mode], 0
+        jnz     .invalid_arg
+        cmp     [file], 0
+        jz      .invalid_arg
+        mutex_lock modules_mutex
+        mov     edi, [file]
+        call    find_module_by_name
+        test    esi, esi
+        jnz     .inc_refcount
+; Not loaded yet: load_module returns eax -> MODULE or 0.
+        call    load_module
+        xor     edi, edi        ; result stays NULL if loading failed
+        test    eax, eax
+        jz      .unlock_return
+; The handle returned on success is module base address.
+; Unlike pointer to MODULE struct, it can be actually useful
+; for the caller as is.
+        mov     edi, [eax+MODULE.base]
+        jmp     .unlock_return
+.inc_refcount:
+; Already loaded: just take one more reference and return the same handle.
+        inc     [esi+MODULE.refcount]
+        mov     edi, [esi+MODULE.base]
+.unlock_return:
+; The result is kept in edi while the mutex is being released.
+        mutex_unlock modules_mutex
+        mov     eax, edi
+        ret
+.invalid_arg:
+        xor     eax, eax
+        ret
+endp
+;  int dlclose(void* handle)
+;  Decrements the reference count on the dynamically loaded module
+;  referred to by handle. If the reference count drops to zero,
+;  then the module is unloaded. All modules that were automatically loaded
+;  when dlopen() was invoked on the module referred to by handle are
+;  recursively closed in the same manner.
+;
+;  A successful return from dlclose() does not guarantee that the
+;  module has been actually removed from the caller's address space.
+;  In addition to references resulting from explicit dlopen() calls,
+;  a module may have been implicitly loaded (and reference counted)
+;  because of dependencies in other shared objects.
+;  Only when all references have been released can the module be removed
+;  from the address space.
+;  On success, dlclose() returns 0; on error, it returns a nonzero value.
+proc dlclose stdcall uses esi, handle
+; int dlclose(void* handle)
+; out: eax = 0 on success, 1 if handle does not match any loaded module
+;
+; All real work is delegated:
+;   find_module_by_addr translates the handle into a MODULE pointer,
+;   dereference_module drops one reference (unloading on the last one).
+; Both of them require modules_mutex, so apart from calling them
+; this function only acquires and releases the mutex.
+        mutex_lock modules_mutex
+        mov     ecx, [handle]
+        call    find_module_by_addr
+        test    esi, esi
+        jnz     .valid_handle
+; Unknown handle: nothing to release, report the failure.
+        mutex_unlock modules_mutex
+        mov     eax, 1
+        ret
+.valid_handle:
+        call    dereference_module
+        mutex_unlock modules_mutex
+        xor     eax, eax
+        ret
+endp
+;  void* dlsym(void* handle, const char* symbol)
+;  Obtains address of a symbol in a module.
+;  On failure, returns NULL.
+;
+;  symbol can also be a number between 0 and 0xFFFF;
+;  it is interpreted as an ordinal of a symbol.
+;  Low 64K of address space are blocked for the allocation,
+;  so a valid pointer cannot be less than 0x10000.
+;
+;  handle is not validated. Passing an invalid handle can result in a crash.
+proc dlsym stdcall, handle, symbol
+; NOTE(review): these locals are never referenced in this body;
+; presumably the helpers called below reach them through the shared
+; ebp frame, so their order must not change - confirm in peloader.inc.
+locals
+export_base             dd      ?
+export_ptr              dd      ?
+export_size             dd      ?
+import_module           dd      0
+endl
+; void* dlsym(void* handle, const char* symbol)
+; This is only a dispatcher, the helpers do the lookup.
+; The list of MODULEs is not browsed here, so modules_mutex is not taken.
+; Forwarded exports and error messages that need the module name
+; are expected to be handled inside get_exported_function_*.
+        mov     eax, [handle]
+        call    prepare_import_from_module
+; A value below 0x10000 cannot be a valid pointer,
+; so it is treated as an ordinal rather than a name.
+        mov     ecx, [symbol]
+        cmp     ecx, 0x10000
+        jae     .by_name
+        call    get_exported_function_by_ordinal
+        ret
+.by_name:
+        mov     edx, -1 ; no hint for lookup in name table
+        call    get_exported_function_by_name
+        ret
+endp
+; Errors happen.
+; Some errors should be reported to the user. Some errors are normal.
+; After the process has been initialized, we don't know what an error
+; should mean - is the failed DLL absolutely required or unimportant enhancement?
+; So we report an error to the caller and let it decide how to handle it.
+; However, when the process is initializing, there is no one to report to,
+; so we must inform the user ourselves.
+; In any case, write to the debug board - it is *debug* board, after all.
+;
+; This function is called whenever an error occurs in the loader.
+; Except errors in malloc/realloc - they shouldn't happen anyway,
+; and if they happened after all, we are screwed and likely will fail anyway,
+; so don't bother.
+; Variable number of arguments: strings to be concatenated, end with NULL.
+proc loader_say_error c uses ebx esi, first_msg, ...
+; in: NULL-terminated list of pointers to zero-terminated strings
+; The strings are concatenated into one heap buffer, written to the
+; debug board and, while the process is still initializing,
+; also handed to @notify. Nothing is reported if malloc fails.
+;
+; 1. Build the final message.
+; 1a. ebx = total length of all pieces, edx walks the argument list.
+        lea     edx, [first_msg]
+        xor     ebx, ebx
+.next_length:
+        mov     ecx, [edx]
+        test    ecx, ecx
+        jz      .length_done
+.measure:
+        cmp     byte [ecx], 0
+        jz      .measured
+        inc     ebx
+        inc     ecx
+        jmp     .measure
+.measured:
+        add     edx, 4
+        jmp     .next_length
+.length_done:
+        inc     ebx ; room for the terminating zero
+; 1b. Get the buffer; silently give up if there is no memory.
+        stdcall malloc, ebx
+        test    eax, eax
+        jz      .nothing
+        mov     esi, eax ; esi -> start of the message, eax = write cursor
+; 1c. Second pass over the arguments: append every piece.
+; ebx is free now, bl carries the current character.
+        lea     edx, [first_msg]
+.copy_arg:
+        mov     ecx, [edx]
+        test    ecx, ecx
+        jz      .data_done
+        jmp     .copy_test
+.copy_byte:
+        mov     [eax], bl
+        inc     eax
+        inc     ecx
+.copy_test:
+        mov     bl, [ecx]
+        test    bl, bl
+        jnz     .copy_byte
+        add     edx, 4
+        jmp     .copy_arg
+.data_done:
+        mov     byte [eax], 0 ; terminating zero
+; 2. Debug board output: prefix, message, newline.
+        mov     ecx, loader_debugboard_prefix
+        call    sys_msg_board_str
+        mov     ecx, esi
+        call    sys_msg_board_str
+        mov     ecx, msg_newline
+        call    sys_msg_board_str
+; 3. The user is informed only while the process is still initializing.
+        xor     eax, eax
+        cmp     [process_initialized], al
+        jnz     .no_report
+; Run @notify with the message as its command line.
+; The 28-byte parameter block for function 70.7 lives on the stack:
+;   +0  dword 7 (subfunction)     +4  dword flags = 0
+;   +8  dword command line        +12 two reserved dwords = 0
+;   +20 byte 0, followed at +21 by the pointer to the program name
+        sub     esp, 28
+        mov     ebx, esp
+        mov     dword [ebx], 7
+        mov     [ebx+4], eax
+        mov     [ebx+8], esi
+        mov     [ebx+12], eax
+        mov     [ebx+16], eax
+        mov     [ebx+20], eax
+        mov     [ebx+24], eax
+        mov     dword [ebx+21], notify_program
+        mov     eax, 70
+        call    FS_SYSCALL_PTR
+        add     esp, 28
+; The result is ignored: there is nothing we could do about a failure.
+.no_report:
+        stdcall free, esi
+.nothing:
+        ret
+endp
+; When the loader is initializing the process, errors can happen.
+; They should be reported to the user.
+; The main executable cannot do this, it is not initialized yet.
+; So we should do it ourselves.
+; However, after the process has been initialized, the main
+; executable gets the error from us and decides how to handle it.
+; loader_say_error above is the helper that is called whenever an error has occurred.
+; For now, we don't expect many modules in one process.
+; So, all modules are linked into a single list,
+; and lookup functions simply walk the entire list.
+; This should be revisited if dozens of modules would be typical.
+; This structure describes one loaded PE module.
+; malloc'd from the default heap,
+; includes variable-sized module path in the end.
+struct MODULE
+; All modules are linked in the global doubly-linked list with head at modules_list.
+next            dd      ?       ; next MODULE; the last one points back to modules_list
+prev            dd      ?       ; previous MODULE; load_module appends after [modules_list+MODULE.prev]
+base            dd      ?       ; base address; also the handle that dlopen returns
+size            dd      ?       ; size in memory
+refcount        dd      ?       ; reference counter; set to 1 by init_module_struct
+timestamp       dd      ?       ; for bound imports
+basedelta       dd      ?       ; base address - preferred address, for bound imports
+num_imports     dd      ?       ; number of used entries in the imports array
+imports         dd      ?       ; NULL until the first entry is added, then grown with realloc
+; imports is a pointer to array of pointers to MODULEs containing imported functions.
+; Used to unload all dependencies when the module is unloaded.
+; Contains all modules referenced by import table;
+; if the module forwards some export to another module,
+; then forward target is added to this array when forward source is requested.
+filename        dd      ?       ; pointer inside path array after dirname
+filenamelen     dd      ?       ; strlen(filename) + 1
+path            rb      0       ; zero-size marker: the zero-terminated path follows the fixed fields
+ends
+; Fills some fields in a new MODULE struct based on given PE image.
+; Assumes that MODULE.path has been filled during the allocation,
+; does not insert the structure in the common list, fills everything else.
+; in: eax -> MODULE
+; in: esi = module base
+proc init_module_struct
+; in: eax -> MODULE with MODULE.path already filled
+; in: esi = module base
+; Only eax, edx and esi are touched by the code visible here.
+;
+; 1. Locate the base name inside the path.
+; MODULE.filename starts at the beginning of the path and is moved
+; to the character following every '/' that the scan passes.
+        lea     edx, [eax+MODULE.path]
+.component_start:
+        mov     [eax+MODULE.filename], edx
+.next_char:
+        inc     edx
+        cmp     byte [edx-1], '/'
+        jz      .component_start
+        cmp     byte [edx-1], 0
+        jnz     .next_char
+; 2. edx is one past the terminating zero now,
+; so the difference is strlen(filename) + 1.
+        sub     edx, [eax+MODULE.filename]
+        mov     [eax+MODULE.filenamelen], edx
+; 3. The remaining non-PE-specific fields: one reference, no imports yet.
+        mov     [eax+MODULE.base], esi
+        mov     [eax+MODULE.refcount], 1
+        xor     edx, edx
+        mov     [eax+MODULE.num_imports], edx
+        mov     [eax+MODULE.imports], edx
+; 4. Let the PE-specific part do its job.
+; NOTE(review): there is no ret in this procedure; presumably the macro
+; below supplies the end of the function - confirm in peloader.inc.
+        init_module_struct_pe_specific
+endp
+; Helper function for dlclose and resolving forwarded exports from dlsym.
+; in: ecx = module base address
+; out: esi -> MODULE or esi = NULL
+; modules_mutex should be locked
+proc find_module_by_addr
+; in: ecx = module base address
+; out: esi -> MODULE with that base, or esi = NULL
+; The list is circular: the walk starts at the head
+; and stops as soon as it comes back to modules_list.
+        mov     esi, modules_list
+.next_module:
+        mov     esi, [esi+MODULE.next]
+        cmp     esi, modules_list
+        jz      .notfound
+        cmp     [esi+MODULE.base], ecx
+        jnz     .next_module
+        ret
+.notfound:
+        xor     esi, esi
+        ret
+endp
+; Helper function for whenever we have a module name
+; and want to check whether it is already loaded.
+; in: edi -> name with or without a path
+; out: esi -> MODULE or esi = NULL
+; modules_mutex should be locked
+proc find_module_by_name uses edi
+; in: edi -> name with or without a path
+; out: esi -> MODULE or esi = NULL; eax and ecx are not preserved
+;
+; 1. Reduce the name to its last path component.
+; eax runs over the string; every time it has just passed a '/',
+; edi is moved to the character that follows.
+        mov     eax, edi
+        jmp     .check_end
+.after_slash:
+        mov     edi, eax
+.check_end:
+        cmp     byte [eax], 0
+        jz      .basename_ready
+        inc     eax
+        cmp     byte [eax-1], '/'
+        jz      .after_slash
+        jmp     .check_end
+.basename_ready:
+; 2. Walk the circular list of modules, eax -> current MODULE.
+        mov     eax, modules_list
+.next_module:
+        mov     eax, [eax+MODULE.next]
+        cmp     eax, modules_list
+        jz      .notfound
+; Byte-wise comparison of base names over filenamelen bytes,
+; that is, including the terminating zero of the stored name.
+; edi is advanced by cmpsb, so it is saved around the comparison;
+; pop does not touch the flags that cmpsb leaves.
+        push    edi
+        mov     ecx, [eax+MODULE.filenamelen]
+        mov     esi, [eax+MODULE.filename]
+        repz cmpsb
+        pop     edi
+        jnz     .next_module
+        mov     esi, eax
+        ret
+.notfound:
+        xor     esi, esi
+        ret
+endp
+; Called when some module is implicitly loaded by another module,
+; either due to a record in import table,
+; or because some exported function forwards to another module.
+; Checks whether the target module has already been referenced
+; by the source module. The first reference is passed down
+; to load_module increasing refcount of the target and possibly
+; loading it if not yet, subsequent references just return
+; without modifying refcount.
+; We don't actually need to deduplicate DLLs from import table
+; as long as we decrement refcount on unload the same number of times
+; that we have incremented it on load.
+; However, we need to keep track of references to forward targets,
+; and we don't want to scan the entire export table and load all forward
+; targets just in case some of those would be useful,
+; so load them on-demand first time and ignore subsequent references.
+; To be consistent, do the same for import table too.
+;
+; in: esi -> source MODULE struct
+; in: edi -> target module name
+; out: eax -> imported MODULE, 0 on error
+; modules_mutex should be locked
+proc load_imported_module uses edi
+; 1. Find the target module in the loaded modules list.
+; If not found, go to 5.
+        push    esi             ; find_module_by_name returns its result in esi
+        call    find_module_by_name
+        test    esi, esi
+        mov     eax, esi        ; eax -> target MODULE or 0; mov and pop keep the flags of test
+        pop     esi             ; esi -> source MODULE again
+        jz      .load
+; 2. The module has been already loaded.
+; Now check whether it is already stored in imports array.
+; If yes, just return without doing anything.
+        mov     edi, [esi+MODULE.imports]
+        mov     ecx, [esi+MODULE.num_imports]
+        test    ecx, ecx
+        jz      .newref         ; empty array: do not run scasd over a NULL pointer
+        repnz scasd             ; look for the dword equal to eax among ecx entries
+        jz      .nothing        ; already recorded; eax still points to the target
+.newref:
+; The module is loaded, but not by us.
+; 3. Increment the reference counter of the target.
+        inc     [eax+MODULE.refcount]
+.add_to_imports:
+; 4. Add the new pointer to the imports array.
+; 4a. Check whether there is place in the array.
+; If so, go to 4c.
+; We don't want to reallocate too often, since reallocation
+; may involve copying our data to a new place.
+; We always reserve space that is a power of two; in this way,
+; the wasted space is never greater than the used space,
+; and total time of copying the data is O(number of modules).
+; The last fact is not really important right now,
+; since the current implementation of step 2 makes everything
+; quadratic and the number of modules is very small anyway,
+; but since this enhancement costs only a few instructions, why not?
+        mov     edi, eax        ; edi -> target MODULE, eax is needed for realloc
+; X is a power of two or zero if and only if (X and (X - 1)) is zero
+        mov     ecx, [esi+MODULE.num_imports]
+        lea     edx, [ecx-1]
+        test    ecx, edx
+        jnz     .has_space      ; not zero and not a power of two: the array is not full yet
+; 4b. Reallocate the imports array:
+; if the current size is zero, allocate 1 item,
+; otherwise double number of items.
+; Item size is 4 bytes.
+        lea     ecx, [ecx*8]    ; new size in bytes = (2 * num_imports) items * 4
+        test    ecx, ecx
+        jnz     @f
+        mov     ecx, 4          ; the very first item
+@@:
+        stdcall realloc, [esi+MODULE.imports], ecx
+        test    eax, eax
+        jz      .realloc_failed
+        mov     [esi+MODULE.imports], eax
+        mov     ecx, [esi+MODULE.num_imports]   ; reload the index after the call
+.has_space:
+; 4c. Append pointer to the target MODULE to imports array.
+        mov     eax, [esi+MODULE.imports]
+        mov     [eax+ecx*4], edi
+        inc     [esi+MODULE.num_imports]
+        mov     eax, edi        ; return value: the target MODULE
+.nothing:
+        ret
+.load:
+; 5. This is a totally new module. Load it.
+        call    load_module     ; edi still points to the target name here
+; On error, return it to the caller. On success, go to 4.
+        test    eax, eax
+        jz      .nothing
+        jmp     .add_to_imports
+.realloc_failed:
+; Out of memory for a couple of dwords? Should not happen.
+; Dereference the target referenced by step 3 or 5
+; and return error to the caller.
+        push    esi
+        mov     esi, edi        ; dereference_module takes the MODULE in esi
+        call    dereference_module
+        pop     esi
+        xor     eax, eax
+        ret
+endp
+; Helper procedure for load_module.
+; Allocates MODULE structure for (given path) + (module name),
+; calls the kernel to map it,
+; on success, fills the MODULE structure.
+; in: edi -> module name
+; in: ebx = strlen(filename) + 1
+proc try_map_module uses ebx esi, path_ptr, path_len
+; 1. Allocate MODULE structure; return with eax = 0 if malloc fails.
+        mov     eax, [path_len]
+        lea     eax, [eax+ebx+MODULE.path]      ; fixed fields + directory prefix + name with its zero
+        stdcall malloc, eax
+        test    eax, eax
+        jz      .nothing
+; 2. Create the full name of module in MODULE structure:
+; concatenate module path, if given, and module name.
+        mov     ecx, [path_len]
+        mov     esi, [path_ptr]
+        push    edi             ; edi is borrowed as the copy destination
+        lea     edi, [eax+MODULE.path]
+        rep movsb               ; the directory prefix; nothing is copied if path_len = 0
+        mov     ecx, ebx
+        mov     esi, [esp]      ; esi -> module name saved by the push above
+        rep movsb               ; the name together with its terminating zero
+        pop     edi
+        mov     esi, eax        ; esi -> MODULE for the rest of the procedure
+; 3. Call the kernel to map the module.
+        lea     ecx, [eax+MODULE.path]
+        mov     eax, 68         ; system function 68,
+        mov     ebx, 28         ; subfunction 28, ecx -> full path
+        call    FS_SYSCALL_PTR
+        cmp     eax, -0x1000    ; unsigned results above -0x1000 are treated as failure
+        ja      .failed
+; 4. On success, fill the rest of MODULE structure and return it.
+        xchg    eax, esi        ; eax -> MODULE, esi = kernel result, used as the module base
+        call    init_module_struct
+        ret
+.failed:
+; On failure, undo allocation at step 1 and return zero.
+        stdcall free, esi
+        xor     eax, eax
+.nothing:
+        ret
+endp
+; Worker procedure for loading a new module.
+; Does not check whether the module has been already loaded;
+; find_module_by_name should be called beforehand.
+; in: edi -> filename
+; out: eax -> MODULE or 0
+; modules_mutex should be locked
+proc load_module uses ebx esi ebp
+; 1. Map the module.
+; 1a. Prepare for try_map_module: calculate length of the name.
+        mov     ebx, edi
+@@:
+        inc     ebx
+        cmp     byte [ebx-1], 0
+        jnz     @b
+        sub     ebx, edi        ; ebx = strlen(filename) + 1, as try_map_module expects
+; 1b. Check whether the given path is absolute.
+; If so, proceed to 1c. If not, go to 1d.
+        cmp     byte [edi], '/'
+        jnz     .relative
+; 1c. The given path is absolute. Use it as is. Don't try any other paths.
+        stdcall try_map_module, 0, 0    ; no directory prefix
+        test    eax, eax
+        jnz     .loaded_ok
+        ccall   loader_say_error, msg_cannot_open, edi, 0
+        jmp     .load_failed
+.relative:
+; 1d. The given path is relative.
+; Try /rd/1/lib/, /kolibrios/lib/ and path to executable
+; in this order.
+        stdcall try_map_module, module_path1, module_path1.size
+        test    eax, eax
+        jnz     .loaded_ok
+        stdcall try_map_module, module_path2, module_path2.size
+        test    eax, eax
+        jnz     .loaded_ok
+; Note: we assume that the executable is always the first module in the list.
+        mov     eax, [modules_list + MODULE.next]
+        mov     ecx, [eax+MODULE.filename]
+        add     eax, MODULE.path
+        mov     esi, eax        ; esi -> full path of the executable, reused for the error message
+        sub     ecx, eax        ; ecx = length of the directory part, up to the base name
+        stdcall try_map_module, eax, ecx
+        test    eax, eax
+        jnz     .loaded_ok
+        mov     ebx, dword [esi+MODULE.filename-MODULE.path]    ; ebx -> base name of the executable
+        movzx   eax, byte [ebx]
+        mov     byte [ebx], 0   ; cut the path after the directory while the message is built
+        push    eax             ; remember the overwritten character
+        ccall   loader_say_error, msg_cannot_open, edi, msg_paths_begin, esi, 0
+        pop     eax
+        mov     byte [ebx], al  ; restore the path of the executable
+.load_failed:
+        xor     eax, eax
+        ret
+.loaded_ok:
+; Module has been mapped.
+; MODULE structure has been initialized, but not yet inserted in the common list.
+; 2. Insert the MODULE structure in the end of the common list.
+        mov     esi, eax
+        mov     eax, [modules_list+MODULE.prev] ; eax -> current last item (or the head itself)
+        mov     [eax+MODULE.next], esi
+        mov     [esi+MODULE.prev], eax
+        mov     [modules_list+MODULE.prev], esi
+        mov     [esi+MODULE.next], modules_list
+; 3. Call PE-specific code to initialize the mapped module.
+        push    esi
+        push    edi ; for messages in fixup_pe_relocations
+        mov     esi, [esi+MODULE.base]
+        call    fixup_pe_relocations
+        pop     ecx             ; drop the pushed name; pop keeps the flags
+        pop     esi             ; esi -> MODULE again
+        jc      .fail_unload    ; carry flag from fixup_pe_relocations is taken as failure
+        call    resolve_pe_imports
+        test    eax, eax
+        jnz     .fail_unload    ; a nonzero result is taken as failure
+        mov     eax, esi
+        ret
+.fail_unload:
+        call    dereference_module      ; drops the reference set in init_module_struct
+        xor     eax, eax
+        ret
+endp
+; Worker procedure for unloading a module.
+; Drops one reference to the module; if it was the last one,
+; unloads the module and all referenced modules recursively.
+; in: esi -> MODULE struct
+; modules_mutex should be locked
+proc dereference_module
+; in: esi -> MODULE struct
+; eax, ecx and edx are not preserved, ebx is.
+;
+; 1. Drop one reference. Other references remaining means nothing to do.
+        dec     [esi+MODULE.refcount]
+        jnz     .nothing
+; 2. That was the last reference: unlink the module from the common list.
+        mov     edx, [esi+MODULE.next]
+        mov     eax, [esi+MODULE.prev]
+        mov     [edx+MODULE.prev], eax
+        mov     [eax+MODULE.next], edx
+; 3. Release the dependencies, from the last array entry to the first.
+; num_imports is decremented only after the recursive call has returned.
+.release_imports:
+        mov     eax, [esi+MODULE.num_imports]
+        test    eax, eax
+        jz      .imports_released
+        mov     edx, [esi+MODULE.imports]
+        push    esi
+        mov     esi, [edx+eax*4-4]
+        call    dereference_module
+        pop     esi
+        dec     [esi+MODULE.num_imports]
+        jmp     .release_imports
+.imports_released:
+        stdcall free, [esi+MODULE.imports] ; free(NULL) is ok
+; 4. Unmap the module: system function 68, subfunction 29, ecx = base.
+        push    ebx
+        mov     eax, 68
+        mov     ebx, 29
+        mov     ecx, [esi+MODULE.base]
+        call    FS_SYSCALL_PTR
+        pop     ebx
+; 5. Finally release the MODULE struct itself.
+        stdcall free, esi
+.nothing:
+        ret
+endp
 Property changes:
 Added: svn:eol-style
 +native
 \ No newline at end of property

Subversion Repositories Kolibri OS

Compare Revisions

Regard whitespace Rev 6766 → Rev 6767