DynamicLinker.cpp 8.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267
  1. /*
  2. * Copyright (c) 2020, Itamar S. <itamar8910@gmail.com>
  3. * Copyright (c) 2021, the SerenityOS developers.
  4. * All rights reserved.
  5. *
  6. * Redistribution and use in source and binary forms, with or without
  7. * modification, are permitted provided that the following conditions are met:
  8. *
  9. * 1. Redistributions of source code must retain the above copyright notice, this
  10. * list of conditions and the following disclaimer.
  11. *
  12. * 2. Redistributions in binary form must reproduce the above copyright notice,
  13. * this list of conditions and the following disclaimer in the documentation
  14. * and/or other materials provided with the distribution.
  15. *
  16. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  17. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  18. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  19. * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
  20. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  21. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  22. * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  23. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
  24. * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  25. * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  26. */
  27. #include <AK/HashMap.h>
  28. #include <AK/HashTable.h>
  29. #include <AK/LexicalPath.h>
  30. #include <AK/LogStream.h>
  31. #include <AK/ScopeGuard.h>
  32. #include <LibC/mman.h>
  33. #include <LibC/stdio.h>
  34. #include <LibC/sys/internals.h>
  35. #include <LibC/unistd.h>
  36. #include <LibCore/File.h>
  37. #include <LibELF/AuxiliaryVector.h>
  38. #include <LibELF/DynamicLinker.h>
  39. #include <LibELF/DynamicLoader.h>
  40. #include <LibELF/DynamicObject.h>
  41. #include <LibELF/Image.h>
  42. #include <LibELF/exec_elf.h>
  43. #include <dlfcn.h>
  44. #include <string.h>
  45. #include <sys/stat.h>
  46. #include <sys/types.h>
  // Uncomment the following line to trace each step of the dynamic loading process.
  // #define DYNAMIC_LOAD_VERBOSE

  // VERBOSE(fmt, ...) forwards to dbgprintf() when DYNAMIC_LOAD_VERBOSE is defined.
  // Otherwise it expands to an empty statement, so its arguments are never evaluated.
  #if defined(DYNAMIC_LOAD_VERBOSE)
  #    define VERBOSE(fmt, ...) dbgprintf(fmt, ##__VA_ARGS__)
  #else
  #    define VERBOSE(fmt, ...) do { } while (0)
  #endif

  // TLS_VERBOSE(fmt, ...) unconditionally forwards to dbgprintf().
  #define TLS_VERBOSE(fmt, ...) dbgprintf(fmt, ##__VA_ARGS__)
  56. namespace ELF {
  57. namespace {
  58. HashMap<String, NonnullRefPtr<ELF::DynamicLoader>> g_loaders;
  59. HashMap<String, NonnullRefPtr<ELF::DynamicObject>> g_loaded_objects;
  60. Vector<NonnullRefPtr<ELF::DynamicObject>> g_global_objects;
  61. using MainFunction = int (*)(int, char**, char**);
  62. using LibCExitFunction = void (*)(int);
  63. size_t g_current_tls_offset = 0;
  64. size_t g_total_tls_size = 0;
  65. char** g_envp = nullptr;
  66. LibCExitFunction g_libc_exit = nullptr;
  67. }
  68. DynamicObject::SymbolLookupResult DynamicLinker::lookup_global_symbol(const char* symbol_name)
  69. {
  70. DynamicObject::SymbolLookupResult weak_result = {};
  71. for (auto& lib : g_global_objects) {
  72. auto res = lib->lookup_symbol(symbol_name);
  73. if (res.found) {
  74. if (res.bind == STB_GLOBAL) {
  75. return res;
  76. } else if (res.bind == STB_WEAK && !weak_result.found) {
  77. weak_result = res;
  78. }
  79. // We don't want to allow local symbols to be pulled in to other modules
  80. }
  81. }
  82. return weak_result;
  83. }
  84. static void map_library(const String& name, int fd)
  85. {
  86. struct stat lib_stat;
  87. int rc = fstat(fd, &lib_stat);
  88. ASSERT(!rc);
  89. auto loader = ELF::DynamicLoader::construct(name.characters(), fd, lib_stat.st_size);
  90. loader->set_tls_offset(g_current_tls_offset);
  91. g_loaders.set(name, loader);
  92. g_current_tls_offset += loader->tls_size();
  93. }
  94. static void map_library(const String& name)
  95. {
  96. // TODO: Do we want to also look for libs in other paths too?
  97. String path = String::format("/usr/lib/%s", name.characters());
  98. int fd = open(path.characters(), O_RDONLY);
  99. ASSERT(fd >= 0);
  100. map_library(name, fd);
  101. }
  102. static String get_library_name(const StringView& path)
  103. {
  104. return LexicalPath(path).basename();
  105. }
  106. static Vector<String> get_dependencies(const String& name)
  107. {
  108. auto lib = g_loaders.get(name).value();
  109. Vector<String> dependencies;
  110. lib->for_each_needed_library([&dependencies, &name](auto needed_name) {
  111. if (name == needed_name)
  112. return IterationDecision::Continue;
  113. dependencies.append(needed_name);
  114. return IterationDecision::Continue;
  115. });
  116. return dependencies;
  117. }
  118. static void map_dependencies(const String& name)
  119. {
  120. VERBOSE("mapping dependencies for: %s\n", name.characters());
  121. for (const auto& needed_name : get_dependencies(name)) {
  122. VERBOSE("needed library: %s\n", needed_name.characters());
  123. String library_name = get_library_name(needed_name);
  124. if (!g_loaders.contains(library_name)) {
  125. map_library(library_name);
  126. map_dependencies(library_name);
  127. }
  128. }
  129. VERBOSE("mapped dependencies for %s\n", name.characters());
  130. }
  131. static void allocate_tls()
  132. {
  133. size_t total_tls_size = 0;
  134. for (const auto& data : g_loaders) {
  135. VERBOSE("%s: TLS Size: %zu\n", data.key.characters(), data.value->tls_size());
  136. total_tls_size += data.value->tls_size();
  137. }
  138. if (total_tls_size) {
  139. [[maybe_unused]] void* tls_address = ::allocate_tls(total_tls_size);
  140. VERBOSE("from userspace, tls_address: %p\n", tls_address);
  141. }
  142. g_total_tls_size = total_tls_size;
  143. }
  144. static void initialize_libc(DynamicObject& libc)
  145. {
  146. // Traditionally, `_start` of the main program initializes libc.
  147. // However, since some libs use malloc() and getenv() in global constructors,
  148. // we have to initialize libc just after it is loaded.
  149. // Also, we can't just mark `__libc_init` with "__attribute__((constructor))"
  150. // because it uses getenv() internally, so `environ` has to be initialized before we call `__libc_init`.
  151. auto res = libc.lookup_symbol("environ");
  152. ASSERT(res.found);
  153. *((char***)res.address) = g_envp;
  154. res = libc.lookup_symbol("__environ_is_malloced");
  155. ASSERT(res.found);
  156. *((bool*)res.address) = false;
  157. res = libc.lookup_symbol("exit");
  158. ASSERT(res.found);
  159. g_libc_exit = (LibCExitFunction)res.address;
  160. res = libc.lookup_symbol("__libc_init");
  161. ASSERT(res.found);
  162. typedef void libc_init_func();
  163. ((libc_init_func*)res.address)();
  164. }
  165. static void load_elf(const String& name)
  166. {
  167. VERBOSE("load_elf: %s\n", name.characters());
  168. auto loader = g_loaders.get(name).value();
  169. VERBOSE("a1\n");
  170. for (const auto& needed_name : get_dependencies(name)) {
  171. VERBOSE("needed library: %s\n", needed_name.characters());
  172. String library_name = get_library_name(needed_name);
  173. if (!g_loaded_objects.contains(library_name)) {
  174. load_elf(library_name);
  175. }
  176. }
  177. auto dynamic_object = loader->load_from_image(RTLD_GLOBAL | RTLD_LAZY, g_total_tls_size);
  178. ASSERT(dynamic_object);
  179. g_loaded_objects.set(name, *dynamic_object);
  180. g_global_objects.append(*dynamic_object);
  181. VERBOSE("load_elf: done %s\n", name.characters());
  182. }
  183. static NonnullRefPtr<DynamicLoader> commit_elf(const String& name)
  184. {
  185. auto loader = g_loaders.get(name).value();
  186. for (const auto& needed_name : get_dependencies(name)) {
  187. String library_name = get_library_name(needed_name);
  188. if (g_loaders.contains(library_name)) {
  189. commit_elf(library_name);
  190. }
  191. }
  192. auto object = loader->load_stage_3(RTLD_GLOBAL | RTLD_LAZY, g_total_tls_size);
  193. ASSERT(object);
  194. if (name == "libc.so") {
  195. initialize_libc(*object);
  196. }
  197. g_loaders.remove(name);
  198. return loader;
  199. }
  200. void ELF::DynamicLinker::linker_main(String&& main_program_name, int main_program_fd, int argc, char** argv, char** envp)
  201. {
  202. g_envp = envp;
  203. map_library(main_program_name, main_program_fd);
  204. map_dependencies(main_program_name);
  205. VERBOSE("loaded all dependencies");
  206. for ([[maybe_unused]] auto& lib : g_loaders) {
  207. VERBOSE("%s - tls size: %zu, tls offset: %zu\n", lib.key.characters(), lib.value->tls_size(), lib.value->tls_offset());
  208. }
  209. allocate_tls();
  210. load_elf(main_program_name);
  211. auto main_program_lib = commit_elf(main_program_name);
  212. FlatPtr entry_point = reinterpret_cast<FlatPtr>(main_program_lib->image().entry().as_ptr());
  213. if (main_program_lib->is_dynamic())
  214. entry_point += reinterpret_cast<FlatPtr>(main_program_lib->text_segment_load_address().as_ptr());
  215. VERBOSE("entry point: %p\n", (void*)entry_point);
  216. g_loaders.clear();
  217. MainFunction main_function = (MainFunction)(entry_point);
  218. VERBOSE("jumping to main program entry point: %p\n", main_function);
  219. int rc = main_function(argc, argv, envp);
  220. VERBOSE("rc: %d\n", rc);
  221. if (g_libc_exit != nullptr) {
  222. g_libc_exit(rc);
  223. } else {
  224. _exit(rc);
  225. }
  226. ASSERT_NOT_REACHED();
  227. }
  228. }