dwarf_extractor.cpp 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513
  1. /*
  2. * Copyright (C) 2021 Ant Group. All rights reserved.
  3. * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  4. */
  5. #include "lldb/API/SBBlock.h"
  6. #include "lldb/API/SBCompileUnit.h"
  7. #include "lldb/API/SBCommandReturnObject.h"
  8. #include "lldb/API/SBCommandInterpreter.h"
  9. #include "lldb/API/SBBreakpointLocation.h"
  10. #include "lldb/API/SBDebugger.h"
  11. #include "lldb/API//SBFunction.h"
  12. #include "lldb/API//SBModule.h"
  13. #include "lldb/API//SBProcess.h"
  14. #include "lldb/API//SBStream.h"
  15. #include "lldb/API//SBSymbol.h"
  16. #include "lldb/API//SBTarget.h"
  17. #include "lldb/API//SBThread.h"
  18. #include "lldb/API/SBDeclaration.h"
  19. #include "dwarf_extractor.h"
  20. #include "../aot_llvm.h"
  21. #include "bh_log.h"
  22. #include "../../aot/aot_runtime.h"
  23. #include "llvm/BinaryFormat/Dwarf.h"
  24. using namespace lldb;
  25. typedef struct dwar_extractor {
  26. SBDebugger debugger;
  27. SBTarget target;
  28. SBModule module;
  29. } dwar_extractor;
  30. #define TO_HANDLE(extractor) (dwar_extractor_handle_t)(extractor)
  31. #define TO_EXTACTOR(handle) (dwar_extractor *)(handle)
  32. static bool is_debugger_initialized;
  33. dwar_extractor_handle_t
  34. create_dwarf_extractor(AOTCompData *comp_data, char *file_name)
  35. {
  36. char *arch = NULL;
  37. char *platform = NULL;
  38. dwar_extractor *extractor = NULL;
  39. //__attribute__((constructor)) may be better?
  40. if (!is_debugger_initialized) {
  41. SBError error = SBDebugger::InitializeWithErrorHandling();
  42. if (error.Fail()) {
  43. LOG_ERROR("Init Dwarf Debugger failed");
  44. return TO_HANDLE(NULL);
  45. }
  46. is_debugger_initialized = true;
  47. }
  48. SBError error;
  49. SBFileSpec exe_file_spec(file_name, true);
  50. if (!(extractor = new dwar_extractor())) {
  51. LOG_ERROR("Create Dwarf Extractor error: failed to allocate memory");
  52. goto fail3;
  53. }
  54. extractor->debugger = SBDebugger::Create();
  55. if (!extractor->debugger.IsValid()) {
  56. LOG_ERROR("Create Dwarf Debugger failed");
  57. goto fail2;
  58. }
  59. extractor->target = extractor->debugger.CreateTarget(
  60. file_name, arch, platform, false, error);
  61. if (!error.Success()) {
  62. LOG_ERROR("Create Dwarf target failed:%s", error.GetCString());
  63. goto fail1;
  64. }
  65. if (!extractor->target.IsValid()) {
  66. LOG_ERROR("Create Dwarf target not valid");
  67. goto fail1;
  68. }
  69. extractor->module = extractor->target.FindModule(exe_file_spec);
  70. comp_data->extractor = TO_HANDLE(extractor);
  71. return TO_HANDLE(extractor);
  72. fail1:
  73. SBDebugger::Destroy(extractor->debugger);
  74. fail2:
  75. wasm_runtime_free(extractor);
  76. fail3:
  77. return TO_HANDLE(NULL);
  78. }
  79. void
  80. destroy_dwarf_extractor(dwar_extractor_handle_t handle)
  81. {
  82. dwar_extractor *extractor = TO_EXTACTOR(handle);
  83. if (!extractor)
  84. return;
  85. extractor->debugger.DeleteTarget(extractor->target);
  86. SBDebugger::Destroy(extractor->debugger);
  87. delete extractor;
  88. SBDebugger::Terminate();
  89. is_debugger_initialized = false;
  90. }
  91. LLVMMetadataRef
  92. dwarf_gen_file_info(const AOTCompContext *comp_ctx)
  93. {
  94. dwar_extractor *extractor;
  95. int units_number;
  96. LLVMMetadataRef file_info = NULL;
  97. const char *file_name;
  98. const char *dir_name;
  99. if (!(extractor = TO_EXTACTOR(comp_ctx->comp_data->extractor)))
  100. return NULL;
  101. units_number = extractor->module.GetNumCompileUnits();
  102. if (units_number > 0) {
  103. SBCompileUnit compile_unit = extractor->module.GetCompileUnitAtIndex(0);
  104. auto filespec = compile_unit.GetFileSpec();
  105. file_name = filespec.GetFilename();
  106. dir_name = filespec.GetDirectory();
  107. if (file_name || dir_name) {
  108. file_info = LLVMDIBuilderCreateFile(comp_ctx->debug_builder,
  109. file_name, strlen(file_name),
  110. dir_name, strlen(dir_name));
  111. }
  112. }
  113. return file_info;
  114. }
  #if 0
  /*
   * Disabled code: creates a file entry, a compile unit and a subprogram
   * for a synthetic "ant_runtime_mock" function added to comp_ctx->module,
   * and stores them in the vm_debug_* fields of the compilation context.
   */
  void
  dwarf_gen_mock_vm_info(AOTCompContext *comp_ctx)
  {
      LLVMMetadataRef mock_file = LLVMDIBuilderCreateFile(
          comp_ctx->debug_builder, "ant_runtime_mock.c", 18, ".", 1);

      LLVMMetadataRef mock_unit = LLVMDIBuilderCreateCompileUnit(
          comp_ctx->debug_builder, LLVMDWARFSourceLanguageC, mock_file,
          "ant compiler", 12, 0, NULL, 0, 1, NULL, 0, LLVMDWARFEmissionFull,
          0, 0, 0, "/", 1, "", 0);

      /* The function type is built with a parameter count of 0 */
      LLVMTypeRef llvm_param_types[] = {
          LLVMVoidType(),
      };
      LLVMTypeRef llvm_func_type =
          LLVMFunctionType(LLVMVoidType(), llvm_param_types, 0, 0);
      LLVMValueRef mock_func =
          LLVMAddFunction(comp_ctx->module, "ant_runtime_mock", llvm_func_type);

      LLVMMetadataRef di_param_types[0];
      LLVMMetadataRef di_func_type = LLVMDIBuilderCreateSubroutineType(
          comp_ctx->debug_builder, mock_file, di_param_types, 0,
          LLVMDIFlagZero);

      /* 0x0015 is subroutine_type */
      LLVMMetadataRef placeholder =
          LLVMDIBuilderCreateReplaceableCompositeType(
              comp_ctx->debug_builder, 0x15, "ant_runtime_mock", 16,
              mock_file, mock_file, 2, 0, 0, 0, LLVMDIFlagFwdDecl, "", 0);

      LLVMMetadataRef mock_subprogram = LLVMDIBuilderCreateFunction(
          comp_ctx->debug_builder, mock_file, "ant_runtime_mock", 16,
          "ant_runtime_mock", 16, mock_file, 2, di_func_type, true, true, 2,
          LLVMDIFlagZero, false);

      LLVMMetadataReplaceAllUsesWith(placeholder, mock_subprogram);
      LLVMSetSubprogram(mock_func, mock_subprogram);

      comp_ctx->vm_debug_comp_unit = mock_unit;
      comp_ctx->vm_debug_file = mock_file;
      comp_ctx->vm_debug_func = mock_subprogram;
  }
  #endif
  153. LLVMMetadataRef
  154. dwarf_gen_comp_unit_info(const AOTCompContext *comp_ctx)
  155. {
  156. dwar_extractor *extractor;
  157. int units_number;
  158. LLVMMetadataRef comp_unit = NULL;
  159. if (!(extractor = TO_EXTACTOR(comp_ctx->comp_data->extractor)))
  160. return NULL;
  161. units_number = extractor->module.GetNumCompileUnits();
  162. if (units_number > 0) {
  163. SBCompileUnit compile_unit = extractor->module.GetCompileUnitAtIndex(0);
  164. auto lang_type = compile_unit.GetLanguage();
  165. comp_unit = LLVMDIBuilderCreateCompileUnit(
  166. comp_ctx->debug_builder, LLDB_TO_LLVM_LANG_TYPE(lang_type),
  167. comp_ctx->debug_file, "ant compiler", 12, 0, NULL, 0, 1, NULL, 0,
  168. LLVMDWARFEmissionFull, 0, 0, 0, "/", 1, "", 0);
  169. }
  170. return comp_unit;
  171. }
  172. static LLVMDWARFTypeEncoding
  173. lldb_get_basic_type_encoding(BasicType basic_type)
  174. {
  175. LLVMDWARFTypeEncoding encoding = 0;
  176. switch (basic_type) {
  177. case eBasicTypeUnsignedChar:
  178. encoding = llvm::dwarf::DW_ATE_unsigned_char;
  179. break;
  180. case eBasicTypeSignedChar:
  181. encoding = llvm::dwarf::DW_ATE_signed_char;
  182. break;
  183. case eBasicTypeUnsignedInt:
  184. case eBasicTypeUnsignedLong:
  185. case eBasicTypeUnsignedLongLong:
  186. case eBasicTypeUnsignedWChar:
  187. case eBasicTypeUnsignedInt128:
  188. case eBasicTypeUnsignedShort:
  189. encoding = llvm::dwarf::DW_ATE_unsigned;
  190. break;
  191. case eBasicTypeInt:
  192. case eBasicTypeLong:
  193. case eBasicTypeLongLong:
  194. case eBasicTypeWChar:
  195. case eBasicTypeInt128:
  196. case eBasicTypeShort:
  197. encoding = llvm::dwarf::DW_ATE_signed;
  198. break;
  199. case eBasicTypeBool:
  200. encoding = llvm::dwarf::DW_ATE_boolean;
  201. break;
  202. case eBasicTypeHalf:
  203. case eBasicTypeFloat:
  204. case eBasicTypeDouble:
  205. case eBasicTypeLongDouble:
  206. encoding = llvm::dwarf::DW_ATE_float;
  207. break;
  208. default:
  209. break;
  210. }
  211. return encoding;
  212. }
  213. static LLVMMetadataRef
  214. lldb_type_to_type_dbi(const AOTCompContext *comp_ctx, SBType &type)
  215. {
  216. LLVMMetadataRef type_info = NULL;
  217. BasicType basic_type = type.GetBasicType();
  218. uint64_t bit_size = type.GetByteSize() * 8;
  219. LLVMDIBuilderRef DIB = comp_ctx->debug_builder;
  220. LLVMDWARFTypeEncoding encoding;
  221. if (basic_type != eBasicTypeInvalid) {
  222. encoding = lldb_get_basic_type_encoding(basic_type);
  223. type_info = LLVMDIBuilderCreateBasicType(
  224. DIB, type.GetName(), strlen(type.GetName()), bit_size, encoding,
  225. LLVMDIFlagZero);
  226. }
  227. else if (type.IsPointerType()) {
  228. SBType pointee_type = type.GetPointeeType();
  229. type_info = LLVMDIBuilderCreatePointerType(
  230. DIB, lldb_type_to_type_dbi(comp_ctx, pointee_type), bit_size, 0, 0,
  231. "", 0);
  232. }
  233. return type_info;
  234. }
  235. static LLVMMetadataRef
  236. lldb_function_to_function_dbi(const AOTCompContext *comp_ctx,
  237. SBSymbolContext &sc,
  238. const AOTFuncContext *func_ctx)
  239. {
  240. SBFunction function(sc.GetFunction());
  241. const char *function_name = function.GetName();
  242. const char *link_name = function.GetName();
  243. SBTypeList function_args = function.GetType().GetFunctionArgumentTypes();
  244. SBType return_type = function.GetType().GetFunctionReturnType();
  245. const size_t num_function_args = function_args.GetSize();
  246. dwar_extractor *extractor;
  247. if (!(extractor = TO_EXTACTOR(comp_ctx->comp_data->extractor)))
  248. return NULL;
  249. LLVMDIBuilderRef DIB = comp_ctx->debug_builder;
  250. LLVMMetadataRef File = comp_ctx->debug_file;
  251. LLVMMetadataRef ParamTypes[num_function_args + 1];
  252. ParamTypes[0] = lldb_type_to_type_dbi(comp_ctx, return_type);
  253. for (uint32_t function_arg_idx = 0; function_arg_idx < num_function_args;
  254. ++function_arg_idx) {
  255. SBType function_arg_type =
  256. function_args.GetTypeAtIndex(function_arg_idx);
  257. if (function_arg_type.IsValid()) {
  258. ParamTypes[function_arg_idx + 1] =
  259. lldb_type_to_type_dbi(comp_ctx, function_arg_type);
  260. }
  261. }
  262. LLVMMetadataRef FunctionTy = LLVMDIBuilderCreateSubroutineType(
  263. DIB, File, ParamTypes, num_function_args + 1, LLVMDIFlagZero);
  264. auto line_entry = sc.GetLineEntry();
  265. LLVMMetadataRef ReplaceableFunctionMetadata =
  266. LLVMDIBuilderCreateReplaceableCompositeType(
  267. DIB, 0x15, function_name, strlen(function_name), File, File,
  268. line_entry.GetLine(), 0, 0, 0, LLVMDIFlagFwdDecl, "", 0);
  269. LLVMMetadataRef FunctionMetadata = LLVMDIBuilderCreateFunction(
  270. DIB, File, function_name, strlen(function_name), link_name,
  271. strlen(link_name), File, line_entry.GetLine(), FunctionTy, true, true,
  272. line_entry.GetLine(), LLVMDIFlagZero, false);
  273. LLVMMetadataReplaceAllUsesWith(ReplaceableFunctionMetadata,
  274. FunctionMetadata);
  275. LLVMSetSubprogram(func_ctx->func, FunctionMetadata);
  276. LLVMMetadataRef ParamExpression =
  277. LLVMDIBuilderCreateExpression(DIB, NULL, 0);
  278. auto variable_list =
  279. function.GetBlock().GetVariables(extractor->target, true, false, false);
  280. if (num_function_args != variable_list.GetSize()) {
  281. LOG_ERROR(
  282. "function args number dismatch!:value number=%d, function args=%d",
  283. variable_list.GetSize(), num_function_args);
  284. }
  285. LLVMMetadataRef ParamLocation = LLVMDIBuilderCreateDebugLocation(
  286. comp_ctx->context, line_entry.GetLine(), 0, FunctionMetadata, NULL);
  287. // TODO:change to void * or WasmExenv * ?
  288. LLVMMetadataRef voidtype =
  289. LLVMDIBuilderCreateBasicType(DIB, "void", 4, 0, 0, LLVMDIFlagZero);
  290. LLVMMetadataRef voidpionter =
  291. LLVMDIBuilderCreatePointerType(DIB, voidtype, 64, 0, 0, "void *", 6);
  292. LLVMMetadataRef ParamVar = LLVMDIBuilderCreateParameterVariable(
  293. DIB, FunctionMetadata, "exenv", 5, 1,
  294. File, // starts form 1, and 1 is exenv,
  295. line_entry.GetLine(), voidpionter, true, LLVMDIFlagZero);
  296. LLVMValueRef Param = LLVMGetParam(func_ctx->func, 0);
  297. LLVMBasicBlockRef block_curr = LLVMGetEntryBasicBlock(func_ctx->func);
  298. LLVMDIBuilderInsertDbgValueAtEnd(DIB, Param, ParamVar, ParamExpression,
  299. ParamLocation, block_curr);
  300. for (uint32_t function_arg_idx = 0;
  301. function_arg_idx < variable_list.GetSize(); ++function_arg_idx) {
  302. SBValue variable(variable_list.GetValueAtIndex(function_arg_idx));
  303. if (variable.IsValid()) {
  304. SBDeclaration dec(variable.GetDeclaration());
  305. auto valtype = variable.GetType();
  306. LLVMMetadataRef ParamLocation = LLVMDIBuilderCreateDebugLocation(
  307. comp_ctx->context, dec.GetLine(), dec.GetColumn(),
  308. FunctionMetadata, NULL);
  309. LLVMMetadataRef ParamVar = LLVMDIBuilderCreateParameterVariable(
  310. DIB, FunctionMetadata, variable.GetName(),
  311. strlen(variable.GetName()), function_arg_idx + 1 + 1,
  312. File, // starts form 1, and 1 is exenv,
  313. dec.GetLine(), ParamTypes[function_arg_idx + 1], true,
  314. LLVMDIFlagZero);
  315. LLVMValueRef Param =
  316. LLVMGetParam(func_ctx->func, function_arg_idx + 1);
  317. LLVMDIBuilderInsertDbgValueAtEnd(DIB, Param, ParamVar,
  318. ParamExpression, ParamLocation,
  319. block_curr);
  320. }
  321. }
  322. return FunctionMetadata;
  323. }
  324. LLVMMetadataRef
  325. dwarf_gen_func_info(const AOTCompContext *comp_ctx,
  326. const AOTFuncContext *func_ctx)
  327. {
  328. LLVMMetadataRef func_info = NULL;
  329. dwar_extractor *extractor;
  330. uint64_t vm_offset;
  331. AOTFunc *func = func_ctx->aot_func;
  332. if (!(extractor = TO_EXTACTOR(comp_ctx->comp_data->extractor)))
  333. return NULL;
  334. // A code address in DWARF for WebAssembly is the offset of an
  335. // instruction relative within the Code section of the WebAssembly file.
  336. // For this reason Section::GetFileAddress() must return zero for the
  337. // Code section. (refert to ObjectFileWasm.cpp)
  338. vm_offset = func->code - comp_ctx->comp_data->wasm_module->buf_code;
  339. auto sbaddr = extractor->target.ResolveFileAddress(vm_offset);
  340. SBSymbolContext sc(sbaddr.GetSymbolContext(eSymbolContextFunction
  341. | eSymbolContextLineEntry));
  342. if (sc.IsValid()) {
  343. SBFunction function(sc.GetFunction());
  344. if (function.IsValid()) {
  345. func_info = lldb_function_to_function_dbi(comp_ctx, sc, func_ctx);
  346. }
  347. }
  348. return func_info;
  349. }
  350. void
  351. dwarf_get_func_name(const AOTCompContext *comp_ctx,
  352. const AOTFuncContext *func_ctx, char *name, int len)
  353. {
  354. LLVMMetadataRef func_info = NULL;
  355. dwar_extractor *extractor;
  356. uint64_t vm_offset;
  357. AOTFunc *func = func_ctx->aot_func;
  358. name[0] = '\0';
  359. if (!(extractor = TO_EXTACTOR(comp_ctx->comp_data->extractor)))
  360. return;
  361. // A code address in DWARF for WebAssembly is the offset of an
  362. // instruction relative within the Code section of the WebAssembly file.
  363. // For this reason Section::GetFileAddress() must return zero for the
  364. // Code section. (refert to ObjectFileWasm.cpp)
  365. vm_offset = func->code - comp_ctx->comp_data->wasm_module->buf_code;
  366. auto sbaddr = extractor->target.ResolveFileAddress(vm_offset);
  367. SBSymbolContext sc(sbaddr.GetSymbolContext(eSymbolContextFunction
  368. | eSymbolContextLineEntry));
  369. if (sc.IsValid()) {
  370. SBFunction function(sc.GetFunction());
  371. if (function.IsValid()) {
  372. bh_strcpy_s(name, len, function.GetName());
  373. }
  374. }
  375. }
  376. LLVMMetadataRef
  377. dwarf_gen_location(const AOTCompContext *comp_ctx,
  378. const AOTFuncContext *func_ctx, uint64_t vm_offset)
  379. {
  380. LLVMMetadataRef location_info = NULL;
  381. dwar_extractor *extractor;
  382. AOTFunc *func = func_ctx->aot_func;
  383. if (!(extractor = TO_EXTACTOR(comp_ctx->comp_data->extractor)))
  384. return NULL;
  385. auto sbaddr = extractor->target.ResolveFileAddress(vm_offset);
  386. SBSymbolContext sc(sbaddr.GetSymbolContext(eSymbolContextFunction
  387. | eSymbolContextLineEntry));
  388. if (sc.IsValid()) {
  389. // TODO:need to check if the vm_offset is belong to
  390. SBFunction function(sc.GetFunction());
  391. if (function.IsValid()) {
  392. uint64_t start = func_ctx->aot_func->code
  393. - comp_ctx->comp_data->wasm_module->buf_code;
  394. uint64_t end = func_ctx->aot_func->code
  395. - comp_ctx->comp_data->wasm_module->buf_code
  396. + func_ctx->aot_func->code_size;
  397. if (function.GetStartAddress().GetOffset() <= start
  398. && end <= function.GetEndAddress().GetOffset()) {
  399. auto line_entry = sc.GetLineEntry();
  400. location_info = LLVMDIBuilderCreateDebugLocation(
  401. comp_ctx->context, line_entry.GetLine(),
  402. line_entry.GetColumn(), func_ctx->debug_func, NULL);
  403. // LOG_VERBOSE("Gen the location l:%d, c:%d at %lx",
  404. // line_entry.GetLine(), line_entry.GetColumn(), vm_offset);
  405. }
  406. else
  407. LOG_WARNING("the offset and function is not matched");
  408. }
  409. }
  410. return location_info;
  411. }
  412. LLVMMetadataRef
  413. dwarf_gen_func_ret_location(const AOTCompContext *comp_ctx,
  414. const AOTFuncContext *func_ctx)
  415. {
  416. LLVMMetadataRef func_info = NULL;
  417. dwar_extractor *extractor;
  418. uint64_t vm_offset;
  419. AOTFunc *func = func_ctx->aot_func;
  420. LLVMMetadataRef location_info = NULL;
  421. if (!(extractor = TO_EXTACTOR(comp_ctx->comp_data->extractor)))
  422. return NULL;
  423. // A code address in DWARF for WebAssembly is the offset of an
  424. // instruction relative within the Code section of the WebAssembly file.
  425. // For this reason Section::GetFileAddress() must return zero for the
  426. // Code section. (refert to ObjectFileWasm.cpp)
  427. vm_offset = (func->code + func->code_size - 1)
  428. - comp_ctx->comp_data->wasm_module->buf_code;
  429. location_info = dwarf_gen_location(comp_ctx, func_ctx, vm_offset);
  430. return location_info;
  431. }