wasmerio
diff --git a/‎lib/compiler-llvm/src/compiler.rs‎
Lines changed: 4 additions & 2 deletions b/‎lib/compiler-llvm/src/compiler.rs‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎lib/compiler-llvm/src/config.rs‎
Lines changed: 39 additions & 54 deletions b/‎lib/compiler-llvm/src/config.rs‎
Lines changed: 39 additions & 54 deletions
diff --git a/‎lib/compiler-llvm/src/object_file.rs‎
Lines changed: 61 additions & 3 deletions b/‎lib/compiler-llvm/src/object_file.rs‎
Lines changed: 61 additions & 3 deletions
diff --git a/‎lib/compiler-llvm/src/translator/code.rs‎
Lines changed: 11 additions & 3 deletions b/‎lib/compiler-llvm/src/translator/code.rs‎
Lines changed: 11 additions & 3 deletions
diff --git a/‎lib/compiler-llvm/src/translator/intrinsics.rs‎
Lines changed: 2 additions & 2 deletions b/‎lib/compiler-llvm/src/translator/intrinsics.rs‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎lib/compiler/src/engine/artifact.rs‎
Lines changed: 3 additions & 1 deletion b/‎lib/compiler/src/engine/artifact.rs‎
Lines changed: 3 additions & 1 deletion
@@ -102,7 +102,8 @@ impl LLVMCompiler {
         let merged_bitcode = function_body_inputs.into_iter().par_bridge().map_init(
             || {
                 let target_machine = self.config().target_machine(target);
-                FuncTranslator::new(target_machine, binary_format).unwrap()
+                let pointer_width = target.triple().pointer_width().unwrap().bytes();
+                FuncTranslator::new(target_machine, binary_format, pointer_width).unwrap()
             },
             |func_translator, (i, input)| {
                 let module = func_translator.translate_to_module(
@@ -280,7 +281,8 @@ impl Compiler for LLVMCompiler {
             .map_init(
                 || {
                     let target_machine = self.config().target_machine(target);
-                    FuncTranslator::new(target_machine, binary_format).unwrap()
+                    let pointer_width = target.triple().pointer_width().unwrap().bytes();
+                    FuncTranslator::new(target_machine, binary_format, pointer_width).unwrap()
                 },
                 |func_translator, (i, input)| {
                     // TODO: remove (to serialize)
 
@@ -1,7 +1,7 @@
 use crate::compiler::LLVMCompiler;
 use inkwell::targets::{
     CodeModel, InitializationConfig, RelocMode, Target as InkwellTarget, TargetMachine,
-    TargetTriple,
+    TargetMachineOptions, TargetTriple,
 };
 pub use inkwell::OptimizationLevel as LLVMOptLevel;
 use itertools::Itertools;
@@ -193,6 +193,14 @@ impl LLVM {
                 info: true,
                 machine_code: true,
             }),
+            Architecture::Riscv32(_) => InkwellTarget::initialize_riscv(&InitializationConfig {
+                asm_parser: true,
+                asm_printer: true,
+                base: true,
+                disassembler: true,
+                info: true,
+                machine_code: true,
+            }),
             Architecture::LoongArch64 => {
                 InkwellTarget::initialize_loongarch(&InitializationConfig {
                     asm_parser: true,
@@ -224,61 +232,38 @@ impl LLVM {
 
         let target_triple = self.target_triple(target);
         let llvm_target = InkwellTarget::from_triple(&target_triple).unwrap();
-        let llvm_target_machine = llvm_target
-            .create_target_machine(
-                &target_triple,
-                match triple.architecture {
-                    Architecture::Riscv64(_) => "generic-rv64",
-                    Architecture::LoongArch64 => "generic-la64",
-                    _ => "generic",
-                },
-                match triple.architecture {
-                    Architecture::Riscv64(_) => "+m,+a,+c,+d,+f",
-                    Architecture::LoongArch64 => "+f,+d",
-                    _ => &llvm_cpu_features,
-                },
-                self.opt_level,
-                self.reloc_mode(self.target_binary_format(target)),
-                match triple.architecture {
-                    Architecture::LoongArch64 | Architecture::Riscv64(_) => CodeModel::Medium,
-                    _ => self.code_model(self.target_binary_format(target)),
-                },
-            )
-            .unwrap();
-
-        if let Architecture::Riscv64(_) = triple.architecture {
-            // TODO: totally non-portable way to change ABI
-            unsafe {
-                // This structure mimic the internal structure from inkwell
-                // that is defined as
-                //  #[derive(Debug)]
-                //  pub struct TargetMachine {
-                //    pub(crate) target_machine: LLVMTargetMachineRef,
-                //  }
-                pub struct MyTargetMachine {
-                    pub target_machine: *const u8,
+        let mut llvm_target_machine_options = TargetMachineOptions::new()
+            .set_cpu(match triple.architecture {
+                Architecture::Riscv64(_) => "generic-rv64",
+                Architecture::Riscv32(_) => "generic-rv32",
+                Architecture::LoongArch64 => "generic-la64",
+                _ => "generic",
+            })
+            .set_features(match triple.architecture {
+                Architecture::Riscv64(_) => "+m,+a,+c,+d,+f",
+                // TODO: WASM modules require these features to function. However,
+                // it is also possible to disable them by generating calls to
+                // floating-point and multiplication routine functions instead. It might
+                // be worthwhile to allow turning them off and generate references to
+                // the proper routine functions.
+                Architecture::Riscv32(_) => "+m,+d,+f",
+                Architecture::LoongArch64 => "+f,+d",
+                _ => &llvm_cpu_features,
+            })
+            .set_level(self.opt_level)
+            .set_reloc_mode(self.reloc_mode(self.target_binary_format(target)))
+            .set_code_model(match triple.architecture {
+                Architecture::LoongArch64 | Architecture::Riscv64(_) | Architecture::Riscv32(_) => {
+                    CodeModel::Medium
                 }
-                // It is use to live patch the create LLVMTargetMachine
-                // to hard change the ABI and force "-mabi=lp64d" ABI
-                // instead of the default that don't use float registers
-                // because there is no current way to do this change
-
-                let my_target_machine: MyTargetMachine = std::mem::transmute(llvm_target_machine);
-
-                *((my_target_machine.target_machine as *mut u8).offset(0x410) as *mut u64) = 5;
-                std::ptr::copy_nonoverlapping(
-                    "lp64d\0".as_ptr(),
-                    (my_target_machine.target_machine as *mut u8).offset(0x418),
-                    6,
-                );
-
-                std::mem::transmute::<MyTargetMachine, inkwell::targets::TargetMachine>(
-                    my_target_machine,
-                )
-            }
-        } else {
-            llvm_target_machine
+                _ => self.code_model(self.target_binary_format(target)),
+            });
+        if let Architecture::Riscv64(_) = triple.architecture {
+            llvm_target_machine_options = llvm_target_machine_options.set_abi("lp64d");
         }
+        llvm_target
+            .create_target_machine_from_options(&target_triple, llvm_target_machine_options)
+            .unwrap()
     }
 }
 
 
@@ -84,6 +84,64 @@ static LIBCALLS_ELF: phf::Map<&'static str, LibCall> = phf::phf_map! {
     "wasmer_vm_read_exception" => LibCall::ReadException,
     "wasmer_vm_dbg_usize" => LibCall::DebugUsize,
     "wasmer_eh_personality" => LibCall::EHPersonality,
+    // Floating-point & 64-bit mul/div routine functions. Those might
+    // be generated by LLVM when generating objects for 32-bit platforms,
+    // or platforms without floating-point support. Modern Rust & C toolchains
+    // provide implementations for those functions by default.
+    "__adddf3" => LibCall::Adddf3,
+    "__addsf3" => LibCall::Addsf3,
+    "__divdf3" => LibCall::Divdf3,
+    "__divdi3" => LibCall::Divdi3,
+    "__divsf3" => LibCall::Divsf3,
+    "__divsi3" => LibCall::Divsi3,
+    "__eqdf2" => LibCall::Eqdf2,
+    "__eqsf2" => LibCall::Eqsf2,
+    "__extendsfdf2" => LibCall::Extendsfdf2,
+    "__fixdfdi" => LibCall::Fixdfdi,
+    "__fixdfsi" => LibCall::Fixdfsi,
+    "__fixsfdi" => LibCall::Fixsfdi,
+    "__fixsfsi" => LibCall::Fixsfsi,
+    "__fixunsdfdi" => LibCall::Fixunsdfdi,
+    "__fixunsdfsi" => LibCall::Fixunsdfsi,
+    "__fixunssfdi" => LibCall::Fixunssfdi,
+    "__fixunssfsi" => LibCall::Fixunssfsi,
+    "__floatdidf" => LibCall::Floatdidf,
+    "__floatdisf" => LibCall::Floatdisf,
+    "__floatsidf" => LibCall::Floatsidf,
+    "__floatsisf" => LibCall::Floatsisf,
+    "__floatundidf" => LibCall::Floatundidf,
+    "__floatundisf" => LibCall::Floatundisf,
+    "__floatunsidf" => LibCall::Floatunsidf,
+    "__floatunsisf" => LibCall::Floatunsisf,
+    "__gedf2" => LibCall::Gedf2,
+    "__gesf2" => LibCall::Gesf2,
+    "__gtdf2" => LibCall::Gtdf2,
+    "__gtsf2" => LibCall::Gtsf2,
+    "__ledf2" => LibCall::Ledf2,
+    "__lesf2" => LibCall::Lesf2,
+    "__ltdf2" => LibCall::Ltdf2,
+    "__ltsf2" => LibCall::Ltsf2,
+    "__moddi3" => LibCall::Moddi3,
+    "__modsi3" => LibCall::Modsi3,
+    "__muldf3" => LibCall::Muldf3,
+    "__muldi3" => LibCall::Muldi3,
+    "__mulsf3" => LibCall::Mulsf3,
+    "__mulsi3" => LibCall::Mulsi3,
+    "__nedf2" => LibCall::Nedf2,
+    "__negdf2" => LibCall::Negdf2,
+    "__negsf2" => LibCall::Negsf2,
+    "__nesf2" => LibCall::Nesf2,
+    "__subdf3" => LibCall::Subdf3,
+    "__subsf3" => LibCall::Subsf3,
+    "__truncdfsf2" => LibCall::Truncdfsf2,
+    "__udivdi3" => LibCall::Udivdi3,
+    "__udivsi3" => LibCall::Udivsi3,
+    "__umoddi3" => LibCall::Umoddi3,
+    "__umodsi3" => LibCall::Umodsi3,
+    "__unorddf2" => LibCall::Unorddf2,
+    "__unordsf2" => LibCall::Unordsf2,
+    "memset" => LibCall::Memset,
+    "sqrt" => LibCall::Sqrt,
 };
 
 static LIBCALLS_MACHO: phf::Map<&'static str, LibCall> = phf::phf_map! {
@@ -401,17 +459,17 @@ where
                     0,
                 ) => RelocationKind::Arm64Movw3,
                 (
-                    object::Architecture::Riscv64,
+                    object::Architecture::Riscv64 | object::Architecture::Riscv32,
                     object::RelocationKind::Elf(object::elf::R_RISCV_CALL_PLT),
                     0,
                 ) => RelocationKind::RiscvCall,
                 (
-                    object::Architecture::Riscv64,
+                    object::Architecture::Riscv64 | object::Architecture::Riscv32,
                     object::RelocationKind::Elf(object::elf::R_RISCV_PCREL_HI20),
                     0,
                 ) => RelocationKind::RiscvPCRelHi20,
                 (
-                    object::Architecture::Riscv64,
+                    object::Architecture::Riscv64 | object::Architecture::Riscv32,
                     object::RelocationKind::Elf(object::elf::R_RISCV_PCREL_LO12_I),
                     0,
                 ) => RelocationKind::RiscvPCRelLo12I,
 
@@ -58,12 +58,14 @@ pub struct FuncTranslator {
     abi: Box<dyn Abi>,
     binary_fmt: BinaryFormat,
     func_section: String,
+    pointer_width: u8,
 }
 
 impl FuncTranslator {
     pub fn new(
         target_machine: TargetMachine,
         binary_fmt: BinaryFormat,
+        pointer_width: u8,
     ) -> Result<Self, CompileError> {
         let abi = get_abi(&target_machine);
         Ok(Self {
@@ -80,6 +82,7 @@ impl FuncTranslator {
                 }
             },
             binary_fmt,
+            pointer_width,
         })
     }
 
@@ -116,8 +119,7 @@ impl FuncTranslator {
             .get(wasm_module.functions[func_index])
             .unwrap();
 
-        // TODO: pointer width
-        let offsets = VMOffsets::new(8, wasm_module);
+        let offsets = VMOffsets::new(self.pointer_width, wasm_module);
         let intrinsics = Intrinsics::declare(&module, &self.ctx, &target_data, &self.binary_fmt);
         let (func_type, func_attrs) =
             self.abi
@@ -238,7 +240,13 @@ impl FuncTranslator {
             state,
             function: func,
             locals: params_locals,
-            ctx: CtxType::new(wasm_module, &func, &cache_builder, &*self.abi),
+            ctx: CtxType::new(
+                wasm_module,
+                &func,
+                &cache_builder,
+                &*self.abi,
+                self.pointer_width,
+            ),
             unreachable_depth: 0,
             memory_styles,
             _table_styles,
 
@@ -1232,6 +1232,7 @@ impl<'ctx, 'a> CtxType<'ctx, 'a> {
         func_value: &FunctionValue<'ctx>,
         cache_builder: &'a Builder<'ctx>,
         abi: &'a dyn Abi,
+        pointer_width: u8,
     ) -> CtxType<'ctx, 'a> {
         CtxType {
             ctx_ptr_value: abi.get_vmctx_ptr_param(func_value),
@@ -1248,8 +1249,7 @@ impl<'ctx, 'a> CtxType<'ctx, 'a> {
             cached_memory_grow: HashMap::new(),
             cached_memory_size: HashMap::new(),
 
-            // TODO: pointer width
-            offsets: VMOffsets::new(8, wasm_module),
+            offsets: VMOffsets::new(pointer_width, wasm_module),
         }
     }
 
 
@@ -1107,11 +1107,13 @@ impl Artifact {
             _ => 1,
         };
 
+        // MetadataHeader::parse requires the metadata to be aligned
+        // to 8 bytes.
         emit_data(
             &mut obj,
             object_name.as_bytes(),
             &metadata_binary,
-            default_align,
+            std::cmp::max(8, default_align),
         )
         .map_err(to_compile_error)?;