From e73e2a976eccadc249d7e9560dec63c41e123426 Mon Sep 17 00:00:00 2001
From: Russel Arbore <russel.jma@gmail.com>
Date: Sun, 16 Feb 2025 18:16:37 -0600
Subject: [PATCH] emit aligns

---
 hercules_cg/src/cpu.rs   | 13 ++++++++-----
 juno_scheduler/src/pm.rs |  3 +++
 2 files changed, 11 insertions(+), 5 deletions(-)

diff --git a/hercules_cg/src/cpu.rs b/hercules_cg/src/cpu.rs
index 7d87170b..a19218c7 100644
--- a/hercules_cg/src/cpu.rs
+++ b/hercules_cg/src/cpu.rs
@@ -103,8 +103,9 @@ impl<'a> CPUContext<'a> {
             } else {
                 write!(
                     w,
-                    "{} noalias nofree nonnull noundef %p{}",
+                    "{} noalias nofree nonnull noundef align({}) %p{}",
                     self.get_type(*ty),
+                    get_type_alignment(&self.types, *ty),
                     idx
                 )?;
             }
@@ -506,10 +507,11 @@ impl<'a> CPUContext<'a> {
                     // load.
                     write!(
                         body,
-                        "  {} = load {}, ptr {}\n",
+                        "  {} = load {}, ptr {}, align {}\n",
                         self.get_value(id, false),
                         self.get_type(self_ty),
-                        index_ptr_name
+                        index_ptr_name,
+                        get_type_alignment(self.types, collect_ty),
                     )?;
                 } else {
                     // If this read doesn't reach a primitive type, just return
@@ -538,9 +540,10 @@ impl<'a> CPUContext<'a> {
                     // perform a single store of the data value.
                     write!(
                         body,
-                        "  store {}, ptr {}\n",
+                        "  store {}, ptr {}, align {}\n",
                         self.get_value(data, true),
-                        index_ptr_name
+                        index_ptr_name,
+                        get_type_alignment(self.types, collect_ty),
                     )?;
                 } else {
                     // If the data item being written is not a primitive type,
diff --git a/juno_scheduler/src/pm.rs b/juno_scheduler/src/pm.rs
index 410e614c..1c00e3d0 100644
--- a/juno_scheduler/src/pm.rs
+++ b/juno_scheduler/src/pm.rs
@@ -795,6 +795,7 @@ impl PassManager {
             .arg(&llvm_path)
             .arg("-c")
             .arg("-O3")
+            .arg("-ffast-math")
             .arg("-march=native")
             .arg("-o")
             .arg(&llvm_object)
@@ -830,6 +831,8 @@ impl PassManager {
             let mut nvcc_process = Command::new("nvcc")
                 .arg("-c")
                 .arg("-O3")
+                .arg("-ffast-math")
+                .arg("-march=native")
                 .arg("-diag-suppress")
                 .arg("177")
                 .arg("-o")
-- 
GitLab