Merge branch 'main' of https://github.com/PlatformAwareProgramming/NPB-Rust

decarvalhojunior-fh · decarvalhojunior-fh · commit 52148e8174bc · 2025-04-28T18:56:06.000-03:00
diff --git a/rust-cuda-project/Cargo.toml b/rust-cuda-project/Cargo.toml
@@ -0,0 +1,6 @@
+[package]
+name = "meu-projeto-rust"
+version = "0.1.0"
+edition = "2021"
+
+[dependencies]
diff --git a/rust-cuda-project/Makefile b/rust-cuda-project/Makefile
@@ -0,0 +1,36 @@
+# File paths
+CUDA_SRC = src/dot_product.cu
+CUDA_OBJ = dot_product.o
+CUDA_LIB = libdot_product.so
+# Replace with the name of your Rust package. (The note lives on its own line:
+# an inline comment would leave trailing spaces inside the variable's value.)
+RUST_TARGET = target/debug/meu-projeto-rust
+
+# Tools
+NVCC = nvcc
+CC = gcc
+CARGO = cargo
+
+# Compilation flags
+CUDA_FLAGS = --compiler-options '-fPIC' -c
+CC_FLAGS = -shared
+# Libraries are kept separate from CC_FLAGS so they can be placed after the
+# object files on the link line, which is the order the linker expects.
+# The directory matches the CUDA search path used in build.rs.
+CUDA_LIB_DIR = /usr/local/cuda/lib64
+LDLIBS = -L$(CUDA_LIB_DIR) -lcudart
+
+# Build everything. Declared first so that a bare `make` builds the whole
+# project instead of only the first object file.
+all: rust
+
+# CUDA compilation: produces the object file
+$(CUDA_OBJ): $(CUDA_SRC)
+	$(NVCC) $(CUDA_FLAGS) $(CUDA_SRC) -o $(CUDA_OBJ)
+
+# Create the shared library from the compiled object
+$(CUDA_LIB): $(CUDA_OBJ)
+	$(CC) $(CC_FLAGS) $(CUDA_OBJ) -o $(CUDA_LIB) $(LDLIBS)
+
+# Build the Rust code and link it against the shared library
+rust: $(CUDA_LIB)
+	$(CARGO) build
+
+# Remove generated files
+clean:
+	rm -f $(CUDA_OBJ) $(CUDA_LIB)
+	$(CARGO) clean
+
+.PHONY: all rust clean
diff --git a/rust-cuda-project/README.md b/rust-cuda-project/README.md
@@ -0,0 +1,27 @@
+# Meu Projeto Rust
+
+Este é um projeto de exemplo em Rust.
+
+## Estrutura do Projeto
+
+```
+meu-projeto-rust
+├── src
+│   ├── main.rs
+├── Cargo.toml
+└── README.md
+```
+
+## Como Configurar
+
+Para configurar o projeto, você precisa ter o Rust e o Cargo instalados. Você pode instalar o Rust através do [rustup](https://rustup.rs/).
+
+## Como Executar
+
+Para executar o projeto, navegue até o diretório do projeto e use o seguinte comando:
+
+```
+cargo run
+```
+
+Isso irá compilar e executar o programa.
diff --git a/rust-cuda-project/build.rs b/rust-cuda-project/build.rs
@@ -0,0 +1,6 @@
+// Build script: emits the linker directives for the CUDA dot-product library
+// (libdot_product.so) and for the CUDA runtime it depends on.
+fn main() {
+    // Cargo sets CARGO_MANIFEST_DIR for build scripts. Using it yields an
+    // absolute search path, so the library is found regardless of the working
+    // directory rustc is started from. Fall back to the previous relative "."
+    // if the variable is missing (e.g. the script is run by hand).
+    let lib_dir = std::env::var("CARGO_MANIFEST_DIR").unwrap_or_else(|_| String::from("."));
+    println!("cargo:rustc-link-search={}", lib_dir);
+    println!("cargo:rustc-link-lib=dylib=dot_product");
+    // Location of the CUDA runtime library.
+    println!("cargo:rustc-link-search=native=/usr/local/cuda/lib64");
+    println!("cargo:rustc-link-lib=dylib=cudart");
+}
diff --git a/rust-cuda-project/dot_product.o b/rust-cuda-project/dot_product.o
diff --git a/rust-cuda-project/libdot_product.so b/rust-cuda-project/libdot_product.so
diff --git a/rust-cuda-project/src/dot_product.cu b/rust-cuda-project/src/dot_product.cu
@@ -0,0 +1,66 @@
+// dot_product.cu
+#include <cuda_runtime.h>
+#include <math.h>
+#include <stdio.h>
+#include <stdlib.h>
+
+extern "C" {
+
+// CUDA kernel: every block accumulates its share of the products x[i] * y[i]
+// and writes one partial sum to partial_sum[blockIdx.x].
+//
+// Launch requirements:
+//   - 1-D grid and 1-D block;
+//   - blockDim.x must be a power of two no larger than 256 (the shared cache
+//     has 256 slots and the reduction halves the active range each step);
+//   - partial_sum must have room for gridDim.x doubles.
+__global__ void dot_product_kernel(const double* x, const double* y, double* partial_sum, int n) {
+    __shared__ double cache[256]; // One slot per thread for the block reduction
+    const int cacheIndex = threadIdx.x;
+
+    // Index and stride are 64-bit: with an int index, adding the stride to a
+    // value close to INT_MAX wraps around, the "< n" test keeps succeeding and
+    // the loop reads out of bounds.
+    const long long stride = (long long)blockDim.x * gridDim.x;
+    double temp = 0.0;
+    for (long long idx = (long long)blockIdx.x * blockDim.x + threadIdx.x; idx < n; idx += stride) {
+        temp += x[idx] * y[idx];
+    }
+
+    cache[cacheIndex] = temp;
+
+    // All per-thread sums must be visible before the reduction reads them.
+    __syncthreads();
+
+    // Parallel reduction: each step folds the upper half of the active range
+    // onto the lower half. The barrier sits outside the `if` so that every
+    // thread of the block reaches it.
+    for (int i = blockDim.x / 2; i != 0; i /= 2) {
+        if (cacheIndex < i) {
+            cache[cacheIndex] += cache[cacheIndex + i];
+        }
+        __syncthreads();
+    }
+
+    // Thread 0 publishes the block's total.
+    if (cacheIndex == 0)
+        partial_sum[blockIdx.x] = cache[0];
+}
+
+// Wrapper function meant to be called from Rust: computes the dot product of
+// the host arrays x and y (n doubles each) on the GPU and stores it in *result.
+//
+// The void signature offers no error channel, so a failure (host allocation or
+// any CUDA call) is reported on stderr and signalled by writing NaN to *result.
+// n <= 0 yields 0.0 without touching the device; a NULL result is ignored.
+void dot_product_gpu(const double* x, const double* y, double* result, int n) {
+    const int blocks = 32;
+    const int threads = 256; // Must not exceed the kernel's 256-entry shared cache
+    double *d_x = NULL, *d_y = NULL, *d_partial_sum = NULL;
+    double *h_partial_sum = NULL;
+    double sum = 0.0;
+    cudaError_t err;
+
+    if (result == NULL) {
+        return; // Nowhere to store the answer
+    }
+    if (n <= 0) {
+        // Empty input; also keeps a negative n from turning into a huge size_t.
+        *result = 0.0;
+        return;
+    }
+
+    const size_t vec_bytes = (size_t)n * sizeof(double);
+    const size_t partial_bytes = (size_t)blocks * sizeof(double);
+
+    h_partial_sum = (double*) malloc(partial_bytes);
+    if (h_partial_sum == NULL) {
+        fprintf(stderr, "dot_product_gpu: host allocation failed\n");
+        *result = NAN;
+        return;
+    }
+
+    // Each step runs only if everything before it succeeded; the first error
+    // is kept in err and reported once below.
+    err = cudaMalloc((void**)&d_x, vec_bytes);
+    if (err == cudaSuccess) err = cudaMalloc((void**)&d_y, vec_bytes);
+    if (err == cudaSuccess) err = cudaMalloc((void**)&d_partial_sum, partial_bytes);
+
+    if (err == cudaSuccess) err = cudaMemcpy(d_x, x, vec_bytes, cudaMemcpyHostToDevice);
+    if (err == cudaSuccess) err = cudaMemcpy(d_y, y, vec_bytes, cudaMemcpyHostToDevice);
+
+    if (err == cudaSuccess) {
+        dot_product_kernel<<<blocks, threads>>>(d_x, d_y, d_partial_sum, n);
+        // A launch does not return a status; launch errors must be fetched explicitly.
+        err = cudaGetLastError();
+    }
+
+    // The blocking copy also waits for the kernel and surfaces execution errors.
+    if (err == cudaSuccess) err = cudaMemcpy(h_partial_sum, d_partial_sum, partial_bytes, cudaMemcpyDeviceToHost);
+
+    if (err == cudaSuccess) {
+        // Final reduction of the per-block partial sums on the host.
+        for (int i = 0; i < blocks; i++) {
+            sum += h_partial_sum[i];
+        }
+        *result = sum;
+    } else {
+        fprintf(stderr, "dot_product_gpu: CUDA error: %s\n", cudaGetErrorString(err));
+        *result = NAN;
+    }
+
+    // free(NULL) and cudaFree(NULL) are no-ops, so this is safe on every path.
+    free(h_partial_sum);
+    cudaFree(d_x);
+    cudaFree(d_y);
+    cudaFree(d_partial_sum);
+}
+
+}
diff --git a/rust-cuda-project/src/dot_product.h b/rust-cuda-project/src/dot_product.h
@@ -0,0 +1,16 @@
+// dot_product.h
+
+#ifndef DOT_PRODUCT_H
+#define DOT_PRODUCT_H
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+// Computes the dot product of the n-element arrays x and y and writes it to
+// *result. x, y and result are host pointers: the implementation in
+// dot_product.cu copies the inputs to the GPU and the partial sums back itself.
+void dot_product_gpu(const double* x, const double* y, double* result, int n);
+
+#ifdef __cplusplus
+}
+#endif
+
+#endif
diff --git a/rust-cuda-project/src/main.rs b/rust-cuda-project/src/main.rs
@@ -0,0 +1,25 @@
+use std::ffi::c_double;
+use std::os::raw::c_int;
+
+// FFI binding for the C-linkage wrapper declared in src/dot_product.h:
+// `x` and `y` point to `n` doubles each, and the dot product is written
+// through `result`.
+extern "C" {
+    fn dot_product_gpu(x: *const c_double, y: *const c_double, result: *mut c_double, n: c_int);
+}
+
+/// Computes the dot product of `x` and `y` on the GPU through `dot_product_gpu`.
+///
+/// # Panics
+///
+/// Panics if the slices differ in length, or if their length does not fit in
+/// a C `int` (the type the C side uses for the element count).
+fn vecvecmul(x: &[f64], y: &[f64]) -> f64 {
+    assert_eq!(x.len(), y.len());
+    // A bare `as` cast would silently truncate an oversized length and the GPU
+    // would process the wrong number of elements; fail loudly instead.
+    assert!(
+        x.len() <= c_int::MAX as usize,
+        "vector length {} does not fit in a C int",
+        x.len()
+    );
+    let n = x.len() as c_int;
+    let mut result: f64 = 0.0;
+
+    // SAFETY: both slices hold exactly `n` elements (checked above), so the
+    // pointers are valid for `n` reads; `result` is a live, exclusively
+    // borrowed f64 for the duration of the call.
+    unsafe {
+        dot_product_gpu(x.as_ptr(), y.as_ptr(), &mut result, n);
+    }
+
+    result
+}
+
+/// Demo entry point: runs the GPU dot product on two small vectors and prints
+/// the result.
+fn main() {
+    let lhs: Vec<f64> = vec![1.0, 2.0, 3.0];
+    let rhs: Vec<f64> = vec![4.0, 5.0, 6.0];
+    // Expected value: 1*4 + 2*5 + 3*6 = 32 (`{}` prints an f64 of 32.0 as "32").
+    println!("Produto interno: {}", vecvecmul(&lhs, &rhs));
+}

-Original file line number
+Diff line change
 +# Meu Projeto Rust
++
 +Este é um projeto de exemplo em Rust.
++
 +## Estrutura do Projeto
++
 +```
 +meu-projeto-rust
 +├── src
 +│   ├── main.rs
 +├── Cargo.toml
 +└── README.md
 +```
++
 +## Como Configurar
++
 +Para configurar o projeto, você precisa ter o Rust e o Cargo instalados. Você pode instalar o Rust através do [rustup](https://rustup.rs/).
++
 +## Como Executar
++
 +Para executar o projeto, navegue até o diretório do projeto e use o seguinte comando:
++
 +```
 +cargo run
 +```
++
 +Isso irá compilar e executar o programa.