Submitted vector_search/bacalhau_gpu

This commit is contained in:
FiveMovesAhead 2025-12-02 16:53:37 +00:00
parent bdc6ed6794
commit 3d90630488
4 changed files with 209 additions and 1 deletions

View File

@ -0,0 +1,23 @@
# TIG Code Submission
## Submission Details
* **Challenge Name:** vector_search
* **Algorithm Name:** bacalhau_gpu
* **Copyright:** 2024 Louis Silva
* **Identity of Submitter:** Louis Silva
* **Identity of Creator of Algorithmic Method:** null
* **Unique Algorithm Identifier (UAI):** null
## License
The files in this folder are under the following licenses:
* TIG Benchmarker Outbound License
* TIG Commercial License
* TIG Inbound Game License
* TIG Innovator Outbound Game License
* TIG Open Data License
* TIG THV Game License
Copies of the licenses can be obtained at:
https://github.com/tig-foundation/tig-monorepo/tree/main/docs/licenses

View File

@ -0,0 +1,19 @@
/*!
Copyright 2024 Louis Silva
Licensed under the TIG Inbound Game License v1.0 or (at your option) any later
version (the "License"); you may not use this file except in compliance with the
License. You may obtain a copy of the License at
https://github.com/tig-foundation/tig-monorepo/tree/main/docs/licenses
Unless required by applicable law or agreed to in writing, software distributed
under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
CONDITIONS OF ANY KIND, either express or implied. See the License for the specific
language governing permissions and limitations under the License.
*/
// Intentionally empty placeholder kernel.
// NOTE(review): presumably kept so the build still produces a loadable
// PTX module for this retired algorithm — confirm against the build
// pipeline; the Rust entry point errors out before any kernel launch.
extern "C" __global__ void do_nothing()
{
// This kernel does nothing
}

View File

@ -0,0 +1,165 @@
use anyhow::{anyhow, Result};
use cudarc::{
driver::{safe::LaunchConfig, CudaModule, CudaStream, PushKernelArg},
runtime::sys::cudaDeviceProp,
};
use serde_json::{Map, Value};
use std::sync::Arc;
use tig_challenges::vector_search::{Challenge, Solution};
/// Entry point for the `bacalhau_gpu` vector-search algorithm.
///
/// The algorithm targets an older challenge API and has been retired:
/// it unconditionally returns an error so the benchmarker skips it.
/// The historical implementation is preserved (compiled out) in the
/// `dead_code` module below.
///
/// All parameters are intentionally unused; they are kept — underscore-
/// prefixed to silence `unused_variables` warnings — so the signature
/// continues to match the solver interface expected by callers.
pub fn solve_challenge(
    _challenge: &Challenge,
    _save_solution: &dyn Fn(&Solution) -> anyhow::Result<()>,
    _hyperparameters: &Option<Map<String, Value>>,
    _module: Arc<CudaModule>,
    _stream: Arc<CudaStream>,
    _prop: &cudaDeviceProp,
) -> anyhow::Result<()> {
    Err(anyhow!("This algorithm is no longer compatible."))
}
// Old code that is no longer compatible
// Old code that is no longer compatible
// NOTE: `#[cfg(none)]` never evaluates to true, so this entire module is
// permanently compiled out; it is retained purely as a historical reference.
#[cfg(none)]
mod dead_code {
use anyhow::Result;
use tig_challenges::vector_search::*;
// Squared Euclidean distance between two vectors. The square root is
// skipped: only ordering and comparison against a squared threshold are
// needed, so comparing squared values gives identical results cheaper.
#[inline]
fn squared_distance(v1: &[f32], v2: &[f32]) -> f32 {
v1.iter()
.zip(v2.iter())
.map(|(a, b)| (a - b) * (a - b))
.sum()
}
// CPU brute force: for every query vector, scan the whole database and keep
// the closest entry within `max_distance`. Returns `Ok(None)` as soon as the
// collected results show any query without an in-range neighbour.
pub fn solve_challenge(challenge: &Challenge) -> Result<Option<Solution>> {
// Square the threshold once so each candidate comparison avoids a sqrt.
let max_distance_sq = challenge.max_distance * challenge.max_distance;
let indexes: Vec<Option<usize>> = challenge
.query_vectors
.iter()
.map(|query| {
challenge
.vector_database
.iter()
.enumerate()
.filter_map(|(i, vector)| {
let dist_sq = squared_distance(query, vector);
if dist_sq <= max_distance_sq {
Some((i, dist_sq))
} else {
None
}
})
// `partial_cmp(..).unwrap()` panics only on NaN distances.
// NOTE(review): assumes challenge vectors never contain NaN — confirm.
.min_by(|(_, dist_sq1), (_, dist_sq2)| dist_sq1.partial_cmp(dist_sq2).unwrap())
.map(|(i, _)| i)
})
.collect();
// A solution is valid only if every query found a neighbour in range.
if indexes.iter().all(Option::is_some) {
Ok(Some(Solution {
indexes: indexes.into_iter().map(Option::unwrap).collect(),
}))
} else {
Ok(None)
}
}
// GPU path, built only with the `cuda` feature: one thread per query,
// each thread scanning the full database linearly.
#[cfg(feature = "cuda")]
mod gpu_optimization {
use super::*;
use cudarc::driver::*;
use cudarc::driver::{CudaDevice, CudaFunction};
use std::{collections::HashMap, sync::Arc};
use tig_challenges::CudaKernel;
// Embedded kernel source. NOTE: the database size (100000) and the vector
// dimensionality (250) are hard-coded in the loops below, so the kernel is
// only correct for challenges of exactly that shape. Unlike the CPU path it
// never consults `max_distance` — it always reports the nearest index.
pub const KERNEL: Option<CudaKernel> = Some(CudaKernel {
src: r#"
extern "C" __global__ void find_nearest_neighbors(
const float* __restrict__ vector_database,
const float* __restrict__ query_vectors,
const int num_queries,
int* results
) {
#define FLT_MAX 3.402823466e+38F
int query_idx = blockIdx.x * blockDim.x + threadIdx.x;
if (query_idx >= num_queries) return;
float min_dist = FLT_MAX;
int nearest_idx = 0;
for (int i=0; i < 100000; i++) {
float dist = 0.0f;
for (int j=0; j < 250; j++) {
float diff = query_vectors[query_idx * 250 + j] - vector_database[i * 250 + j];
dist += diff * diff;
}
if (dist < min_dist) {
min_dist = dist;
nearest_idx = i;
}
}
results[query_idx] = nearest_idx;
}
"#,
funcs: &["find_nearest_neighbors"],
});
// Flattens database and queries into contiguous host buffers, copies them to
// the device, launches one thread per query (256-thread blocks), then copies
// the nearest-neighbour indices back to the host.
pub fn cuda_solve_challenge(
challenge: &Challenge,
dev: &Arc<CudaDevice>,
mut funcs: HashMap<&'static str, CudaFunction>,
) -> Result<Option<Solution>> {
let num_query_vectors: usize = challenge.query_vectors.len();
// Row-major flattening: vector i occupies elements [i*dim, (i+1)*dim),
// matching the fixed `* 250` indexing inside the kernel.
let flattened_vector_database: Vec<f32> = challenge
.vector_database
.iter()
.flatten()
.cloned()
.collect();
let flattened_query_vectors: Vec<f32> =
challenge.query_vectors.iter().flatten().cloned().collect();
let d_vector_database = dev.htod_sync_copy(&flattened_vector_database)?;
let d_query_vectors = dev.htod_sync_copy(&flattened_query_vectors)?;
let mut d_results = dev.alloc_zeros::<i32>(num_query_vectors)?;
// Enough 256-thread blocks to cover every query (grid rounded up).
let cfg = LaunchConfig {
block_dim: (256, 1, 1),
grid_dim: (((num_query_vectors + 255) / 256) as u32, 1, 1),
shared_mem_bytes: 0,
};
unsafe {
funcs.remove("find_nearest_neighbors").unwrap().launch(
cfg,
(
&d_vector_database,
&d_query_vectors,
num_query_vectors as i32,
&mut d_results,
),
)?;
}
let mut h_indexes: Vec<i32> = vec![0; num_query_vectors];
dev.dtoh_sync_copy_into(&d_results, &mut h_indexes)?;
let indexes: Vec<usize> = h_indexes.iter().map(|&index| index as usize).collect();
// Always wraps the result in `Some`: no `max_distance` filtering happens
// here, in contrast to the CPU implementation above.
Ok(Some(Solution { indexes }))
}
}
#[cfg(feature = "cuda")]
pub use gpu_optimization::{cuda_solve_challenge, KERNEL};
}
/// Prints a placeholder message; this algorithm provides no usage help.
pub fn help() {
    let message = "No help information available.";
    println!("{}", message);
}

View File

@ -34,7 +34,8 @@
// c004_a018
// c004_a019
pub mod bacalhau_gpu;
// NOTE(review): presumably re-exports the algorithm under its sequential
// challenge/algorithm slot id (matching the `c004_a019` marker above) —
// confirm against the registry's naming scheme.
pub use bacalhau_gpu as c004_a019;
// c004_a020