Able to get matrix math working

2026-06-02 03:40:41 +00:00 · 2025-02-14 10:56:06 -05:00
parent b86ef2201f
commit cfbeaa3ef7
1 changed file with 17 additions and 4 deletions
--- a/self-intention/src/main.rs
+++ b/self-intention/src/main.rs
@@ -1,10 +1,9 @@
 use anyhow::Ok;
 use anyhow::Result;
-use candle_core::Var;
-use candle_core::{DType, Device, Tensor, D};
+use candle_core::{DType, Device, Tensor};
 use candle_nn::ops::softmax;
 use candle_nn::VarBuilder;
-use candle_nn::{linear, Linear, Module, Optimizer, Sequential, VarMap, SGD};
+use candle_nn::{linear, Linear, Module, VarMap};

 struct SelfAttention {
    d: usize, // Embedding size
@@ -34,15 +33,18 @@ impl SelfAttention {

 impl SelfAttention {
    fn attention(&self, x: &Tensor) -> Result<Tensor> {
+        println!("x: {:?}", x);
        let q = self.w_q.forward(x)?;
        let k = self.w_k.forward(x)?;
        let v = self.w_v.forward(x)?;

+        println!("q: {:?}, k: {:?}", q, k);
        let qk = q.matmul(&k.transpose(1, 0)?)?;

        let qk = qk.broadcast_div(&self.scale)?;
        let qk = softmax(&qk, 1)?;

+        println!("qk: {:?}, v: {:?}", qk, v);
        Ok(qk.matmul(&v)?)
    }
 }
@@ -50,7 +52,18 @@ fn main() -> Result<()> {
    let device = Device::cuda_if_available(0)?;
    let varmap = VarMap::new();
    let vs = VarBuilder::from_varmap(&varmap, DType::F32, &device);
-    let self_attn = SelfAttention::new(4, vs)?;
+    let self_attn = SelfAttention::new(2, vs)?;

+    let encoding_matrix = Tensor::new(
+        vec![
+            vec![1.16 as f32, 0.23 as f32],
+            vec![0.57 as f32, 1.36 as f32],
+            vec![4.41 as f32, -2.16 as f32],
+        ],
+        &device,
+    )?;
+
+    let attn = self_attn.attention(&encoding_matrix)?;
+    println!("{}", attn);
    Ok(())
 }