- Updated stablediffusion crate path from "../stable-diffusion-burn" to "./crates/stable-diffusion-burn" for proper workspace resolution - Enhanced .gitignore to include generated model files (.mpk, .pt, .bin, .safetensors, .ckpt) and user_data directory - Added Cargo.lock to gitignore with appropriate comment - Reorganized IDE files section in gitignore for better clarity - Added newline at end of file for proper formatting
91 lines
3.5 KiB
Rust
91 lines
3.5 KiB
Rust
use super::*;
|
|
use burn_tensor::Tolerance;
|
|
use burn_tensor::{Tensor, TensorData, activation};
|
|
|
|
#[test]
|
|
fn test_softmax_grad() {
|
|
let data_1 = TensorData::from([[0.0, 1.0], [3.0, 4.0]]);
|
|
let data_2 = TensorData::from([[6.0, 7.0], [9.0, 10.0]]);
|
|
let device = Default::default();
|
|
let tensor_1 = Tensor::<TestAutodiffBackend, 2>::from_data(data_1, &device).require_grad();
|
|
let tensor_2 = Tensor::<TestAutodiffBackend, 2>::from_data(data_2, &device).require_grad();
|
|
|
|
let tensor_3 = tensor_1.clone().matmul(tensor_2.clone());
|
|
let tensor_4 = activation::softmax(tensor_3, 1).matmul(tensor_2.clone());
|
|
|
|
let grads = tensor_4.backward();
|
|
let grad_1 = tensor_1.grad(&grads).unwrap();
|
|
let grad_2 = tensor_2.grad(&grads).unwrap();
|
|
|
|
let expected = TensorData::from([[1.179665, 1.179661], [0.005462, 0.005463]]);
|
|
|
|
grad_1
|
|
.to_data()
|
|
.assert_approx_eq::<FloatElem>(&expected, Tolerance::rel_abs(0.05, 0.5));
|
|
|
|
let expected = TensorData::from([[0.253469, 0.286237], [0.528630, 2.931664]]);
|
|
grad_2
|
|
.to_data()
|
|
.assert_approx_eq::<FloatElem>(&expected, Tolerance::rel_abs(0.05, 0.05));
|
|
}
|
|
|
|
#[test]
|
|
fn test_log_softmax_grad() {
|
|
let data_1 = TensorData::from([[0.0, 1.0], [3.0, 4.0]]);
|
|
let data_2 = TensorData::from([[6.0, 7.0], [9.0, 10.0]]);
|
|
let device = Default::default();
|
|
let tensor_1 = Tensor::<TestAutodiffBackend, 2>::from_data(data_1, &device).require_grad();
|
|
let tensor_2 = Tensor::<TestAutodiffBackend, 2>::from_data(data_2, &device).require_grad();
|
|
|
|
let tensor_3 = tensor_1.clone().matmul(tensor_2.clone());
|
|
let tensor_4 = activation::log_softmax(tensor_3, 1).matmul(tensor_2.clone());
|
|
|
|
let grads = tensor_4.backward();
|
|
let grad_1 = tensor_1.grad(&grads).unwrap();
|
|
let grad_2 = tensor_2.grad(&grads).unwrap();
|
|
|
|
let expected = TensorData::from([[-4.3939, -4.3939], [-12.9709, -12.9709]]);
|
|
// f16 gradients from log-softmax + matmul amplify error, so we increase the tolerance
|
|
// to account for limited precision and large representable step sizes in this range.
|
|
let tolerance = Tolerance::permissive().set_half_precision_relative(6e-2);
|
|
|
|
grad_1
|
|
.to_data()
|
|
.assert_approx_eq::<FloatElem>(&expected, tolerance);
|
|
|
|
let expected = TensorData::from([[30.5984, -47.2267], [55.9631, -56.5914]]);
|
|
grad_2
|
|
.to_data()
|
|
.assert_approx_eq::<FloatElem>(&expected, tolerance);
|
|
}
|
|
|
|
#[test]
|
|
fn test_quiet_softmax_grad() {
|
|
let data_1 = TensorData::from([[0.0, 1.0], [3.0, 4.0]]);
|
|
let data_2 = TensorData::from([[6.0, 7.0], [9.0, 10.0]]);
|
|
|
|
let device = Default::default();
|
|
let tensor_1 = Tensor::<TestAutodiffBackend, 2>::from_data(data_1, &device).require_grad();
|
|
let tensor_2 = Tensor::<TestAutodiffBackend, 2>::from_data(data_2, &device).require_grad();
|
|
|
|
let tensor_3 = tensor_1.clone().matmul(tensor_2.clone());
|
|
let tensor_4 = activation::softmax(tensor_3, 1).matmul(tensor_2.clone());
|
|
|
|
let grads = tensor_4.backward();
|
|
let grad_1 = tensor_1.grad(&grads).unwrap();
|
|
let grad_2 = tensor_2.grad(&grads).unwrap();
|
|
|
|
let expected = TensorData::from([[1.179665, 1.179661], [0.005462, 0.005463]]);
|
|
|
|
// Precision is quite bad yet on softmax grad especially with half precision.
|
|
let tolerance = Tolerance::rel_abs(0.5, 0.2);
|
|
grad_1
|
|
.to_data()
|
|
.assert_approx_eq::<FloatElem>(&expected, tolerance);
|
|
|
|
let expected = TensorData::from([[0.253469, 0.286237], [0.528630, 2.931664]]);
|
|
grad_2
|
|
.to_data()
|
|
.assert_approx_eq::<FloatElem>(&expected, tolerance);
|
|
}
|