Libtorch nightly declaration file + regen #1

JQuezada0 · 2024-01-06T03:18:31Z

MacBook Pro (M1 Pro, 16 GB), macOS 14.1.1

Testing

This test snippet was pieced together from three sources: the tch-rs repo, this issue, and @ssoudan's example (linked here) of using conda to get tch-rs working on an M1 Mac.

use std::time::{Duration, Instant};

use tch::nn::ModuleT;
use tch::{self, Kind};
use tch::{kind, Tensor};

// MPS device constant. NOTE(review): none of the functions visible in this
// snippet reference it; they name `tch::Device::Mps` directly or take the
// device as a parameter — confirm whether this constant is still needed.
const DEVICE: tch::Device = tch::Device::Mps;

/// Builds a small feed-forward network: a 784 -> 128 linear layer, a ReLU,
/// and a 128 -> 10 linear layer.
///
/// The first linear layer is registered under the `layer1` sub-path of `vs`;
/// the second one is registered directly on `vs`.
fn test_simple(vs: &tch::nn::Path) -> tch::nn::Sequential {
    const IN_FEATURES: i64 = 784;
    const HIDDEN_UNITS: i64 = 128;
    const OUT_CLASSES: i64 = 10;

    // Create the layers in the order they are applied, so the variables are
    // registered in the same sequence as before.
    let hidden = tch::nn::linear(
        vs / "layer1",
        IN_FEATURES,
        HIDDEN_UNITS,
        Default::default(),
    );
    let output = tch::nn::linear(vs, HIDDEN_UNITS, OUT_CLASSES, Default::default());

    tch::nn::seq()
        .add(hidden)
        .add_fn(|activations| activations.relu())
        .add(output)
}

/// Times repeated forward passes of the `test_simple` model on `device` and
/// prints the elapsed wall-clock time.
///
/// Every iteration creates a fresh random `[128, 784]` float tensor on
/// `device` and feeds it through the model with `train = false`. Input
/// generation happens inside the timed region, so it is part of the
/// reported duration.
fn speed_test(device: tch::Device) {
    // One constant drives both the loop bound and the printed count, so the
    // report always matches the work actually performed.
    const ITERATIONS: usize = 10_000;

    let vs = tch::nn::VarStore::new(device);
    let model = test_simple(&vs.root());

    let start = Instant::now();
    for _ in 0..ITERATIONS {
        // The output is discarded; only the cost of producing it is of interest.
        let _ = model.forward_t(
            &tch::Tensor::rand(&[128, 784], (Kind::Float, device)),
            false,
        );
    }
    let duration: Duration = start.elapsed();
    println!(
        "Time for {} iterations {:?} on `{:?}` device",
        ITERATIONS, duration, device
    );
}

/// Evaluates `y = x * x + x + 36` at `x = 2.0` on the MPS device, then prints
/// `y` and the gradient of `y` with respect to `x`.
fn grad_example() {
    // Scalar input moved to MPS, with gradient tracking switched on.
    let on_mps = Tensor::from(2.0f32).to_device(tch::Device::Mps);
    let mut x = on_mps.set_requires_grad(true);

    let y = &x * &x + &x + 36;
    let y_value = y.double_value(&[]);
    println!("y {}", y_value);

    // Reset x's gradient before back-propagating from y.
    x.zero_grad();
    y.backward();

    let gradient = x.grad();
    let gradient_value = gradient.double_value(&[]);
    println!("dy/dx {}", gradient_value);
}

/// Smoke test: prints a tensor built from a slice, prints a random `[5, 4]`
/// tensor after moving it to the MPS device, and then runs `grad_example`.
fn test_cpu_and_gpu() {
    let cpu_tensor = Tensor::from_slice(&[3, 1, 4, 1, 5]);
    cpu_tensor.print(); // works on CPU tensors

    println!("t(cpu) {:?}", cpu_tensor);
    println!("t device: {:?}", cpu_tensor.device());

    // Created with the CPU float options first, then transferred to MPS.
    let host_random = Tensor::randn([5, 4], kind::FLOAT_CPU);
    let mps_tensor = host_random.to_device(tch::Device::Mps);
    mps_tensor.print();
    println!("t(mps) {:?}", mps_tensor);
    println!("t device: {:?}", mps_tensor.device());

    grad_example();

    println!("ran grad example!");
}

/// Entry point: runs the tensor/gradient smoke test, then the forward-pass
/// timing on the CPU device followed by the MPS device.
fn main() {
    test_cpu_and_gpu();

    // Same order as before: CPU first, then MPS.
    for device in [tch::Device::Cpu, tch::Device::Mps] {
        speed_test(device);
    }
}

JQuezada0 added 2 commits January 5, 2024 22:08

add declaration file and regen

ee88740

format

7380712

JQuezada0 mentioned this pull request Jan 6, 2024

Documentation for use on Apple Silicon LaurentMazare/tch-rs#488

Open

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Libtorch nightly declaration file + regen #1

Libtorch nightly declaration file + regen #1

JQuezada0 commented Jan 6, 2024

Libtorch nightly declaration file + regen #1

Are you sure you want to change the base?

Libtorch nightly declaration file + regen #1

Conversation

JQuezada0 commented Jan 6, 2024

Testing