Build status for all platforms: Commercial support:
This directory contains the JavaCPP Presets module for:
- PyTorch 1.13.1
Please refer to the parent README.md file for more detailed information about the JavaCPP Presets.
Java API documentation is available here:
∗ The JNI bindings can instead link with LibTorch, as long as its libraries are from the same version of PyTorch and can be found on the system library path, after setting the "org.bytedeco.javacpp.pathsFirst" system property to "true".
Here is a simple example of PyTorch ported to Java from this C++ source file:
We can use Maven 3 to automatically download and install all the class files as well as the native binaries. To run this sample code, after creating the pom.xml and SimpleMNIST.java
source files below, simply execute on the command line:
$ mvn compile exec:java
<!-- Additional dependencies required to use CUDA, cuDNN, and NCCL -->
<!-- Additional dependencies to use bundled CUDA, cuDNN, and NCCL -->
<!-- Additional dependencies to use bundled full version of MKL -->
// © Copyright 2019, Torch Contributors.
import org.bytedeco.javacpp.*;
import org.bytedeco.pytorch.*;
import org.bytedeco.pytorch.Module;
import static org.bytedeco.pytorch.global.torch.*;
public class SimpleMNIST {
// Define a new Module.
static class Net extends Module {
Net() {
// Construct and register two Linear submodules.
fc1 = register_module("fc1", new LinearImpl(784, 64));
fc2 = register_module("fc2", new LinearImpl(64, 32));
fc3 = register_module("fc3", new LinearImpl(32, 10));
// Implement the Net's algorithm.
Tensor forward(Tensor x) {
// Use one of many tensor manipulation functions.
x = relu(fc1.forward(x.reshape(x.size(0), 784)));
x = dropout(x, /*p=*/0.5, /*train=*/is_training());
x = relu(fc2.forward(x));
x = log_softmax(fc3.forward(x), /*dim=*/1);
return x;
// Use one of many "standard library" modules.
LinearImpl fc1 = null, fc2 = null, fc3 = null;
public static void main(String[] args) throws Exception {
/* try to use MKL when available */
System.setProperty("org.bytedeco.openblas.load", "mkl");
// Create a new Net.
Net net = new Net();
// Create a multi-threaded data loader for the MNIST dataset.
MNISTMapDataset data_set = new MNIST("./data").map(new ExampleStack());
MNISTRandomDataLoader data_loader = new MNISTRandomDataLoader(
data_set, new RandomSampler(data_set.size().get()),
new DataLoaderOptions(/*batch_size=*/64));
// Instantiate an SGD optimization algorithm to update our Net's parameters.
SGD optimizer = new SGD(net.parameters(), new SGDOptions(/*lr=*/0.01));
for (int epoch = 1; epoch <= 10; ++epoch) {
int batch_index = 0;
// Iterate the data loader to yield batches from the dataset.
for (ExampleIterator it = data_loader.begin(); !it.equals(data_loader.end()); it = it.increment()) {
Example batch = it.access();
// Reset gradients.
optimizer.zero_grad();
// Execute the model on the input data.
Tensor prediction = net.forward(batch.data());
// Compute a loss value to judge the prediction of our model.
Tensor loss = nll_loss(prediction, batch.target());
// Compute gradients of the loss w.r.t. the parameters of our model.
loss.backward();
// Update the parameters based on the calculated gradients.
optimizer.step();
// Output the loss and checkpoint every 100 batches.
if (++batch_index % 100 == 0) {
System.out.println("Epoch: " + epoch + " | Batch: " + batch_index
+ " | Loss: " + loss.item_float());
// Serialize your model periodically as a checkpoint.
OutputArchive archive = new OutputArchive();;