import std.stdio;
import numir;
import grain.autograd; // : Variable, HostStorage;

{
    // zeroGrad clears every accumulated gradient in the model
    auto mlp = MLP!(float, HostStorage)(3);
    mlp.fc1.weight.grad[0] = 1.0;
    mlp.zeroGrad();
    assert(mlp.fc1.weight.grad[0] == 0.0);

    // one SGD step with learning rate 0.5: weight -= 0.5 * grad
    auto sgd = SGD!(typeof(mlp))(mlp, 0.5);
    mlp.fc1.weight.data.zero_();
    mlp.fc1.weight.grad = [[1.0f, 0.0f, 0.0f],
                           [0.0f, 0.0f, 0.0f]].variable.data;
    sgd.update();
    assert(mlp.fc1.weight.sliced == [[-0.5, 0.0, 0.0],
                                     [0.0, 0.0, 0.0]]);
}
version (grain_cuda) {
    // the same checks on the GPU, moving tensors with to!DeviceStorage
    auto mlp = MLP!(float, DeviceStorage)(3);
    mlp.fc1.weight.grad = [[1.0f, 0.0f, 0.0f],
                           [0.0f, 0.0f, 0.0f]].variable.to!DeviceStorage.data;
    mlp.zeroGrad();
    assert(mlp.fc1.weight.to!HostStorage.gradSliced == [[0.0, 0.0, 0.0],
                                                        [0.0, 0.0, 0.0]]);

    auto sgd = SGD!(typeof(mlp))(mlp, 0.5);
    mlp.fc1.weight.data.zero_();
    mlp.fc1.weight.grad = [[1.0f, 0.0f, 0.0f],
                           [0.0f, 0.0f, 0.0f]].variable.to!DeviceStorage.data;
    sgd.update();
    assert(mlp.fc1.weight.to!HostStorage.sliced == [[-0.5, 0.0, 0.0],
                                                    [0.0, 0.0, 0.0]]);
}
stochastic gradient descent (SGD) optimizer: each update() call subtracts lr * grad from every parameter of the registered model
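The assertions in the example above pin down that rule: starting from zero weights with gradient [[1, 0, 0], [0, 0, 0]] and lr = 0.5, the weight becomes [[-0.5, 0, 0], [0, 0, 0]], i.e. data -= lr * grad element-wise. A minimal standalone sketch of that single step in plain D follows; the Param struct and sgdStep function here are illustrative stand-ins, not grain's actual types.

import std.stdio;

// Hypothetical parameter holder for illustration only;
// grain's real Variable/storage types differ.
struct Param {
    float[] data;
    float[] grad;
}

// One vanilla SGD step, element-wise and in place: data[i] -= lr * grad[i].
void sgdStep(ref Param p, float lr) {
    p.data[] -= lr * p.grad[];
}

void main() {
    auto p = Param([0.0f, 0.0f, 0.0f], [1.0f, 0.0f, 0.0f]);
    sgdStep(p, 0.5f);
    writeln(p.data); // [-0.5, 0, 0], matching the first row asserted above
}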