!*rm -f go.work && go work init && go work use . "${HOME}/Projects/gomlx"
%goworkfix

	- Added replace rule for module "github.com/gomlx/gomlx" to local directory "/home/janpf/Projects/gomlx".

import . "github.com/gomlx/gomlx/pkg/core/graph"

// Sum builds the graph node that adds the two given nodes.
func Sum(a, b *Node) *Node {
    sum := Add(a, b)
    return sum
}

%env GOMLX_BACKEND=xla:cpu

import _ "github.com/gomlx/gomlx/backends/default"

// backend is the backend instance handed to the executors created in this notebook.
// NOTE(review): presumably backends.MustNew honors the GOMLX_BACKEND value set above — confirm.
var backend = backends.MustNew()

%%

// Short version: `ExecOnce` will compile the function and execute only once.
two, err := ExecOnce(backend, /* GoMLX function */ Sum, /* Arguments */ 1.0, 1.0)
if err != nil { panic(err) }
fmt.Printf("Short version:\t1+1=%v\n", two)

// Exec version: `NewExec` will compile the Sum function so it can be executed efficiently
// many times.
exec, err := NewExec(backend, Sum)
if err != nil { panic(err) }
results, err := exec.Exec(1, 1)
if err != nil { panic(err) }
two = results[0]
fmt.Printf("Exec version:\t1+1=%v\n", two)

Set: GOMLX_BACKEND="xla:cpu"
Short version:	1+1=float64(2)
Exec version:	1+1=int64(2)

import (
    "fmt"
    . "github.com/gomlx/gomlx/pkg/core/graph"
)

// Sum is the symbolic function (it creates a graph) that sums two numbers.
// Every time it is called to build a graph it prints the graph id and the operand shapes.
func Sum(a, b *Node) *Node {
    // Id of the graph on which this symbolic computation is being built.
    graphID := a.Graph().GraphId()
    fmt.Printf("\n- Building graph (GraphId=%d) for a.shape=%s and b.shape=%s\n", graphID, a.Shape(), b.Shape())
    return Add(a, b)
}


// main runs Sum through one executor with int scalars, float scalars and a float32 slice,
// printing each result.
func main() {
    adder := MustNewExec(backend, Sum)
    fmt.Printf("\t1+1=%s\n", adder.MustExec1(1, 1))

    // Five more calls, all with a pair of ints.
    for n := range 5 {
        fmt.Printf("\t%d+%d=%s\n", n, n, adder.MustExec1(n, n))
    }

    // Float64 scalars.
    fmt.Printf("\t3.5+1.5=%s\n", adder.MustExec1(3.5, 1.5))

    // A float32 slice plus a float32 scalar.
    vectorSum := adder.MustExec1([]float32{1.1, 2.2, 3.3}, float32(10))
    fmt.Printf("\t[1.1, 2.2, 3.3] + 10 = %s\n", vectorSum)
}

- Building graph (GraphId=0) for a.shape=(Int64) and b.shape=(Int64)
	1+1=int64(2)
	0+0=int64(0)
	1+1=int64(2)
	2+2=int64(4)
	3+3=int64(6)
	4+4=int64(8)

- Building graph (GraphId=1) for a.shape=(Float64) and b.shape=(Float64)
	3.5+1.5=float64(5)

- Building graph (GraphId=2) for a.shape=(Float32)[3] and b.shape=(Float32)
	[1.1, 2.2, 3.3] + 10 = [3]float32{11.1, 12.2, 13.3}

%%
sumExec := MustNewExec(backend, Sum)
_, err := sumExec.Exec(1.1, 2) // Error: arguments have different dtypes Float64 and Int64.
klog.Errorf("%+v\n", err)

- Building graph (GraphId=0) for a.shape=(Float64) and b.shape=(Int64)

E1011 09:48:27.498153  999407 main.go:28] cannot broadcast Float64 and Int64 for "Add": they have different dtypes
github.com/gomlx/gomlx/backends/stablehlo.(*Builder).broadcastForBinaryOps
	/home/janpf/Projects/gomlx/backends/stablehlo/builder.go:213
github.com/gomlx/gomlx/backends/stablehlo.(*Builder).Add
	/home/janpf/Projects/gomlx/backends/stablehlo/gen_binary_ops.go:13
github.com/gomlx/gomlx/pkg/core/graph.Add
	/home/janpf/Projects/gomlx/pkg/core/graph/gen_backend_ops.go:191
main.Sum
	 [[ Cell Line 0 ]] /tmp/gonb_099774e5/main.go:20
reflect.Value.call
	/snap/go/current/src/reflect/value.go:581
reflect.Value.Call
	/snap/go/current/src/reflect/value.go:365
github.com/gomlx/gomlx/pkg/core/graph.(*Exec).createAndCacheGraph
	/home/janpf/Projects/gomlx/pkg/core/graph/exec.go:539
github.com/gomlx/gomlx/pkg/core/graph.(*Exec).findOrCreateGraph
	/home/janpf/Projects/gomlx/pkg/core/graph/exec.go:598
github.com/gomlx/gomlx/pkg/core/graph.(*Exec).compileAndExecute
	/home/janpf/Projects/gomlx/pkg/core/graph/exec.go:447
github.com/gomlx/gomlx/pkg/core/graph.(*Exec).ExecWithGraph.func1
	/home/janpf/Projects/gomlx/pkg/core/graph/exec.go:392
github.com/gomlx/gomlx/internal/exceptions.TryCatch[...]
	/home/janpf/Projects/gomlx/internal/exceptions/exceptions.go:90
github.com/gomlx/gomlx/pkg/core/graph.(*Exec).ExecWithGraph
	/home/janpf/Projects/gomlx/pkg/core/graph/exec.go:391
github.com/gomlx/gomlx/pkg/core/graph.(*Exec).Exec
	/home/janpf/Projects/gomlx/pkg/core/graph/exec.go:377
main.main
	 [[ Cell [5] Line 3 ]] /tmp/gonb_099774e5/main.go:27
runtime.main
	/snap/go/current/src/runtime/proc.go:285
runtime.goexit
	/snap/go/current/src/runtime/asm_amd64.s:1693

%%
onePlusExec := MustNewExec(backend, func (x *Node) *Node {
    return OnePlus(x)
})
// exec.MustExec1 will return a *tensor.Tensor.
counter := onePlusExec.MustExec1(0)
// counter.String() will first transfer counter to local (using counter.Local()) to print its values.
fmt.Printf("counter.type=%T, counter=%s\n", counter, counter.String())
for ii := 0; ii < 10; ii++ {
    // Since the counter is not being used locally between the calls, the tensor will only use the
    // device storage.
    counter = onePlusExec.MustExec1(counter)
}
// Again counter.String() (called implicitly by fmt.Printf) will first transfer the counter value locally, and then convert to a Go value.
fmt.Printf("counter=%v\n", counter)

counter.type=*tensors.Tensor, counter=int64(1)
counter=int64(11)

// f builds the graph for x² + x·y.
func f(x, y *Node) *Node {
    xSquared := Square(x)
    xTimesY := Mul(x, y)
    return Add(xSquared, xTimesY)
}

// gradOfF returns f(x, y) together with the gradients of its all-reduced sum with respect
// to x and to y.
func gradOfF(x, y *Node) (output, gradX, gradY *Node) {
    output = f(x, y)
    // The gradient is taken of the sum of all elements, in case x and y are not scalars.
    total := ReduceAllSum(output)
    partials := Gradient(total, x, y)
    return output, partials[0], partials[1] // f, df/dx, df/dy
}

%%
exec := MustNewExec(backend, gradOfF)
x := []float64{0, 1, 2}
y := []float64{10, 20, 30}
output, gradX, gradY := exec.MustExec3(x, y)
fmt.Printf("f(x=%v, y=%v)=%s,\n\tdf/dx=%s,\n\tdf/dy=%s\n", x, y, output, gradX, gradY)

f(x=[0 1 2], y=[10 20 30])=[3]float64{0, 21, 64},
	df/dx=[3]float64{10, 22, 34},
	df/dy=[3]float64{0, 1, 2}

// Removing the previous definitions of `f` and `gradOfF`
%rm gradOfF f

. removed func gradOfF
. removed func f

import "github.com/gomlx/gomlx/pkg/ml/context"

%%
ctx := context.New()
exec := context.MustNewExec(backend, ctx, func(ctx *context.Context, g *Graph) *Node {
    // The variable "count" is given the value int32(10); each execution reads it, adds one and
    // stores the result back into the variable.
    counterVar := ctx.VariableWithValue("count", int32(10))
    count := counterVar.ValueGraph(g)
    count = AddScalar(count, 1)
    counterVar.SetValueGraph(count)
    return count
})
fmt.Println("Counting:")
for range 3 {
    fmt.Printf("\tcount=%s\n", exec.MustExec1())
}
// Read the variable's tensor back from the context. The tensor's Value() is a plain Go int32,
// which is not a string and has no String method, so it must be printed with %v: with %s fmt
// emits "%!s(int32=13)" instead of the number.
counterTensor := ctx.InspectVariable(ctx.Scope(), "count").Value()
fmt.Printf("- State of counter=%v\n", counterTensor.Value())

Counting:
	count=int32(11)
	count=int32(12)
	count=int32(13)
- State of counter=%!s(int32=13)

import "flag"

// Command-line flags for the quadratic minimization example.
var (
    // Coefficients of the equation ax^2+bx+c.
    flagA = flag.Float64("a", 1.0, "Value of a in the equation ax^2+bx+c")
    flagB = flag.Float64("b", 2.0, "Value of b in the equation ax^2+bx+c")
    flagC = flag.Float64("c", 4.0, "Value of c in the equation ax^2+bx+c")

    // Gradient descent settings.
    flagNumSteps     = flag.Int("steps", 10, "Number of gradient descent steps to perform")
    flagLearningRate = flag.Float64("lr", 0.1, "Initial learning rate.")
)

// f builds the graph for f(x) = ax^2 + bx + c, with a, b and c read from the
// flagA, flagB and flagC command-line flags.
func f(x *Node) *Node {
    quadratic := MulScalar(Square(x), *flagA) // ax^2
    linear := MulScalar(x, *flagB)            // bx
    return AddScalar(Add(quadratic, linear), *flagC)
}

// minimizeF does one gradient descent step on f by moving the variable "x".
// It returns f evaluated at the value "x" held before this step's update.
func minimizeF(ctx *context.Context, graph *Graph) *Node {
    // Create the variable "x", or reuse it if it already exists. This is only a reference:
    // no graph operation is created by it.
    xVar := ctx.VariableWithShape("x", shapes.Make(dtypes.Float64))

    xNow := xVar.ValueGraph(graph) // Value of the variable in the current graph.
    fx := f(xNow)                  // f(x).

    // Gradient always returns a slice; its first element is the gradient with respect to x.
    dfdx := Gradient(fx, xNow)[0]

    // stepNum += 1. The variable is created if it does not exist yet, otherwise it is retrieved.
    stepVar := ctx.VariableWithValue("stepNum", 0.0)
    stepCount := OnePlus(stepVar.ValueGraph(graph))
    stepVar.SetValueGraph(stepCount)

    // x += -learningRate * dfdx / Sqrt(stepNum)
    delta := MulScalar(Div(dfdx, Sqrt(stepCount)), -*flagLearningRate)
    xVar.SetValueGraph(Add(xNow, delta))
    return fx
}

// Solve runs minimizeF repeatedly on a fresh context and prints the final "x", the last
// value returned for f(x), and the "stepNum" variable.
func Solve() {
    ctx := context.New()
    stepExec := context.MustNewExec(backend, ctx, minimizeF)

    // Every step but the last discards its output; the last one's output is reported below.
    discarded := *flagNumSteps - 1
    for range discarded {
        _ = stepExec.MustExec()
    }
    fx := stepExec.MustExec1()

    scope := ctx.Scope()
    xTensor := ctx.InspectVariable(scope, "x").Value()
    stepsTensor := ctx.InspectVariable(scope, "stepNum").Value()
    fmt.Printf("Minimum found at x=%g, f(x)=%g after %f steps.\n", xTensor.Value(), fx.Value(), stepsTensor.Value())
}

%% --a=1 --b=2 --c=3 --steps=10 --lr=0.5
Solve()

Minimum found at x=-1, f(x)=2 after 10.000000 steps.

%% --a=2 --b=12 --c=20 --steps=10 --lr=0.5
Solve()

Minimum found at x=-3, f(x)=2 after 10.000000 steps.

// Parameters used by initCoefficients to generate the target coefficients and bias: each
// RandomNormal sample is multiplied by the corresponding Sigma and then shifted by the Mu.
const (
    CoefficientMu    = 0.0
    CoefficientSigma = 5.0
    BiasMu           = 1.0
    BiasSigma        = 10.0
)

import (
    "github.com/gomlx/gomlx/pkg/core/shapes"
    "github.com/gomlx/gomlx/pkg/core/tensors"
)

// initCoefficients draws numVariables random coefficients and one random bias. These are the
// true values the model will attempt to learn.
func initCoefficients(backend backends.Backend, numVariables int) (coefficients, bias *tensors.Tensor) {
    sampler := MustNewExec(backend, func(g *Graph) (*Node, *Node) {
        rng := Const(g, RngState())

        // Coefficients: numVariables samples, scaled by CoefficientSigma and shifted by CoefficientMu.
        rng, rawCoef := RandomNormal(rng, shapes.Make(dtypes.Float64, numVariables))
        coefNode := AddScalar(MulScalar(rawCoef, CoefficientSigma), CoefficientMu)

        // Bias: one scalar sample, scaled by BiasSigma and shifted by BiasMu.
        _, rawBias := RandomNormal(rng, shapes.Make(dtypes.Float64))
        biasNode := AddScalar(MulScalar(rawBias, BiasSigma), BiasMu)
        return coefNode, biasNode
    })
    coefficients, bias = sampler.MustExec2()
    return coefficients, bias
}

%%
coef, bias := initCoefficients(backend, 3)
fmt.Printf("Example of target: coefficients=%0.3v, bias=%0.3v\n", coef.Value(), bias.Value())

Example of target: coefficients=[-1.03 6.14 3.05], bias=-18.1

// buildExamples generates numExamples random inputs and the labels given by the linear function
// defined by coef and bias. When noise > 0, random noise scaled by noise is added to the labels.
func buildExamples(backend backends.Backend, coef, bias *tensors.Tensor, numExamples int, noise float64) (inputs, labels *tensors.Tensor) {
    generator := MustNewExec(backend, func(coef, bias *Node) (*Node, *Node) {
        numFeatures := coef.Shape().Dimensions[0]

        // Random inputs (observations): numExamples rows of numFeatures values.
        rng := Const(coef.Graph(), RngState())
        rng, observations := RandomNormal(rng, shapes.Make(coef.DType(), numExamples, numFeatures))

        // Perfect labels: sum of inputs*coef over the last axis (which is kept), plus the bias.
        weights := ExpandDims(coef, 0)
        targets := ReduceAndKeep(Mul(observations, weights), ReduceSum, -1)
        targets = Add(targets, bias)

        if noise > 0 {
            // Add some noise to the labels.
            _, jitter := RandomNormal(rng, targets.Shape())
            targets = Add(targets, MulScalar(jitter, noise))
        }
        return observations, targets
    })
    inputs, labels = generator.MustExec2(coef, bias)
    return inputs, labels
}

%%
coef, bias := initCoefficients(backend, 3)
numExamples := 5
inputsTensor, labelsTensor := buildExamples(backend, coef, bias, numExamples, 0.2)
fmt.Printf("Target: coefficients=%0.3v, bias=%0.3v\n", coef.Value(), bias.Value())

fmt.Printf("%d dataset examples:\n", numExamples)
inputs := inputsTensor.Value().([][]float64)
labels := labelsTensor.Value().([][]float64)
for ii := 0; ii < numExamples; ii ++ {
    fmt.Printf("\tx=%0.3v; label=%0.3v\n", inputs[ii], labels[ii])
}

Target: coefficients=[0.728 -6.22 8.15], bias=-24.2
5 dataset examples:
	x=[1.73 0.207 0.162]; label=[-22.8]
	x=[-1.17 0.725 0.0552]; label=[-29]
	x=[0.617 1.31 0.898]; label=[-24.5]
	x=[-0.214 -0.102 1.3]; label=[-13.1]
	x=[1.16 0.758 0.545]; label=[-23.8]

import "github.com/gomlx/gomlx/pkg/ml/train"

// TrivialDataset is a dataset that returns the whole data every time it is asked to yield.
type TrivialDataset struct {
    name   string
    inputs []*tensors.Tensor
    labels []*tensors.Tensor
}

// Compile-time assertion that *TrivialDataset implements train.Dataset.
var _ train.Dataset = (*TrivialDataset)(nil)

// Name implements train.Dataset.
func (d *TrivialDataset) Name() string {
    return d.name
}

// Yield implements train.Dataset. It returns the dataset itself as the spec, along with all of
// its inputs and labels, and a nil error.
func (d *TrivialDataset) Yield() (spec any, inputs, labels []*tensors.Tensor, err error) {
    return d, d.inputs, d.labels, nil
}

// IsOwnershipTransferred returns false: the dataset keeps ownership of the yielded tensors,
// and reports that to the training loop.
func (d *TrivialDataset) IsOwnershipTransferred() bool {
    return false
}

// Reset implements train.Dataset. There is nothing to reset.
func (d *TrivialDataset) Reset() {
}

// ModelFn is the signature of a model-building function: given a context, a dataset spec and the
// input nodes, it returns the prediction nodes.
// NOTE(review): shown for reference; presumably mirrors the type train.NewTrainer expects — confirm.
type ModelFn func(ctx *context.Context, spec any, inputs []*graph.Node) (predictions []*graph.Node)

import "github.com/gomlx/gomlx/pkg/ml/context"

// modelGraph is the linear model: one dense layer with bias and a single output, applied to
// the first input.
func modelGraph(ctx *context.Context, spec any, inputs []*Node) []*Node {
    _ = spec // Not needed here, we know the dataset.
    features := inputs[0]
    prediction := layers.DenseWithBias(ctx, features, 1) // outputDim = 1
    return []*Node{prediction}
}

import (
    "os"
    "github.com/gomlx/gomlx/ui/commandline"
    "github.com/gomlx/gomlx/pkg/ml/layers/regularizers"
)

// Command-line flags for the linear model training example.
var (
    // Synthetic data generation.
    flagNumExamples = flag.Int("num_examples", 10000, "Number of examples to generate")
    flagNumFeatures = flag.Int("num_features", 3, "Number of features")
    flagNoise       = flag.Float64("noise", 0.2, "Noise in synthetic data generation")

    // Gradient descent settings.
    flagNumSteps     = flag.Int("steps", 100, "Number of gradient descent steps to perform")
    flagLearningRate = flag.Float64("lr", 0.1, "Initial learning rate.")
)

// AttachToLoop decorates the training loop; in this version it only adds a progress bar.
// It will be redefined later.
func AttachToLoop(loop *train.Loop) {
    // Attach a progress bar to the loop.
    commandline.AttachProgressBar(loop)
}

// TrainMain does everything needed to train the linear model: it picks the target coefficients,
// generates noisy data from them, trains for *flagNumSteps steps and prints the learned values.
func TrainMain() {
    flag.Parse()

    // Select the coefficients that the model will try to predict.
    targetCoef, targetBias := initCoefficients(backend, *flagNumFeatures)
    fmt.Printf("Target: coefficients=%0.3v, bias=%0.3v\n", targetCoef.Value(), targetBias.Value())

    // Generate the training data, with noise.
    inputs, labels := buildExamples(backend, targetCoef, targetBias, *flagNumExamples, *flagNoise)
    fmt.Printf("Training data (inputs, labels): (%s, %s)\n\n", inputs.Shape(), labels.Shape())
    dataset := &TrivialDataset{
        name:   "linear",
        inputs: []*tensors.Tensor{inputs},
        labels: []*tensors.Tensor{labels},
    }

    // The context holds the learned weights and bias, along with the hyperparameters.
    ctx := context.New()
    ctx.SetParam(optimizers.ParamLearningRate, *flagLearningRate) // = "learning_rate"
    ctx.SetParam(regularizers.ParamL2, 1e-3)                      // 1e-3 of L2 regularization.

    // train.Trainer executes a training step. The two nil arguments are trainMetrics and evalMetrics.
    trainer := train.NewTrainer(backend, ctx, modelGraph,
        losses.MeanSquaredError,
        optimizers.StochasticGradientDescent(),
        nil, nil)
    loop := train.NewLoop(trainer)
    AttachToLoop(loop)

    // Loop for the given number of steps. must.M1() panics if loop.RunSteps returns an error.
    // The returned metrics are not of interest in this example.
    _ = must.M1(loop.RunSteps(dataset, *flagNumSteps))

    // Print the learned coefficients and bias, taken from the weights in the dense layer.
    fmt.Println()
    coefVar := ctx.GetVariableByScopeAndName("/dense", "weights")
    biasVar := ctx.GetVariableByScopeAndName("/dense", "biases")
    coefTensor, biasTensor := coefVar.Value(), biasVar.Value()
    fmt.Printf("Learned: coefficients=%0.3v, bias=%0.3v\n", coefTensor.Value(), biasTensor.Value())
}

%%
TrainMain()

Target: coefficients=[-5.96 5.39 0.652], bias=13.7
Training data (inputs, labels): ((Float64)[10000 3], (Float64)[10000 1])

       100% [========================================] (12516 steps/s) [step=99] [loss+=0.225] [~loss+=13] [~loss=12.9]        ]

Learned: coefficients=[[-5.83] [5.26] [0.649]], bias=[13.4]

import "github.com/gomlx/gomlx/ui/gonb/plotly"
import "os"

// AttachToLoop decorates the training loop with a progress bar and a dynamic plotly plot.
func AttachToLoop(loop *train.Loop) {
    // Attach a progress bar to the loop.
    commandline.AttachProgressBar(loop)

    // NOTE(review): 50 and 1.1 presumably set the plot's update schedule — confirm against plotly docs.
    plotter := plotly.New().Dynamic()
    _ = plotter.ScheduleExponential(loop, 50, 1.1)
}

%% --steps=5000
TrainMain()

Target: coefficients=[-10.3 3.62 3.39], bias=10.3
Training data (inputs, labels): ((Float64)[10000 3], (Float64)[10000 1])

         3% [>.......................................] (16238 steps/s) [0s:0s] [step=164] [loss+=0.182] [~loss+=6.15] [~loss=6.04]

       100% [========================================] (14194 steps/s) [step=4999] [loss+=0.172] [~loss+=0.172] [~loss=0.0414]

Learned: coefficients=[[-10.3] [3.62] [3.38]], bias=[10.3]

    batch_size := inputs[0].Shape().Dimensions[0]
    ...
    layer := Concatenate(allEmbeddings, -1)
    layer.AssertDims(batchSize, -1)  // 2D tensor, with batch size as the leading dimension.

GoMLX Tutorial¶

Note: Output Not Displaying in JupyterLab ?¶

Computation Graphs (or Symbolic Computation)¶

Backends and executing Graphs with `graph.Exec`¶

`Exec` aliases:¶

Error Handling¶

Tensors¶

New tensors¶

Gradients¶

Machine Learning with GoMLX¶

Variables and Context¶

Finding $argmin_{x}{f(x)}$ example¶

Training a machine learning model¶

Dataset¶

ModelFn¶

Trainer and Loop¶

Training and Plotting¶

Other examples¶

Debugging¶

Good old "printf"¶

Errors in GoMLX have stacktrace¶

Node Shape Asserts¶

Graph Execution Logging¶

Catching `NaN` and `Inf` in your training¶

More Debugging¶

GoMLX Tutorial¶

Note: Output Not Displaying in JupyterLab ?¶

Computation Graphs (or Symbolic Computation)¶

Backends and executing Graphs with graph.Exec¶

Exec aliases:¶

Error Handling¶

Tensors¶

New tensors¶

Gradients¶

Machine Learning with GoMLX¶

Variables and Context¶

Finding $argmin_{x}{f(x)}$ example¶

Training a machine learning model¶

Dataset¶

ModelFn¶

Trainer and Loop¶

Training and Plotting¶

Other examples¶

Debugging¶

Good old "printf"¶

Errors in GoMLX have stacktrace¶

Node Shape Asserts¶

Graph Execution Logging¶

Catching NaN and Inf in your training¶

More Debugging¶

Backends and executing Graphs with `graph.Exec`¶

`Exec` aliases:¶

Catching `NaN` and `Inf` in your training¶