```julia
    @variable(model, x[1:layer_size, 1:batch_size] >= 0)
    @objective(model, Min, x[:]'x[:] - 2y[:]'x[:])
    optimize!(model)
-   return value.(x)
+   return Float32.(value.(x))
end
```

```
matrix_relu (generic function with 1 method)
```
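A sanity check on the formulation (not part of the diff): the objective separates over the entries of `x`, and each scalar subproblem is exactly a ReLU,

```math
\min_{x \ge 0} \; x^2 - 2yx \;=\; \min_{x \ge 0} \; (x - y)^2 - y^2,
```

whose minimizer is `max(y, 0) = ReLU(y)`. The new `Float32` conversion of the return value matches the network's `Float32` weights; presumably this is why the "Layer with Float32 parameters got Float64 input" warning, still visible in the old training output below, disappears after this commit.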
Define the reverse differentiation rule for the function we defined above.

```julia
function ChainRulesCore.rrule(::typeof(matrix_relu), y::Matrix{T}) where {T}
    model = Model(() -> DiffOpt.diff_optimizer(Ipopt.Optimizer))
    pv = matrix_relu(y; model = model)
```
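The hunk ends here; the diff omits the unchanged remainder of the `rrule`. For orientation only, a sketch of how such a pullback is typically completed with DiffOpt's reverse mode — the names `dl_dx`, `dl_dq`, `dl_dy`, the `model[:x]` lookup, and the `MOI` alias are assumptions, not the page's verbatim code:

```julia
    # Assumes `import MathOptInterface as MOI` in the page's preamble.
    function pullback_matrix_relu(dl_dx)
        x = model[:x] # the variable matrix created inside matrix_relu
        # Seed the reverse pass with the incoming cotangent dl/dx.
        MOI.set.(model, DiffOpt.ReverseVariablePrimal(), x, dl_dx)
        DiffOpt.reverse_differentiate!(model)
        # Recover dl/dq, the sensitivity w.r.t. the linear objective
        # coefficients q = -2y, then chain through dq/dy = -2.
        obj = MOI.get(model, DiffOpt.ReverseObjectiveFunction())
        dl_dq = JuMP.coefficient.(obj, x)
        dl_dy = -2 .* dl_dq
        return (ChainRulesCore.NoTangent(), dl_dy)
    end
    return pv, pullback_matrix_relu
end
```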
The next hunk shows the tail of the network definition:

```julia
    NNlib.softmax,
) # Total: 4 arrays, 7_960 parameters, 31.297 KiB.
```
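Only the end of the chain is visible above, but the parameter count pins down the rest: 7,960 = 784·10 + 10 + 10·10 + 10, i.e. two `Dense` layers of width 10 around the custom `matrix_relu`. The full definition is presumably along these lines (`inner = 10` is an assumption, consistent with the closing remark about the connectivity `inner`):

```julia
inner = 10 # connectivity of the hidden layer
m = Flux.Chain(
    Flux.Dense(28^2, inner), # 784 => 10: 7_840 weights + 10 biases
    matrix_relu,
    Flux.Dense(inner, 10),   # 10 => 10: 100 weights + 10 biases
    NNlib.softmax,
)
```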
## Prepare data

```julia
N = 1000 # batch size
# Preprocessing train data
-imgs = MLDatasets.MNIST.traintensor(1:N)
-labels = MLDatasets.MNIST.trainlabels(1:N)
+imgs = MLDatasets.MNIST(; split = :train).features[:, :, 1:N]
+labels = MLDatasets.MNIST(; split = :train).targets[1:N]
train_X = float.(reshape(imgs, size(imgs, 1) * size(imgs, 2), N)) # stack images
train_Y = Flux.onehotbatch(labels, 0:9);
# Preprocessing test data
-test_imgs = MLDatasets.MNIST.testtensor(1:N)
-test_labels = MLDatasets.MNIST.testlabels(1:N)
+test_imgs = MLDatasets.MNIST(; split = :test).features[:, :, 1:N]
+test_labels = MLDatasets.MNIST(; split = :test).targets[1:N];
test_X = float.(reshape(test_imgs, size(test_imgs, 1) * size(test_imgs, 2), N))
test_Y = Flux.onehotbatch(test_labels, 0:9);
```
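As a quick sanity check (not part of the diff, and assuming the standard 28×28 MNIST images), the preprocessing yields:

```julia
size(imgs)    # (28, 28, 1000): N raw images
size(train_X) # (784, 1000): one flattened image per column
size(train_Y) # (10, 1000): one-hot columns over the digits 0:9
```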
The deprecated accessors filled the old example output with warnings, which the new accessors silence:

```
┌ Warning: MNIST.traintensor() is deprecated, use `MNIST(split=:train).features` instead.
└ @ MLDatasets ~/.julia/packages/MLDatasets/0MkOE/src/datasets/vision/mnist.jl:157
┌ Warning: MNIST.trainlabels() is deprecated, use `MNIST(split=:train).targets` instead.
└ @ MLDatasets ~/.julia/packages/MLDatasets/0MkOE/src/datasets/vision/mnist.jl:173
┌ Warning: MNIST.testtensor() is deprecated, use `MNIST(split=:test).features` instead.
└ @ MLDatasets ~/.julia/packages/MLDatasets/0MkOE/src/datasets/vision/mnist.jl:165
┌ Warning: MNIST.testlabels() is deprecated, use `MNIST(split=:test).targets` instead.
└ @ MLDatasets ~/.julia/packages/MLDatasets/0MkOE/src/datasets/vision/mnist.jl:180
```
Define input data. The original data is repeated `epochs` times because `Flux.train!` only loops through the data set once.

```julia
epochs = 50 # ~1 minute (i7 8th gen with 16gb RAM)
# epochs = 100 # leads to 77.8% in about 2 minutes
dataset = repeated((train_X, train_Y), epochs);
```
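Here `repeated` is presumably `Base.Iterators.repeated` (imported in the page's preamble, outside this diff), so `dataset` is a lazy iterator that yields the identical `(train_X, train_Y)` tuple `epochs` times, and `Flux.train!` performs one update per tuple. A minimal illustration:

```julia
using Base.Iterators: repeated

batches = collect(repeated((:X, :Y), 3))
length(batches)           # 3
batches[1] === batches[2] # true: the very same tuple each time
```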
## Network training

Training loss function and Flux optimizer. Before the commit, the example used Flux's implicit-parameters API:

```julia
-custom_loss(x, y) = Flux.crossentropy(m(x), y)
-opt = Flux.Adam()
-evalcb = () -> @show(custom_loss(train_X, train_Y))
```

Old output:

```
#11 (generic function with 1 method)
```

Train to optimize network parameters.

```julia
-@time Flux.train!(
-    custom_loss,
-    Flux.params(m),
-    dataset,
-    opt,
-    cb = Flux.throttle(evalcb, 5),
-);
```

Old output:

```
┌ Warning: Layer with Float32 parameters got Float64 input.
│ The input will be converted, but any earlier layers may be very slow.
│ layer = Dense(10 => 10) # 110 parameters
│ summary(x) = "10×1000 Matrix{Float64}"
└ @ Flux ~/.julia/packages/Flux/hiqg1/src/layers/stateless.jl:60
custom_loss(train_X, train_Y) = 2.355365f0
custom_loss(train_X, train_Y) = 2.2240443f0
custom_loss(train_X, train_Y) = 2.1510334f0
custom_loss(train_X, train_Y) = 2.0600805f0
custom_loss(train_X, train_Y) = 1.9604436f0
custom_loss(train_X, train_Y) = 1.8702683f0
custom_loss(train_X, train_Y) = 1.7790897f0
custom_loss(train_X, train_Y) = 1.691865f0
custom_loss(train_X, train_Y) = 1.610134f0
custom_loss(train_X, train_Y) = 1.5316879f0
106.215850 seconds (76.76 M allocations: 4.763 GiB, 1.44% gc time, 0.71% compilation time)
```
After the commit, the same section uses Flux's explicit-parameter API:

```julia
+custom_loss(m, x, y) = Flux.crossentropy(m(x), y)
+opt = Flux.setup(Flux.Adam(), m)
```
New output:

```
(layers = ((weight = Leaf(Adam(0.001, (0.9, 0.999), 1.0e-8), (Float32[0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0; … ; 0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0], Float32[0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0; … ; 0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0], (0.9, 0.999))), bias = Leaf(Adam(0.001, (0.9, 0.999), 1.0e-8), (Float32[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], Float32[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], (0.9, 0.999))), σ = ()), (), (weight = Leaf(Adam(0.001, (0.9, 0.999), 1.0e-8), (Float32[0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0; … ; 0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0], Float32[0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0; … ; 0.0 0.0 … 0.0 0.0; 0.0 0.0 … 0.0 0.0], (0.9, 0.999))), bias = Leaf(Adam(0.001, (0.9, 0.999), 1.0e-8), (Float32[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], Float32[0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], (0.9, 0.999))), σ = ()), ()),)
```

Train to optimize network parameters.

```julia
+@time Flux.train!(custom_loss, m, dataset, opt);
```

New output:

```
103.973062 seconds (72.91 M allocations: 4.475 GiB, 1.44% gc time, 0.71% compilation time)
```
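For reference, with the explicit-parameter API the `train!` call above behaves roughly like this hand-written loop (a sketch, not code from the page):

```julia
for (x, y) in dataset
    # Differentiate the loss with respect to the model itself.
    grads = Flux.gradient(m -> custom_loss(m, x, y), m)
    # Update the optimizer state and the parameters in place.
    Flux.update!(opt, m, grads[1])
end
```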
Although our custom implementation takes time, it is able to reach similar accuracy as the usual ReLU function implementation.

## Accuracy results

Average of correct guesses.

```julia
accuracy(x, y) = Statistics.mean(Flux.onecold(m(x)) .== Flux.onecold(y));
```

Training accuracy:

```julia
accuracy(train_X, train_Y)
```

```
0.562
```

Test accuracy:

```julia
accuracy(test_X, test_Y)
```

```
0.478
```

Note that the accuracy is low due to simplified training. It is possible to increase the number of samples `N`, the number of epochs `epochs`, and the connectivity `inner`.

*This page was generated using [Literate.jl](https://github.com/fredrikekre/Literate.jl).*