Fix docs: build tutorials with Literate and update the tutorial to the train_policy! API

BatyLeo · BatyLeo · commit 1b2b20ed3a8d · 2026-01-10T09:13:43.000+01:00
diff --git a/docs/Project.toml b/docs/Project.toml
@@ -1,4 +1,8 @@
 [deps]
 DecisionFocusedLearningAlgorithms = "46d52364-bc3b-4fac-a992-eb1d3ef2de15"
+DecisionFocusedLearningBenchmarks = "2fbe496a-299b-4c81-bab5-c44dfc55cf20"
 Documenter = "e30172f5-a6a5-5a46-863b-614d45cd2de4"
 Literate = "98b081ad-f1c9-55d3-8b20-4c87d4299306"
+Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
+MLUtils = "f1d291b0-491e-4a28-83b9-f70985020b54"
+Plots = "91a5bcdd-55d7-5caf-9e0b-520d859cae80"
diff --git a/docs/make.jl b/docs/make.jl
@@ -1,24 +1,35 @@
 using DecisionFocusedLearningAlgorithms
 using Documenter
+using Literate
 
 DocMeta.setdocmeta!(
     DecisionFocusedLearningAlgorithms,
     :DocTestSetup,
-    :(using DecisionFocusedLearningAlgorithms);
+    :(begin
+        using DecisionFocusedLearningAlgorithms
+        using DecisionFocusedLearningBenchmarks
+        using Flux
+        using MLUtils
+        using Plots
+    end),
     recursive=true,
 )
 
+# Generate markdown files from tutorial scripts
 tutorial_dir = joinpath(@__DIR__, "src", "tutorials")
+tutorial_files = filter(f -> endswith(f, ".jl"), readdir(tutorial_dir))
 
-include_tutorial = true
-
-if include_tutorial
-    for file in tutorial_files
-        filepath = joinpath(tutorial_dir, file)
-        Literate.markdown(filepath, md_dir; documenter=true, execute=false)
-    end
+# Convert .jl tutorial files to markdown
+for file in tutorial_files
+    filepath = joinpath(tutorial_dir, file)
+    Literate.markdown(filepath, tutorial_dir; documenter=true, execute=false)
 end
 
+# Get list of generated markdown files for the docs
+md_tutorial_files = [
+    "tutorials/" * replace(file, ".jl" => ".md") for file in tutorial_files
+]
+
 makedocs(;
     modules=[DecisionFocusedLearningAlgorithms],
     authors="Members of JuliaDecisionFocusedLearning and contributors",
@@ -28,7 +39,7 @@ makedocs(;
         edit_link="main",
         assets=String[],
     ),
-    pages=["Home" => "index.md", "Tutorials" => include_tutorial ? md_tutorial_files : []],
+    pages=["Home" => "index.md", "Tutorials" => md_tutorial_files],
 )
 
 deploydocs(;
diff --git a/docs/src/tutorials/tutorial.jl b/docs/src/tutorials/tutorial.jl
@@ -13,35 +13,65 @@ train_instances, validation_instances, test_instances = splitobs(
 model = generate_statistical_model(b; seed=0)
 maximizer = generate_maximizer(b)
 
-compute_gap(b, test_instances, model, maximizer)
-
-metrics_callbacks = (;
-    :time => (model, maximizer, epoch) -> (epoch_time = time()),
-    :gap => (;
-        :val =>
-            (model, maximizer, epoch) ->
-                (gap = compute_gap(b, validation_instances, model, maximizer)),
-        :test =>
-            (model, maximizer, epoch) ->
-                (gap = compute_gap(b, test_instances, model, maximizer)),
-    ),
+# Compute initial gap
+initial_gap = compute_gap(b, test_instances, model, maximizer)
+println("Initial test gap: $initial_gap")
+
+# Configure the training algorithm
+algorithm = PerturbedImitationAlgorithm(;
+    nb_samples=10, ε=0.1, threaded=true, seed=0
 )
 
+# Define metrics to track during training
+validation_loss_metric = FYLLossMetric(validation_instances, :validation_loss)
+
+# Validation gap metric
+val_gap_metric = FunctionMetric(:val_gap, validation_instances) do ctx, data
+    compute_gap(b, data, ctx.model, ctx.maximizer)
+end
+
+# Test gap metric
+test_gap_metric = FunctionMetric(:test_gap, test_instances) do ctx, data
+    compute_gap(b, data, ctx.model, ctx.maximizer)
+end
+
+# Combine metrics
+metrics = (validation_loss_metric, val_gap_metric, test_gap_metric)
+
+# Train the model
 fyl_model = deepcopy(model)
-log = fyl_train_model!(
+history = train_policy!(
+    algorithm,
     fyl_model,
     maximizer,
     train_instances,
     validation_instances;
     epochs=100,
-    metrics_callbacks,
+    metrics=metrics,
 )
 
-log[:gap]
+# Plot validation and test gaps
+val_gap_epochs, val_gap_values = get(history, :val_gap)
+test_gap_epochs, test_gap_values = get(history, :test_gap)
+
 plot(
-    [log[:gap].val, log[:gap].test];
+    [val_gap_epochs, test_gap_epochs],
+    [val_gap_values, test_gap_values];
     labels=["Val Gap" "Test Gap"],
     xlabel="Epoch",
     ylabel="Gap",
+    title="Gap Evolution During Training",
+)
+
+# Plot training and validation loss
+train_loss_epochs, train_loss_values = get(history, :training_loss)
+val_loss_epochs, val_loss_values = get(history, :validation_loss)
+
+plot(
+    [train_loss_epochs, val_loss_epochs],
+    [train_loss_values, val_loss_values];
+    labels=["Training Loss" "Validation Loss"],
+    xlabel="Epoch",
+    ylabel="Loss",
+    title="Loss Evolution During Training",
 )
-plot(log[:validation_loss])
diff --git a/docs/src/tutorials/tutorial.md b/docs/src/tutorials/tutorial.md
@@ -0,0 +1,116 @@
+```@meta
+EditURL = "tutorial.jl"
+```
+
+Tutorial
+
+````@example tutorial
+using DecisionFocusedLearningAlgorithms
+using DecisionFocusedLearningBenchmarks
+using MLUtils: splitobs
+using Plots
+
+b = ArgmaxBenchmark()
+dataset = generate_dataset(b, 100)
+train_instances, validation_instances, test_instances = splitobs(
+    dataset; at=(0.3, 0.3, 0.4)
+)
+
+model = generate_statistical_model(b; seed=0)
+maximizer = generate_maximizer(b)
+````
+
+Compute initial gap
+
+````@example tutorial
+initial_gap = compute_gap(b, test_instances, model, maximizer)
+println("Initial test gap: $initial_gap")
+````
+
+Configure the training algorithm
+
+````@example tutorial
+algorithm = PerturbedImitationAlgorithm(;
+    nb_samples=10, ε=0.1, threaded=true, seed=0
+)
+````
+
+Define metrics to track during training
+
+````@example tutorial
+validation_loss_metric = FYLLossMetric(validation_instances, :validation_loss)
+````
+
+Validation gap metric
+
+````@example tutorial
+val_gap_metric = FunctionMetric(:val_gap, validation_instances) do ctx, data
+    compute_gap(b, data, ctx.model, ctx.maximizer)
+end
+````
+
+Test gap metric
+
+````@example tutorial
+test_gap_metric = FunctionMetric(:test_gap, test_instances) do ctx, data
+    compute_gap(b, data, ctx.model, ctx.maximizer)
+end
+````
+
+Combine metrics
+
+````@example tutorial
+metrics = (validation_loss_metric, val_gap_metric, test_gap_metric)
+````
+
+Train the model
+
+````@example tutorial
+fyl_model = deepcopy(model)
+history = train_policy!(
+    algorithm,
+    fyl_model,
+    maximizer,
+    train_instances,
+    validation_instances;
+    epochs=100,
+    metrics=metrics,
+)
+````
+
+Plot validation and test gaps
+
+````@example tutorial
+val_gap_epochs, val_gap_values = get(history, :val_gap)
+test_gap_epochs, test_gap_values = get(history, :test_gap)
+
+plot(
+    [val_gap_epochs, test_gap_epochs],
+    [val_gap_values, test_gap_values];
+    labels=["Val Gap" "Test Gap"],
+    xlabel="Epoch",
+    ylabel="Gap",
+    title="Gap Evolution During Training",
+)
+````
+
+Plot training and validation loss
+
+````@example tutorial
+train_loss_epochs, train_loss_values = get(history, :training_loss)
+val_loss_epochs, val_loss_values = get(history, :validation_loss)
+
+plot(
+    [train_loss_epochs, val_loss_epochs],
+    [train_loss_values, val_loss_values];
+    labels=["Training Loss" "Validation Loss"],
+    xlabel="Epoch",
+    ylabel="Loss",
+    title="Loss Evolution During Training",
+)
+````
+
+---
+
+*This page was generated using [Literate.jl](https://github.com/fredrikekre/Literate.jl).*
+
diff --git a/src/DecisionFocusedLearningAlgorithms.jl b/src/DecisionFocusedLearningAlgorithms.jl
@@ -19,8 +19,8 @@ include("metrics/accumulators.jl")
 include("metrics/function_metric.jl")
 include("metrics/periodic.jl")
 
-include("fyl.jl")
-include("dagger.jl")
+include("algorithms/fyl.jl")
+include("algorithms/dagger.jl")
 
 export TrainingContext
 
diff --git a/src/algorithms/dagger.jl b/src/algorithms/dagger.jl
diff --git a/src/algorithms/fyl.jl b/src/algorithms/fyl.jl