TrainingLoop: refactor progress printer and add CSVLogger (#668)

xihui-wu · web-flow · commit adda08e6fe79 · 2020-09-23T17:35:14.000-07:00
diff --git a/Examples/LeNet-MNIST/main.swift b/Examples/LeNet-MNIST/main.swift
@@ -31,24 +31,33 @@ let dataset = MNIST(batchSize: batchSize, on: device)
 
 // The LeNet-5 model, equivalent to `LeNet` in `ImageClassificationModels`.
 var classifier = Sequential {
-    Conv2D<Float>(filterShape: (5, 5, 1, 6), padding: .same, activation: relu)
-    AvgPool2D<Float>(poolSize: (2, 2), strides: (2, 2))
-    Conv2D<Float>(filterShape: (5, 5, 6, 16), activation: relu)
-    AvgPool2D<Float>(poolSize: (2, 2), strides: (2, 2))
-    Flatten<Float>()
-    Dense<Float>(inputSize: 400, outputSize: 120, activation: relu)
-    Dense<Float>(inputSize: 120, outputSize: 84, activation: relu)
-    Dense<Float>(inputSize: 84, outputSize: 10)
+  Conv2D<Float>(filterShape: (5, 5, 1, 6), padding: .same, activation: relu)
+  AvgPool2D<Float>(poolSize: (2, 2), strides: (2, 2))
+  Conv2D<Float>(filterShape: (5, 5, 6, 16), activation: relu)
+  AvgPool2D<Float>(poolSize: (2, 2), strides: (2, 2))
+  Flatten<Float>()
+  Dense<Float>(inputSize: 400, outputSize: 120, activation: relu)
+  Dense<Float>(inputSize: 120, outputSize: 84, activation: relu)
+  Dense<Float>(inputSize: 84, outputSize: 10)
 }
 
 var optimizer = SGD(for: classifier, learningRate: 0.1)
 
-let trainingProgress = TrainingProgress()
 var trainingLoop = TrainingLoop(
   training: dataset.training,
   validation: dataset.validation,
   optimizer: optimizer,
   lossFunction: softmaxCrossEntropy,
-  callbacks: [trainingProgress.update])
+  metrics: [.accuracy],
+  callbacks: [try! CSVLogger().log])
+
+// Compute statistics only when last batch ends.
+trainingLoop.statisticsRecorder!.shouldCompute = {
+  (
+    _ batchIndex: Int, _ batchCount: Int, _ epochIndex: Int, _ epochCount: Int,
+    _ event: TrainingLoopEvent
+  ) -> Bool in
+  return event == .batchEnd && batchIndex + 1 == batchCount
+}
 
 try! trainingLoop.fit(&classifier, epochs: epochCount, on: device)
diff --git a/Examples/MobileNetV1-Imagenette/main.swift b/Examples/MobileNetV1-Imagenette/main.swift
@@ -29,12 +29,11 @@ let dataset = Imagenette(batchSize: 64, inputSize: .resized320, outputSize: 224,
 var model = MobileNetV1(classCount: 10)
 let optimizer = SGD(for: model, learningRate: 0.02, momentum: 0.9)
 
-let trainingProgress = TrainingProgress()
 var trainingLoop = TrainingLoop(
   training: dataset.training,
   validation: dataset.validation,
   optimizer: optimizer,
   lossFunction: softmaxCrossEntropy,
-  callbacks: [trainingProgress.update])
+  metrics: [.accuracy])
 
 try! trainingLoop.fit(&model, epochs: 10, on: device)
diff --git a/Examples/MobileNetV2-Imagenette/main.swift b/Examples/MobileNetV2-Imagenette/main.swift
@@ -29,12 +29,11 @@ let dataset = Imagenette(batchSize: 64, inputSize: .resized320, outputSize: 224,
 var model = MobileNetV2(classCount: 10)
 let optimizer = SGD(for: model, learningRate: 0.002, momentum: 0.9)
 
-let trainingProgress = TrainingProgress()
 var trainingLoop = TrainingLoop(
   training: dataset.training,
   validation: dataset.validation,
   optimizer: optimizer,
   lossFunction: softmaxCrossEntropy,
-  callbacks: [trainingProgress.update])
+  metrics: [.accuracy])
 
 try! trainingLoop.fit(&model, epochs: 10, on: device)
diff --git a/Examples/ResNet-CIFAR10/main.swift b/Examples/ResNet-CIFAR10/main.swift
@@ -29,12 +29,11 @@ let dataset = CIFAR10(batchSize: 10, on: device)
 var model = ResNet(classCount: 10, depth: .resNet56, downsamplingInFirstStage: false)
 var optimizer = SGD(for: model, learningRate: 0.001)
 
-let trainingProgress = TrainingProgress()
 var trainingLoop = TrainingLoop(
   training: dataset.training,
   validation: dataset.validation,
   optimizer: optimizer,
   lossFunction: softmaxCrossEntropy,
-  callbacks: [trainingProgress.update])
+  metrics: [.accuracy])
 
 try! trainingLoop.fit(&model, epochs: 10, on: device)
diff --git a/Examples/VGG-Imagewoof/main.swift b/Examples/VGG-Imagewoof/main.swift
@@ -39,12 +39,12 @@ public func scheduleLearningRate<L: TrainingLoopProtocol>(
   }
 }
 
-let trainingProgress = TrainingProgress()
 var trainingLoop = TrainingLoop(
   training: dataset.training,
   validation: dataset.validation,
   optimizer: optimizer,
   lossFunction: softmaxCrossEntropy,
-  callbacks: [trainingProgress.update, scheduleLearningRate])
+  metrics: [.accuracy],
+  callbacks: [scheduleLearningRate])
 
 try! trainingLoop.fit(&model, epochs: 90, on: device)
diff --git a/Support/FileSystem.swift b/Support/FileSystem.swift
@@ -39,4 +39,5 @@ public protocol File {
   func read(position: Int, count: Int) throws -> Data
   func write(_ value: Data) throws
   func write(_ value: Data, position: Int) throws
+  func append(_ value: Data) throws
 }
diff --git a/Support/FoundationFileSystem.swift b/Support/FoundationFileSystem.swift
@@ -58,4 +58,14 @@ public struct FoundationFile: File {
     // TODO: Incorporate file offset.
     try value.write(to: location)
   }
+
+  /// Appends `value` to the end of the file at `location`.
+  ///
+  /// The file is opened through `FileHandle(forUpdating:)`, the handle is moved to the end of
+  /// the file, the data is written there, and the handle is closed again.
+  ///
+  /// - Parameter value: The data to be appended at the end.
+  /// - Throws: Any error raised while opening, seeking, writing to, or closing the file handle.
+  public func append(_ value: Data) throws {
+    let fileHandler = try FileHandle(forUpdating: location)
+    try fileHandler.seekToEnd()
+    try fileHandler.write(contentsOf: value)
+    try fileHandler.close()
+  }
 }
diff --git a/TrainingLoop/CMakeLists.txt b/TrainingLoop/CMakeLists.txt
@@ -1,8 +1,10 @@
 add_library(TrainingLoop
   LossFunctions.swift
+  Metrics.swift
   TrainingLoop.swift
-  TrainingProgress.swift
-  TrainingStatistics.swift)
+  Callbacks/StatisticsRecorder.swift
+  Callbacks/ProgressPrinter.swift
+  Callbacks/CSVLogger.swift)
 target_link_libraries(TrainingLoop PUBLIC
   ModelSupport)
 set_target_properties(TrainingLoop PROPERTIES
diff --git a/TrainingLoop/Callbacks/CSVLogger.swift b/TrainingLoop/Callbacks/CSVLogger.swift
@@ -0,0 +1,74 @@
+import Foundation
+import ModelSupport
+
+/// Errors thrown by `CSVLogger`.
+public enum CSVLoggerError: Error {
+  /// The path given to the logger does not have the `csv` file extension.
+  case InvalidPath
+}
+
+/// A handler for logging training and validation statistics to a CSV file.
+///
+/// The header row is derived from the names in the first statistics log that is written;
+/// every subsequent `batchEnd` event with statistics available appends one data row.
+public class CSVLogger {
+  /// The path of the file that statistics are logged to.
+  public var path: String
+
+  /// True iff the header of the CSV file has been written.
+  fileprivate var headerWritten: Bool
+
+  /// Creates an instance that logs to a file with the given path.
+  ///
+  /// The containing directory is created if it is missing, and the file is initialized with
+  /// empty contents.
+  ///
+  /// - Parameter path: The destination file; its extension must be `csv`.
+  /// - Throws: `CSVLoggerError.InvalidPath` if the extension of `path` is not `csv`, or file
+  ///   system errors.
+  public init(path: String = "run/log.csv") throws {
+    self.path = path
+
+    // Validate the path.
+    let url = URL(fileURLWithPath: path)
+    if url.pathExtension != "csv" {
+      throw CSVLoggerError.InvalidPath
+    }
+    // Create the containing directory if it is missing.
+    try FoundationFileSystem().createDirectoryIfMissing(at: url.deletingLastPathComponent().path)
+    // Initialize the file with empty string.
+    try FoundationFile(path: path).write(Data())
+
+    self.headerWritten = false
+  }
+
+  /// Logs the statistics for the `loop` when a `batchEnd` event happens, ignoring other events.
+  ///
+  /// Nothing is written if the loop has not set its epoch/batch counters or `lastStatsLog`.
+  ///
+  /// - Parameters:
+  ///   - loop: The training loop whose counters and `lastStatsLog` are read.
+  ///   - event: The event being handled.
+  /// - Throws: File system errors.
+  public func log<L: TrainingLoopProtocol>(_ loop: inout L, event: TrainingLoopEvent) throws {
+    // Only the end of a batch produces a row.
+    guard case .batchEnd = event else { return }
+
+    guard let epochIndex = loop.epochIndex, let epochCount = loop.epochCount,
+      let batchIndex = loop.batchIndex, let batchCount = loop.batchCount,
+      let stats = loop.lastStatsLog
+    else {
+      // No-Op if trainingLoop doesn't set the required values for stats logging.
+      return
+    }
+
+    // The header is written lazily because the column names come from the statistics.
+    if !headerWritten {
+      try writeHeader(stats: stats)
+      headerWritten = true
+    }
+
+    // Indices are zero-based internally; rows report them one-based as "index/count".
+    try writeDataRow(
+      epoch: "\(epochIndex + 1)/\(epochCount)",
+      batch: "\(batchIndex + 1)/\(batchCount)",
+      stats: stats)
+  }
+
+  /// Appends the header row: `epoch`, `batch`, followed by the name of each statistic.
+  ///
+  /// - Throws: File system errors.
+  func writeHeader(stats: [(name: String, value: Float)]) throws {
+    try appendRow(["epoch", "batch"] + stats.map { $0.name })
+  }
+
+  /// Appends one data row: `epoch`, `batch`, followed by the value of each statistic.
+  ///
+  /// - Throws: File system errors.
+  func writeDataRow(epoch: String, batch: String, stats: [(name: String, value: Float)]) throws {
+    try appendRow([epoch, batch] + stats.map { String($0.value) })
+  }
+
+  /// Joins `fields` with ", ", terminates the row with a newline and appends it to the file.
+  ///
+  /// - Throws: File system errors.
+  private func appendRow(_ fields: [String]) throws {
+    let row = fields.joined(separator: ", ") + "\n"
+    // `Data(row.utf8)` cannot fail, unlike the optional-returning `data(using:)`.
+    try FoundationFile(path: path).append(Data(row.utf8))
+  }
+}
diff --git a/TrainingLoop/Callbacks/ProgressPrinter.swift b/TrainingLoop/Callbacks/ProgressPrinter.swift
@@ -0,0 +1,85 @@
+// Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+import Foundation
+
+/// The number of characters drawn between the brackets of the progress bar.
+let progressBarLength = 30
+
+/// A handler for printing the training and validation progress.
+public class ProgressPrinter {
+  /// Prints training or validation progress in response to the `event`.
+  ///
+  /// An example of the progress would be:
+  /// Epoch 1/12
+  /// 468/468 [==============================] - loss: 0.4819 - accuracy: 0.8513
+  /// 79/79 [==============================] - loss: 0.1520 - accuracy: 0.9521
+  ///
+  /// - Parameters:
+  ///   - loop: The training loop whose epoch/batch counters and `lastStatsLog` are read.
+  ///   - event: The event being handled; events other than `epochStart`, `batchEnd`,
+  ///     `epochEnd` and `validationStart` are ignored.
+  public func print<L: TrainingLoopProtocol>(_ loop: inout L, event: TrainingLoopEvent) throws {
+    switch event {
+    case .epochStart:
+      guard let epochIndex = loop.epochIndex, let epochCount = loop.epochCount else {
+        // No-Op if trainingLoop doesn't set the required values for progress printing.
+        return
+      }
+
+      Swift.print("Epoch \(epochIndex + 1)/\(epochCount)")
+    case .batchEnd:
+      guard let batchIndex = loop.batchIndex, let batchCount = loop.batchCount else {
+        // No-Op if trainingLoop doesn't set the required values for progress printing.
+        return
+      }
+
+      let progressBar = formatProgressBar(
+        progress: Float(batchIndex + 1) / Float(batchCount), length: progressBarLength)
+      var stats: String = ""
+      if let lastStatsLog = loop.lastStatsLog {
+        stats = formatStats(lastStatsLog)
+      }
+
+      // The leading carriage return and the empty terminator redraw the same console line.
+      Swift.print(
+        "\r\(batchIndex + 1)/\(batchCount) \(progressBar)\(stats)",
+        terminator: ""
+      )
+      // Nothing ends the line, so flush explicitly to make the update visible.
+      fflush(stdout)
+    case .epochEnd, .validationStart:
+      // Terminate the line that the batch updates were redrawing.
+      Swift.print("")
+    default:
+      return
+    }
+  }
+
+  /// Returns a textual progress bar such as `[=====>....]`.
+  ///
+  /// The bar always has exactly `length` characters between the brackets: completed steps are
+  /// drawn as `=`, followed (while incomplete) by a `>` head and `.` padding.
+  ///
+  /// - Parameters:
+  ///   - progress: The completed fraction; values outside `0...1` are clamped and NaN is
+  ///     treated as `0`.
+  ///   - length: The number of characters between the brackets; negative values are treated
+  ///     as `0`.
+  func formatProgressBar(progress: Float, length: Int) -> String {
+    let barLength = max(length, 0)
+    // Clamp so that an out-of-range fraction can never produce a negative repeat count.
+    let fraction = progress.isNaN ? 0 : min(max(progress, 0), 1)
+    let progressSteps = Int((Float(barLength) * fraction).rounded())
+    let leading = String(repeating: "=", count: progressSteps)
+    // A full bar has neither head nor padding.
+    guard progressSteps < barLength else { return "[\(leading)]" }
+    let trailing = String(repeating: ".", count: barLength - progressSteps - 1)
+    return "[\(leading)>\(trailing)]"
+  }
+
+  /// Returns the statistics formatted as ` - name: value` pairs with four fractional digits.
+  ///
+  /// - Parameter stats: The (name, value) pairs to format, in display order.
+  func formatStats(_ stats: [(String, Float)]) -> String {
+    var result = ""
+    for stat in stats {
+      result += " - \(stat.0): \(String(format: "%.4f", stat.1))"
+    }
+    return result
+  }
+}
diff --git a/TrainingLoop/Callbacks/StatisticsRecorder.swift b/TrainingLoop/Callbacks/StatisticsRecorder.swift
diff --git a/TrainingLoop/Metrics.swift b/TrainingLoop/Metrics.swift
diff --git a/TrainingLoop/TrainingLoop.swift b/TrainingLoop/TrainingLoop.swift
diff --git a/TrainingLoop/TrainingProgress.swift b/TrainingLoop/TrainingProgress.swift
diff --git a/TrainingLoop/TrainingStatistics.swift b/TrainingLoop/TrainingStatistics.swift

Original file line number	Diff line number	Diff line change
`@@ -39,12 +39,12 @@ public func scheduleLearningRate<L: TrainingLoopProtocol>(`
`39`	`39`	`}`
`40`	`40`	`}`
`41`	`41`
`42`		`-let trainingProgress = TrainingProgress()`
`43`	`42`	`var trainingLoop = TrainingLoop(`
`44`	`43`	`training: dataset.training,`
`45`	`44`	`validation: dataset.validation,`
`46`	`45`	`optimizer: optimizer,`
`47`	`46`	`lossFunction: softmaxCrossEntropy,`
`48`		`- callbacks: [trainingProgress.update, scheduleLearningRate])`
	`47`	`+ metrics: [.accuracy],`
	`48`	`+ callbacks: [scheduleLearningRate])`
`49`	`49`
`50`	`50`	`try! trainingLoop.fit(&model, epochs: 90, on: device)`
Original file line number	Diff line number	Diff line change
`@@ -39,4 +39,5 @@ public protocol File {`
`39`	`39`	`func read(position: Int, count: Int) throws -> Data`
`40`	`40`	`func write(_ value: Data) throws`
`41`	`41`	`func write(_ value: Data, position: Int) throws`
	`42`	`+ func append(_ value: Data) throws`
`42`	`43`	`}`
-Original file line number
+Diff line change
 +import TensorFlow
++
 +/// Metrics that can be registered into TrainingLoop.
 +public enum TrainingMetrics {
 +  /// The loss metric, measured by `LossMeasurer`.
 +  case loss
 +  /// The accuracy metric, measured by `AccuracyMeasurer`.
 +  case accuracy
++
 +  /// The name of the metric; it is also passed to the measurer created by `measurer`.
 +  public var name: String {
 +    switch self {
 +    case .loss:
 +      return "loss"
 +    case .accuracy:
 +      return "accuracy"
 +    }
 +  }
++
 +  /// A newly created measurer for this metric, named after the metric.
 +  public var measurer: MetricsMeasurer {
 +    switch self {
 +    case .loss:
 +      return LossMeasurer(self.name)
 +    case .accuracy:
 +      return AccuracyMeasurer(self.name)
 +    }
 +  }
 +}
++
 +/// A protocol defining functionalities of a metrics measurer.
 +public protocol MetricsMeasurer {
 +  /// The name of the metric being measured.
 +  var name: String { get set }
 +  /// Clears the accumulated state.
 +  mutating func reset()
 +  /// Folds one set of loss, predictions and labels into the accumulated state.
 +  mutating func accumulate<Output, Target>(
 +    loss: Tensor<Float>?, predictions: Output?, labels: Target?
 +  )
 +  /// Returns the metric value computed from the accumulated state.
 +  func measure() -> Float
 +}
++
 +/// A measurer for measuring loss.
 +///
 +/// It keeps a running sum of the losses it is given and reports their mean.
 +public struct LossMeasurer: MetricsMeasurer {
 +  /// The name of the metric being measured.
 +  public var name: String
++
 +  // Sum of the scalar losses accumulated since the last reset.
 +  private var totalBatchLoss: Float = 0
 +  // Number of losses accumulated since the last reset.
 +  private var batchCount: Int32 = 0
++
 +  /// Creates a loss measurer with the given name.
 +  public init(_ name: String = "loss") {
 +    self.name = name
 +  }
++
 +  /// Clears the accumulated loss sum and count.
 +  public mutating func reset() {
 +    totalBatchLoss = 0
 +    batchCount = 0
 +  }
++
 +  /// Adds `loss` to the running sum; `predictions` and `labels` are not used.
 +  ///
 +  /// A `nil` loss leaves the accumulated state unchanged.
 +  public mutating func accumulate<Output, Target>(
 +    loss: Tensor<Float>?, predictions: Output?, labels: Target?
 +  ) {
 +    if let newBatchLoss = loss {
 +      totalBatchLoss += newBatchLoss.scalarized()
 +      batchCount += 1
 +    }
 +  }
++
 +  /// Returns the mean of the accumulated losses.
 +  ///
 +  /// If nothing has been accumulated since the last reset this is `0 / 0`, i.e. NaN.
 +  public func measure() -> Float {
 +    return totalBatchLoss / Float(batchCount)
 +  }
 +}
++
 +/// A measurer for measuring accuracy.
 +///
 +/// It counts how many predictions match their labels and reports the matching fraction.
 +public struct AccuracyMeasurer: MetricsMeasurer {
 +  /// The name of the metric being measured.
 +  public var name: String
++
 +  // Number of predictions that matched their label since the last reset.
 +  private var correctGuessCount: Int32 = 0
 +  // Number of labels seen since the last reset.
 +  private var totalGuessCount: Int32 = 0
++
 +  /// Creates an accuracy measurer with the given name.
 +  public init(_ name: String = "accuracy") {
 +    self.name = name
 +  }
++
 +  /// Clears the accumulated guess counts.
 +  public mutating func reset() {
 +    correctGuessCount = 0
 +    totalGuessCount = 0
 +  }
++
 +  /// Counts the predictions that match `labels` and adds them to the running totals.
 +  ///
 +  /// The predicted class is the argmax of `predictions` along axis 1; `loss` is not used.
 +  ///
 +  /// - Precondition: `predictions` is a `Tensor<Float>` and `labels` is a `Tensor<Int32>`;
 +  ///   any other types (or `nil`) stop the program.
 +  public mutating func accumulate<Output, Target>(
 +    loss: Tensor<Float>?, predictions: Output?, labels: Target?
 +  ) {
 +    guard let predictions = predictions as? Tensor<Float>, let labels = labels as? Tensor<Int32>
 +    else {
 +      fatalError(
 +        "For accuracy measurements, the model output must be Tensor<Float>, and the labels must be Tensor<Int32>."
 +      )
 +    }
 +    correctGuessCount += Tensor<Int32>(predictions.argmax(squeezingAxis: 1) .== labels).sum()
 +      .scalarized()
 +    totalGuessCount += Int32(labels.shape[0])
 +  }
++
 +  /// Returns the fraction of correct guesses.
 +  ///
 +  /// If nothing has been accumulated since the last reset this is `0 / 0`, i.e. NaN.
 +  public func measure() -> Float {
 +    return Float(correctGuessCount) / Float(totalGuessCount)
 +  }
 +}
-Original file line number
+Diff line change
 // Workaround https://bugs.swift.org/browse/TF-1122 that prevents us from registering a
 // loss function inside our TrainingLoop struct
 public final class LossFunctionWrapper<Output: Differentiable, Target> {
 -  public typealias F = @differentiable (Output, @noDerivative Target) -> Tensor<Float>
 +  public typealias F = @differentiable(Output, @noDerivative Target) -> Tensor<Float>
   public var f: F
   init(_ f: @escaping F) { self.f = f }
+}
   where
     Training: Sequence, Training.Element: Collection,
     Training.Element.Element == LabeledData<Opt.Model.Input, Target>
++
   /// The type of the collection of batches for the validation data.
   associatedtype Validation
   where
     Validation: Collection,
     Validation.Element == LabeledData<Opt.Model.Input, Target>
++
   /// The type of the target of our model.
   associatedtype Target
++
   /// The type of the optimizer used.
   associatedtype Opt: Optimizer where Opt.Model: Module
   // Typealiases
   /// The type of the model.
   typealias Model = Opt.Model
++
   /// The type of the input of the model.
   typealias Input = Opt.Model.Input
++
   /// The type of the output of the model.
   typealias Output = Opt.Model.Output
++
   /// The type of a batch.
   typealias Batch = LabeledData<Input, Target>
++
   // In a wrapper for now because of TF-1122.
   /// The type of the loss function.
   typealias LossFunction = LossFunctionWrapper<Output, Target>
   // Data
   /// The training epochs.
   var training: Training { get }
++
   /// The validation batches.
   var validation: Validation { get }
   // Optimizer and loss function
   /// The optimizer.
   var optimizer: Opt { get set }
++
   /// The loss function.
   var lossFunction: LossFunction { get set }
 +  /// The metrics
 +  var metrics: [TrainingMetrics] { get set }
++
   // Callbacks
   /// The callbacks used to customize the training loop.
   var callbacks: [TrainingLoopCallback<Self>] { get set }
   // Temporary data
++
 +  // MARK: - Step-level data
++
   /// The last input fed to the model.
 -  var lastInput: Input? { get set }
 +  var lastStepInput: Input? { get set }
++
   /// The last target.
 -  var lastTarget: Target? { get set }
 +  var lastStepTarget: Target? { get set }
++
   /// The last predictions of the model.
 -  var lastOutput: Output? { get set }
 +  var lastStepOutput: Output? { get set }
++
   /// The last gradients computed.
 -  var lastGradient: Model.TangentVector? { get set }
 +  var lastStepGradient: Model.TangentVector? { get set }
++
   /// The last loss.
 -  var lastLoss: Tensor<Float>? { get set }
 -  /// The number of epochs we are currently fitting for.
 -  var epochCount: Int? { get set }
 -  /// The index of the current epoch.
 -  var epochIndex: Int? { get set }
 +  var lastStepLoss: Tensor<Float>? { get set }
++
   /// The number of batches in the current collection of batches.
   var batchCount: Int? { get set }
++
   /// The index of the current batch.
   var batchIndex: Int? { get set }
++
 +  // MARK: - Epoch-level data
++
 +  /// The number of epochs we are currently fitting for.
 +  var epochCount: Int? { get set }
++
 +  /// The index of the current epoch.
 +  var epochIndex: Int? { get set }
++
 +  // MARK: - Others
++
 +  /// The log for last statistics
 +  var lastStatsLog: [(name: String, value: Float)]? { get set }
+}
 /// The events that occur during a call to `fit` in the `TrainingLoop`
 public enum TrainingLoopEvent {
   /// The start of a fit.
   case fitStart
++
   /// The end of a fit.
   case fitEnd
++
   /// The start of one epoch (training + validation).
   case epochStart
++
   /// The end of one epoch (training + validation).
   case epochEnd
++
   /// The start of a training phase.
   case trainingStart
++
   /// The end of a training phase.
   case trainingEnd
++
   /// The start of a validation phase.
   case validationStart
++
   /// The end of a validation phase.
   case validationEnd
++
   /// The start of a training or inference step on a batch.
   case batchStart
++
   /// The end of a training or inference step on a batch.
   case batchEnd
++
   /// At the start of the optimizer update, just after the differentiable step.
   case updateStart
++
   /// Just after the model prediction at inference, before computing the loss.
   case inferencePredictionEnd
+}
   // Typealiases
   /// The type of the model.
   public typealias Model = Opt.Model
++
   /// The type of the input of the model.
   public typealias Input = Opt.Model.Input
++
   /// The type of the output of the model.
   public typealias Output = Opt.Model.Output
++
   /// The type of a batch.
   public typealias Batch = LabeledData<Input, Target>
++
   // In a wrapper for now because of TF-1122.
   /// The type of the loss function.
   public typealias LossFunction = LossFunctionWrapper<Output, Target>
   // Data
   /// The training epochs.
   public let training: Training
++
   /// The validation batches.
   public let validation: Validation
   // Optimizer and loss function
   /// The optimizer.
   public var optimizer: Opt
++
   /// The loss function
   public var lossFunction: LossFunction
 -  // Callbacks
 -  /// The callbacks used to customize the training loop.
 -  public var callbacks: [TrainingLoopCallback<Self>] = []
 +  /// The metrics
 +  public var metrics: [TrainingMetrics]
++
 +  // MARK: - Callbacks
++
 +  /// The callbacks used to customize the training loop.
++
 +  public var callbacks: [TrainingLoopCallback<Self>]
++
 +  // MARK: - Default callback objects
++
 +  public var statisticsRecorder: StatisticsRecorder? = nil
++
 +  public var progressPrinter: ProgressPrinter? = nil
++
 +  /// Temporary data
++
 +  // MARK: - Step-level data
 -  // Temporary data
   /// The last input fed to the model.
 -  public var lastInput: Input? = nil
 +  public var lastStepInput: Input? = nil
++
   /// The last target.
 -  public var lastTarget: Target? = nil
 +  public var lastStepTarget: Target? = nil
++
   /// The last predictions of the model.
 -  public var lastOutput: Output? = nil
 +  public var lastStepOutput: Output? = nil
++
   /// The last gradients computed.
 -  public var lastGradient: Model.TangentVector? = nil
 +  public var lastStepGradient: Model.TangentVector? = nil
++
   /// The last loss.
 -  public var lastLoss: Tensor<Float>? = nil
 -  /// The number of epochs we are currently fitting for.
 -  public var epochCount: Int? = nil
 -  /// The index of the current epoch.
 -  public var epochIndex: Int? = nil
 +  public var lastStepLoss: Tensor<Float>? = nil
++
   /// The number of batches in the current collection of batches.
   public var batchCount: Int? = nil
++
   /// The index of the current batch.
   public var batchIndex: Int? = nil
 +  // MARK: - Epoch-level data
++
 +  /// The number of epochs we are currently fitting for.
 +  public var epochCount: Int? = nil
++
 +  /// The index of the current epoch.
 +  public var epochIndex: Int? = nil
++
 +  // MARK: - Others
++
 +  /// The log for last statistics
 +  public var lastStatsLog: [(name: String, value: Float)]? = nil
++
   /// Creates an instance from `training` and `validation` data, a `model`, an `optimizer` and a
   /// `lossFunction`.
   ///
   /// Parameter callbacks: Callbacks that the `TrainingLoop` will use in every call to fit.
   public init(
     training: Training, validation: Validation, optimizer: Opt,
 -    lossFunction: @escaping LossFunction.F, callbacks: [TrainingLoopCallback<Self>] = []
 +    lossFunction: @escaping LossFunction.F,
 +    metrics: [TrainingMetrics] = [],
 +    callbacks: [TrainingLoopCallback<Self>] = [],
 +    includeDefaultCallbacks: Bool = true
   ) {
     self.training = training
     self.validation = validation
     self.optimizer = optimizer
     self.lossFunction = LossFunction(lossFunction)
 -    self.callbacks = callbacks
 +    self.metrics = metrics
++
 +    if includeDefaultCallbacks {
 +      let statisticsRecorder = StatisticsRecorder(metrics: [.loss] + metrics)
 +      let progressPrinter = ProgressPrinter()
 +      self.statisticsRecorder = statisticsRecorder
 +      self.progressPrinter = progressPrinter
 +      self.callbacks = [
 +        statisticsRecorder.record,
 +        progressPrinter.print,
 +      ] + callbacks
 +    } else {
 +      self.callbacks = callbacks
 +    }
+  }
+}
 extension TrainingLoop {
   /// The default differentiable step.
   public mutating func differentiableStep(model: Model) throws {
 -    guard let data = lastInput else { return }
 -    guard let target = lastTarget else { return }
 -    (lastLoss, lastGradient) = valueWithGradient(at: model) { (model: Model) -> Tensor<Float> in
 +    guard let data = lastStepInput else { return }
 +    guard let target = lastStepTarget else { return }
 +    (lastStepLoss, lastStepGradient) = valueWithGradient(at: model) {
 +      (model: Model) -> Tensor<Float> in
       let predictions = model(data)
 -      lastOutput = predictions
 +      lastStepOutput = predictions
       return lossFunction.f(predictions, target)
+    }
+  }
   /// The step used for inference.
   public mutating func inferenceStep(model: Model) throws {
 -    guard let data = lastInput else { return }
 -    lastOutput = model(data)
 -    guard let target = lastTarget else { return }
 +    guard let data = lastStepInput else { return }
 +    lastStepOutput = model(data)
 +    guard let target = lastStepTarget else { return }
     try handleEvent(.inferencePredictionEnd)
 -    lastLoss = lossFunction.f(lastOutput!, target)
 +    lastStepLoss = lossFunction.f(lastStepOutput!, target)
+  }
   /// The step used for training.
   ) throws {
     try differentiableStep(model, &self)
     try handleEvent(.updateStart)
 -    optimizer.update(&model, along: lastGradient!)
 +    optimizer.update(&model, along: lastStepGradient!)
+  }
+}
 public enum TrainingLoopAction: Error {
   /// Aborts actions in the current training/inference step and goes to the next batch.
   case cancelBatch
++
   /// Aborts actions in the current training phase and goes to the validation phase.
   case cancelTraining
++
   /// Aborts actions in the current validation phase and goes to the next epoch.
   case cancelValidation
++
   /// Aborts actions in the current epoch and goes to the next epoch.
   case cancelEpoch
++
   /// Aborts actions in the current fit and ends fitting.
   case cancelFit
+}
     batchCount = batches.count
     for (i, batch) in batches.enumerated() {
       batchIndex = i
 -      (lastInput, lastTarget) = (batch.data, batch.label)
 +      (lastStepInput, lastStepTarget) = (batch.data, batch.label)
       do {
         try handleEvent(.batchStart)
         try step(&self)
   public mutating func fit(
     _ model: inout Model, epochs: Int, callbacks: [TrainingLoopCallback<Self>] = [],
     on device: Device = Device.default,
 -    differentiableStep: (Model, inout Self) throws -> Void = { try $1.differentiableStep(model: $0) }
 +    differentiableStep: (Model, inout Self) throws -> Void = {
 +      try $1.differentiableStep(model: $0)
 +    }
   ) throws {
     let callbacksCount = self.callbacks.count
     self.callbacks += callbacks