From 7e23418d84d4513f2df75e0232525dddd9edf475 Mon Sep 17 00:00:00 2001
From: Adam Pocock
Date: Thu, 15 Sep 2022 14:44:24 -0400
Subject: [PATCH 1/8] Updating the docs to reference protobuf serialization.

---
 docs/Architecture.md    | 27 ++++++++++++++++++++++++++-
 docs/Internals.md       | 25 ++++++++++++++++++++++++-
 docs/PackageOverview.md | 33 ++++++++++++++++++++++-----------
 docs/Roadmap.md         | 15 +++++++++------
 docs/Security.md        |  4 ++++
 5 files changed, 85 insertions(+), 19 deletions(-)

diff --git a/docs/Architecture.md b/docs/Architecture.md
index 3bee56c57..fc9c7fce5 100644
--- a/docs/Architecture.md
+++ b/docs/Architecture.md
@@ -422,11 +422,36 @@ transparently hashes the inputs. The feature names tend to be particularly
 sensitive when working with NLP problems. For example, without such hashing,
 bigrams would appear in the feature domains.
 
+## Serialization
+
+Tribuo supports Java serialization (i.e., using `java.io.Serializable`) and from
+v4.3 it supports serializing objects to protobufs. Java serialization support is
+deprecated and will be removed in the next major version. When using Java
+serialization we recommend the use of a serialization filter; more information
+is given in our [Security documentation](Security.md).
+Classes which support protobuf serialization now implement
+`ProtoSerializable<T>`, where the type bound gives the type of the protobuf they
+serialize to. Tribuo's protobuf serialization supports all the types that Java
+serialization supports, with the exception of `Example` metadata values, which
+previously supported any `java.io.Serializable` type and now only support
+`String` values. Helper methods to deserialize objects from protobufs have been
+added to all the major interfaces, of the form `.deserialize(Proto)`.
+The protobuf definitions are packaged into Tribuo's jars, and the protobuf
+classes are compiled using protoc `v3.19.4`.
+Tribuo's protobuf support includes versioning
+of the protobufs to allow incremental modifications to the protobuf schemas as
+the types evolve. This flexibility should allow protobuf to remain the preferred
+serialization format for Tribuo without restricting the evolution of Tribuo's
+classes and interfaces.
+
+As Java's generics are erased at runtime, the objects returned from this
+serialization mechanism internally validate that the types are consistent, but
+users must validate that the `Model` is of the expected type using
+`Model.validate(Class<? extends Output<?>>)` or similar.
+
 ## ONNX Export
 
 From v4.2 Tribuo supports exporting some models in the [ONNX](https://onnx.ai)
 model format. The ONNX format is a cross-platform model exchange format which
-can be loaded in by many different machine learning libraries. Tribuo supports
+can be loaded in by many machine learning libraries. Tribuo supports
 inference on ONNX models via ONNX Runtime. Models which can be exported
 implement the `ONNXExportable` interface, which provides methods for
 constructing the ONNX protobuf and serializing it to disk. As of the release of
diff --git a/docs/Internals.md b/docs/Internals.md
index c5c189ce7..20f5fea2b 100644
--- a/docs/Internals.md
+++ b/docs/Internals.md
@@ -102,7 +102,7 @@ this `Feature` was observed.
 
 At this point the `Dataset` can be transformed, by a `TransformationMap`. This
 applies an independent sequence of transformation to each `Feature`, so it can
-perform rescaling or binning, but not Principle Component Analysis (PCA). The
+perform rescaling or binning, but not Principal Component Analysis (PCA). The
 `TransformationMap` gathers the necessary statistics about the features, and
 then rewrites each `Example` according to the transformation, generating a
 `TransformerMap` which can be used to apply that specific transformations to
@@ -166,3 +166,26 @@ classification, RMSE for regression etc).
Finally, the input data's `DataProvenance` and the `Model`'s `ModelProvenance` are queried, and the evaluation statistics, provenances and predictions are passed to the appropriate `Evaluation`'s constructor for storage. + +## Protobuf Serialization + +Tribuo's protobuf serialization is based around redirection and the `Any` packed +protobuf to simulate polymorphic behaviour. Each type is packaged into a top +level protobuf representing the interface it implements which has an integer +version field incrementing from 0, the class name of the class which can +deserialize this object, and a packed `Any` message which contains class specific serialization information. This protobuf is +unpacked using the deserialization mechanism in `org.tribuo.protos.ProtoUtil` and +then the method `deserializeFromProto(int version, String className, Any message)` +is called on the `className` specified in the proto. The class name is passed through +to allow redirection for Tribuo internal classes which may want to deserialize as a +different type as we evolve the library. That method then typically checks that the +version is supported by the current class, to prevent inaccurate deserialization of +protobufs written by newer versions of Tribuo when loaded into older versions, and +then the `Any` message is unpacked into a class specific protobuf, any necessary +validation is performed, the deserialized object is constructed and then returned. + +There are two helper classes, `ModelDataCarrier` and `DatasetDataCarrier` which +allow easy serialization/deserialization of shared fields in `Model` and +`Dataset` respectively (and the sequence variants thereof). These are considered +an implementation detail as they may change to incorporate new fields, and may +be converted into records when Tribuo moves to a newer version of Java. 
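The dispatch flow described above (an integer version field, the name of the deserializing class, and a packed payload handed to a reflectively invoked factory which checks the version) can be sketched in plain Java without a protobuf dependency. Everything below (`Envelope`, `Dispatcher`, `deserializeFromEnvelope`) is a hypothetical stand-in used for illustration, not Tribuo's actual `ProtoUtil` code:

```java
import java.lang.reflect.Method;
import java.nio.charset.StandardCharsets;

// Hypothetical stand-in for Tribuo's top-level protos: a version number, the
// name of the class which can deserialize the payload, and the class-specific
// payload itself (an Any message in the real mechanism).
record Envelope(int version, String className, byte[] payload) {}

// Dispatcher in the style of ProtoUtil: resolve the class named in the
// envelope and reflectively invoke its static factory method.
final class Dispatcher {
    static Object deserialize(Envelope e) throws Exception {
        Class<?> clazz = Class.forName(e.className());
        Method factory = clazz.getDeclaredMethod("deserializeFromEnvelope",
                int.class, String.class, byte[].class);
        return factory.invoke(null, e.version(), e.className(), e.payload());
    }
}

final class Greeting {
    static final int CURRENT_VERSION = 0;
    final String text;
    Greeting(String text) { this.text = text; }

    Envelope serialize() {
        return new Envelope(CURRENT_VERSION, Greeting.class.getName(),
                text.getBytes(StandardCharsets.UTF_8));
    }

    // The factory checks the version so payloads written by a newer
    // implementation fail loudly instead of being silently misread.
    static Greeting deserializeFromEnvelope(int version, String className, byte[] payload) {
        if (version > CURRENT_VERSION) {
            throw new IllegalArgumentException("Unsupported version " + version);
        }
        return new Greeting(new String(payload, StandardCharsets.UTF_8));
    }
}
```

A production mechanism would additionally restrict which classes the dispatcher may resolve; this sketch omits that check.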
diff --git a/docs/PackageOverview.md b/docs/PackageOverview.md index b51e76647..c2916f87f 100644 --- a/docs/PackageOverview.md +++ b/docs/PackageOverview.md @@ -98,17 +98,18 @@ suitable for use with models like BERT. Multi-class classification is the act of assigning a single label from a set of labels to a test example. The classification module has several submodules: -| Folder | ArtifactID | Package root | Description | -| --- | --- | --- | --- | -| Core | `tribuo-classification-core` | `org.tribuo.classification` | Contains an Output subclass for use with multi-class classification tasks, evaluation code for checking model performance, and an implementation of Adaboost.SAMME. It also contains simple baseline classifiers. | -| DecisionTree | `tribuo-classification-tree` | `org.tribuo.classification.dtree` | An implementation of CART decision trees. | -| Experiments | `tribuo-classification-experiments` | `org.tribuo.classification.experiments` | A set of main functions for training & testing models on any supported dataset. This submodule depends on all the classifiers and allows easy comparison between them. It should not be imported into other projects since it is intended purely for development and testing. | -| Explanations | `tribuo-classification-experiments` | `org.tribuo.classification.explanations` | An implementation of LIME for classification tasks. If you use the columnar data loader, LIME can extract more information about the feature domain and provide better explanations. | -| LibLinear | `tribuo-classification-liblinear` | `org.tribuo.classification.liblinear` | A wrapper around the LibLinear-java library. This provides linear-SVMs and other l1 or l2 regularised linear classifiers. | -| LibSVM | `tribuo-classification-libsvm` | `org.tribuo.classification.libsvm` | A wrapper around the Java version of LibSVM. This provides linear & kernel SVMs with sigmoid, gaussian and polynomial kernels. 
| -| Multinomial Naive Bayes | `tribuo-classification-mnnaivebayes` | `org.tribuo.classification.mnb` | An implementation of a multinomial naive bayes classifier. Since it aims to store a compact in-memory representation of the model, it only keeps track of weights for observed feature/class pairs. | -| SGD | `tribuo-classification-sgd` | `org.tribuo.classification.sgd` | An implementation of stochastic gradient descent based classifiers. It includes a linear package for logistic regression and linear-SVM (using log and hinge losses, respectively), a kernel package for training a kernel-SVM using the Pegasos algorithm, a crf package for training a linear-chain CRF, and a fm package for training pairwise factorization machines. These implementations depend upon the stochastic gradient optimisers in the main Math package. The linear, fm, and crf packages can use any of the provided gradient optimisers, which enforce various different kinds of regularisation or convergence metrics. This is the preferred package for linear classification and for sequence classification due to the speed and scalability of the SGD approach. | -| XGBoost | `tribuo-classification-xgboost` | `org.tribuo.classification.xgboost` | A wrapper around the XGBoost Java API. XGBoost requires a C library accessed via JNI. XGBoost is a scalable implementation of gradient boosted trees. 
| +| Folder | ArtifactID | Package root | Description | +|-------------------------| --- | --- |------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------| +| Core | `tribuo-classification-core` | `org.tribuo.classification` | Contains an Output subclass for use with multi-class classification tasks, evaluation code for checking model performance, and an implementation of Adaboost.SAMME. It also contains simple baseline classifiers. | +| DecisionTree | `tribuo-classification-tree` | `org.tribuo.classification.dtree` | An implementation of CART decision trees. | +| Experiments | `tribuo-classification-experiments` | `org.tribuo.classification.experiments` | A set of main functions for training & testing models on any supported dataset. This submodule depends on all the classifiers and allows easy comparison between them. It should not be imported into other projects since it is intended purely for development and testing. | +| Explanations | `tribuo-classification-experiments` | `org.tribuo.classification.explanations` | An implementation of LIME for classification tasks. If you use the columnar data loader, LIME can extract more information about the feature domain and provide better explanations. 
| +| FeatureSelection | `tribuo-classification-fs` | `org.tribuo.classification.fs` | An implementation of several information theoretic feature selection algorithms for classification problems. | +| LibLinear | `tribuo-classification-liblinear` | `org.tribuo.classification.liblinear` | A wrapper around the LibLinear-java library. This provides linear-SVMs and other l1 or l2 regularised linear classifiers. | +| LibSVM | `tribuo-classification-libsvm` | `org.tribuo.classification.libsvm` | A wrapper around the Java version of LibSVM. This provides linear & kernel SVMs with sigmoid, gaussian and polynomial kernels. | +| Multinomial Naive Bayes | `tribuo-classification-mnnaivebayes` | `org.tribuo.classification.mnb` | An implementation of a multinomial naive bayes classifier. Since it aims to store a compact in-memory representation of the model, it only keeps track of weights for observed feature/class pairs. | +| SGD | `tribuo-classification-sgd` | `org.tribuo.classification.sgd` | An implementation of stochastic gradient descent based classifiers. It includes a linear package for logistic regression and linear-SVM (using log and hinge losses, respectively), a kernel package for training a kernel-SVM using the Pegasos algorithm, a crf package for training a linear-chain CRF, and a fm package for training pairwise factorization machines. These implementations depend upon the stochastic gradient optimisers in the main Math package. The linear, fm, and crf packages can use any of the provided gradient optimisers, which enforce various different kinds of regularisation or convergence metrics. This is the preferred package for linear classification and for sequence classification due to the speed and scalability of the SGD approach. | +| XGBoost | `tribuo-classification-xgboost` | `org.tribuo.classification.xgboost` | A wrapper around the XGBoost Java API. XGBoost requires a C library accessed via JNI. XGBoost is a scalable implementation of gradient boosted trees. 
|

## Multi-label Classification
@@ -220,3 +221,13 @@ TensorFlow not just for Tribuo but for the Java community as a whole.
 Tribuo demonstrates the TensorFlow interop by including an example config
 file, several example model generation functions and protobuf for an MNIST
 model graph.
+
+## Other modules
+
+Tribuo has a number of other modules:
+
+| Folder | ArtifactID | Package root | Description |
+|---------| --- | --- | --- |
+| Json | `tribuo-json` | `org.tribuo.json` | Contains support for reading and writing Json formatted data, along with a program for inspecting and removing provenance information from models. |
+| ModelCard | `tribuo-interop-modelcard` | `org.tribuo.interop.modelcard` | Contains support for reading and writing model cards in Json format, using the provenance information in Tribuo models to guide the card construction. |
+| Reproducibility | `tribuo-reproducibility` | `org.tribuo.reproducibility` | A utility for reproducing Tribuo models and datasets. |
diff --git a/docs/Roadmap.md b/docs/Roadmap.md
index 73dd4790a..c76591be9 100644
--- a/docs/Roadmap.md
+++ b/docs/Roadmap.md
@@ -37,14 +37,16 @@ specific operations (though this can be achieved today using `DatasetView` and p
 categorical and real valued features, and promotes the former to the latter
 when there are too many categories. This could be tied into the `RowProcessor`
 to give the user control over the feature types, which could filter down into
 algorithmic choices elsewhere in the package.
-- Serialization. We'd like to have alternate serialization mechanisms for models and datasets until
-Java's serialization mechanisms improve.
+- ~~Serialization. We'd like to have alternate serialization mechanisms for models and datasets until
+Java's serialization mechanisms improve.~~
+  - In 4.3 we added protobuf serialization to Tribuo and deprecated Java serialization.
 - Caching datasource.
Datasources may currently perform expensive feature extraction steps (I'm looking at you `RowProcessor`), and it would be useful to be able to cache the output of that locally, while maintaining the link to the original data. We don't have a firm design for this feature yet, but we're in need of it for some internal work. -- KMeans & Nearest Neighbour share very little code, but are conceptually very similar. We'd like -to refactor out the shared code (while maintaining serialization compatibility). +- ~~KMeans & Nearest Neighbour share very little code, but are conceptually very similar. We'd like +to refactor out the shared code (while maintaining serialization compatibility).~~ + - In 4.3 we added a distance querying interface and refactored KMeans, KNN and HDBSCAN to use it. - Allow `DatasetView` to regenerate its feature and output domains. Currently all views of a dataset share the same immutable feature domain, but in some cases this can leak information from test time to train (e.g., when using the unselected data as an out of bag sample). @@ -61,8 +63,9 @@ specify a minimum purity decrease requirement.~~ - Integrated in Tribuo 4.1. - Gaussian Processes. - Vowpal Wabbit interface. -- Feature selection. We already have several feature selection algorithms implemented -in a Tribuo compatible interface, but the codebase isn't quite ready for release. +- ~~Feature selection. We already have several feature selection algorithms implemented +in a Tribuo compatible interface, but the codebase isn't quite ready for release.~~ + - Feature selection for classification problems is integrated in Tribuo 4.3. - Support word embedding features. - ~~Support contextualised word embeddings (through the ONNX or TensorFlow interfaces).~~ - ONNX support for BERT embeddings is integrated in Tribuo 4.1. 
diff --git a/docs/Security.md b/docs/Security.md
index 8a7b0f641..309b236cd 100644
--- a/docs/Security.md
+++ b/docs/Security.md
@@ -24,6 +24,10 @@ Additionally, when running with a security manager, Tribuo will need access to
 the relevant filesystem locations to load or save model files. See the section
 on [Configuration](#Configuration) for more details.
 
+In Tribuo 4.3 we introduced protobuf-based serialization for all supported Java
+serializable types. This is the preferred serialization mechanism, and Java
+serialization support will be removed in the next major release of Tribuo.
+
 ## Database access
 
 Tribuo provides a SQL interface that can load data via a JDBC connection. As
 it's frequently necessary to load data via a joined query from an unknown

From 15e538fd16dca4a3a9d44a288be1aee81335e3c1 Mon Sep 17 00:00:00 2001
From: Adam Pocock
Date: Thu, 15 Sep 2022 14:45:33 -0400
Subject: [PATCH 2/8] Adding serde helpers to Model, Dataset, SequenceModel and
 SequenceDataset. Updating main methods to support protobuf.
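The serialization filter recommended for the legacy Java serialization path can be installed per stream using the JDK's `ObjectInputFilter` (Java 9+). This is a generic JDK sketch using an allow-list pattern; it involves no Tribuo classes, and the pattern shown is only an example:

```java
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.ObjectInputFilter;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
import java.util.ArrayList;
import java.util.List;

public class FilterDemo {
    // Round-trips a value through Java serialization, applying a JEP 290
    // filter pattern on the deserializing stream.
    static Object roundTrip(Object value, String pattern) throws Exception {
        ByteArrayOutputStream bos = new ByteArrayOutputStream();
        try (ObjectOutputStream oos = new ObjectOutputStream(bos)) {
            oos.writeObject(value);
        }
        try (ObjectInputStream ois = new ObjectInputStream(
                new ByteArrayInputStream(bos.toByteArray()))) {
            ois.setObjectInputFilter(ObjectInputFilter.Config.createFilter(pattern));
            return ois.readObject();
        }
    }

    public static void main(String[] args) throws Exception {
        // Allow-list: permit java.util and java.lang classes, reject all else.
        Object o = roundTrip(new ArrayList<>(List.of("a", "b")),
                "java.util.*;java.lang.*;!*");
        System.out.println(o); // prints [a, b]
    }
}
```

Classes outside the allow-list cause `readObject` to fail with an `InvalidClassException`, which is the behaviour wanted when loading models from untrusted sources.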
---
 .../classification/sequence/SeqTrainTest.java | 42 +++++---
 .../classification/experiments/RunAll.java    | 16 ++-
 .../classification/experiments/Test.java      | 34 ++++--
 .../explanations/lime/LIMETextCLI.java        | 52 +++++----
 .../classification/sgd/crf/SeqTest.java       | 50 ++++++---
 Core/src/main/java/org/tribuo/Dataset.java    | 53 +++++++++
 Core/src/main/java/org/tribuo/Model.java      | 55 ++++++++++
 .../main/java/org/tribuo/ModelExplorer.java   | 47 +++++---
 .../org/tribuo/sequence/SequenceDataset.java  | 101 ++++++++++++++++++
 .../org/tribuo/sequence/SequenceModel.java    | 65 +++++++++++
 .../sequence/SequenceModelExplorer.java       | 49 ++++++---
 .../java/org/tribuo/data/DataOptions.java     | 52 ++++++++-
 .../java/org/tribuo/data/DatasetExplorer.java | 48 ++++++---
 .../tribuo/data/PreprocessAndSerialize.java   | 29 +++--
 .../org/tribuo/interop/oci/OCIModelCLI.java   | 28 ++++-
 .../tribuo/interop/tensorflow/TrainTest.java  | 17 ++-
 16 files changed, 609 insertions(+), 129 deletions(-)

diff --git a/Classification/Core/src/main/java/org/tribuo/classification/sequence/SeqTrainTest.java b/Classification/Core/src/main/java/org/tribuo/classification/sequence/SeqTrainTest.java
index d3bd0ce89..8b9797299 100644
--- a/Classification/Core/src/main/java/org/tribuo/classification/sequence/SeqTrainTest.java
+++ b/Classification/Core/src/main/java/org/tribuo/classification/sequence/SeqTrainTest.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2015-2020, Oracle and/or its affiliates. All rights reserved.
+ * Copyright (c) 2015, 2022, Oracle and/or its affiliates. All rights reserved.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
@@ -29,11 +29,10 @@ import org.tribuo.util.Util;
 
 import java.io.BufferedInputStream;
-import java.io.FileInputStream;
-import java.io.FileOutputStream;
 import java.io.IOException;
 import java.io.ObjectInputStream;
 import java.io.ObjectOutputStream;
+import java.nio.file.Files;
 import java.nio.file.Path;
 import java.util.logging.Logger;
@@ -78,6 +77,9 @@ public String getOptionsDescription() {
     */
    @Option(charName = 't', longName = "trainer-name", usage = "Name of the trainer in the configuration file.")
    public SequenceTrainer