sodascience · qubixes · Jul 7, 2023 · Jul 4, 2023 · Jul 7, 2023 · vankesteren
diff --git a/metasynth/dataset.py b/metasynth/dataset.py
@@ -117,6 +117,9 @@ def from_dataframe(cls,
         else:
             spec = deepcopy(spec)
 
+        if set(list(spec)) - set(df.columns):
+            raise ValueError("Specifications found for column that were not found in the "
+                             f"dataset itself: {set(list(spec)) - set(df.columns)}")
         all_vars = []
         for col_name in df.columns:
             series = df[col_name]

diff --git a/tests/test_dataset.py b/tests/test_dataset.py
@@ -92,6 +92,10 @@ def check_dataset(dataset):
         print(name, dataset.descriptions[name])
         assert dataset.descriptions[name] == name
 
+    # A spec for a column that is not in the dataframe must raise a ValueError
+    with pytest.raises(ValueError):
+        dataset = MetaDataset.from_dataframe(df, spec={"unicorn": {"prop_missing": 0.5}})
+
 
 def test_distributions(tmp_path):
     tmp_fp = tmp_path / "tmp.json"