diff --git a/examples/common/builders.py b/examples/common/builders.py
index 312d2e94e..7081e56b5 100644
--- a/examples/common/builders.py
+++ b/examples/common/builders.py
@@ -103,6 +103,7 @@ def _validate_cfg(icl_cfg):
         assert 'example_delimiter' in icl_cfg
         assert 'continuation_delimiter' in icl_cfg
         assert 'label' in icl_cfg
+        assert 'destination_path' in icl_cfg
 
     for icl_cfg in cfg.icl_tasks:
         _validate_cfg(icl_cfg)
@@ -124,7 +125,9 @@ def _validate_cfg(icl_cfg):
             num_fewshot=num_fewshot,
             prompt_string=icl_cfg.prompt_string,
             example_delimiter=icl_cfg.example_delimiter,
-            continuation_delimiter=icl_cfg.continuation_delimiter)
+            continuation_delimiter=icl_cfg.continuation_delimiter,
+            destination_path=icl_cfg.destination_path,
+        )
         logger_keys.extend([f'metrics/{label}/{m}' for m in metric_names])
         evaluators.append(
             Evaluator(label=label,
diff --git a/examples/llm/icl_eval/evaluate_model.py b/examples/llm/icl_eval/evaluate_model.py
index f8243e1d4..7e305b011 100644
--- a/examples/llm/icl_eval/evaluate_model.py
+++ b/examples/llm/icl_eval/evaluate_model.py
@@ -3,14 +3,16 @@
 
 import sys
 import time
+from typing import List
 
 import torch
-from composer.loggers import InMemoryLogger
+from composer.loggers import InMemoryLogger, LoggerDestination
 from composer.trainer import Trainer
+from composer.utils import reproducibility
 from omegaconf import DictConfig
 from omegaconf import OmegaConf as om
 
-from examples.common.builders import build_icl_evaluators
+from examples.common.builders import build_icl_evaluators, build_logger
 from examples.llm.src.model_registry import COMPOSER_MODEL_REGISTRY
 from examples.llm.src.tokenizer import TOKENIZER_REGISTRY
 
@@ -21,6 +23,8 @@
     cli_cfg = om.from_cli(args_list)
     cfg = DictConfig(om.merge(yaml_cfg, cli_cfg))
 
+    reproducibility.seed_all(cfg.get('seed', 1234))
+
    composer_model = COMPOSER_MODEL_REGISTRY[cfg.model.name](cfg.model)
     tokenizer = TOKENIZER_REGISTRY[cfg.tokenizer.type](**cfg.tokenizer.args)
     evaluators, logger_keys = build_icl_evaluators(cfg, tokenizer)
@@ -28,6 +32,11 @@
         composer_model.add_eval_metrics(evaluator)
 
     in_memory_logger = InMemoryLogger()  # track metrics in the in_memory_logger
+    loggers: List[LoggerDestination] = [
+        build_logger(name, logger_cfg)
+        for name, logger_cfg in (cfg.get('loggers') or {}).items()
+    ]
+    loggers.append(in_memory_logger)
 
     fsdp_config = cfg.get('fsdp_config', None)
     fsdp_config = om.to_container(
@@ -37,7 +46,7 @@
 
     trainer = Trainer(
         model=composer_model,
-        loggers=in_memory_logger,
+        loggers=loggers,
         fsdp_config=fsdp_config,  # type: ignore
         load_path=load_path,
         load_weights_only=True,
diff --git a/examples/llm/icl_eval/yamls/gpt_neo_eval.yaml b/examples/llm/icl_eval/yamls/gpt_neo_eval.yaml
index 36e2f8762..c9c91ab9e 100644
--- a/examples/llm/icl_eval/yamls/gpt_neo_eval.yaml
+++ b/examples/llm/icl_eval/yamls/gpt_neo_eval.yaml
@@ -30,6 +30,7 @@ icl_tasks:
   prompt_string: '' # this goes at the beginning of each input
   example_delimiter: '\n' # this goes between fewshot examples
   continuation_delimiter: ' ' # this separates questions from answers
+  destination_path: piqa_local.jsonl
 
 - label: lambada
   dataset_uri: # ADD YOUR OWN DATASET URI
@@ -41,4 +42,5 @@ icl_tasks:
   - InContextLearningLMAccuracy
   prompt_string: '' # this goes at the beginning of each input
   example_delimiter: '\n' # this goes between fewshot examples
-  continuation_delimiter: '' # this separates contexts from continuations
+  continuation_delimiter: ' ' # this separates contexts from continuations
+  destination_path: lambada_local.jsonl
diff --git a/examples/llm/icl_eval/yamls/mosaic_gpt_eval.yaml b/examples/llm/icl_eval/yamls/mosaic_gpt_eval.yaml
index 14eea2fbe..16733e087 100644
--- a/examples/llm/icl_eval/yamls/mosaic_gpt_eval.yaml
+++ b/examples/llm/icl_eval/yamls/mosaic_gpt_eval.yaml
@@ -39,6 +39,7 @@ icl_tasks:
   prompt_string: '' # this goes at the beginning of each input
   example_delimiter: '\n' # this goes between fewshot examples
   continuation_delimiter: ' ' # this separates questions from answers
+  destination_path: piqa_local.jsonl
 
 - label: lambada
   dataset_uri: # ADD YOUR OWN DATASET URI
@@ -50,4 +51,5 @@ icl_tasks:
   - InContextLearningLMAccuracy
   prompt_string: '' # this goes at the beginning of each input
   example_delimiter: '\n' # this goes between fewshot examples
-  continuation_delimiter: '' # this separates contexts from continuations
+  continuation_delimiter: ' ' # this separates contexts from continuations
+  destination_path: lambada_local.jsonl
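
Note on the lambada `continuation_delimiter` change from `''` to `' '`: the three delimiter fields in each `icl_tasks` entry are composed into the eval prompt roughly as sketched below. This is a hypothetical, simplified illustration only; `build_prompt` and the toy examples are not part of this repo or of composer's in-context-learning dataloader. It just shows why an empty `continuation_delimiter` would fuse a context with its continuation.

```python
# Hypothetical sketch of how prompt_string, example_delimiter, and
# continuation_delimiter typically combine into a few-shot eval prompt.
def build_prompt(prompt_string, example_delimiter, continuation_delimiter,
                 fewshot_examples, query_context):
    # Each few-shot example is "context + continuation_delimiter + continuation";
    # examples are joined by example_delimiter; the query context comes last,
    # followed by continuation_delimiter so the model predicts the continuation.
    shots = example_delimiter.join(
        ctx + continuation_delimiter + cont for ctx, cont in fewshot_examples)
    return prompt_string + shots + example_delimiter + query_context + continuation_delimiter

prompt = build_prompt(
    prompt_string='',
    example_delimiter='\n',
    continuation_delimiter=' ',  # with '' the context and continuation tokens would run together
    fewshot_examples=[('The capital of France is', 'Paris')],
    query_context='The capital of Spain is')
print(repr(prompt))
# 'The capital of France is Paris\nThe capital of Spain is '
```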