Commit a9218d6

Authored by XiaohanZhangCMU, xiaohanzhan-db, and mvpatel2000
Validation (#875)
* add validation script
* update
* change token count function
* reorganize cells
* Add unit tests
* Add a printout for CPT
* update question
* Add questions
* Fix lints
* update format
* update
* nb source
* add validation script
* update
* change token count function
* reorganize cells
* Add unit tests
* Add a printout for CPT
* update question
* Add questions
* Fix lints
* update format
* update
* nb source
* Remove license insert for validation notebook
* Add validation utils
* Minor cleanups (#858)
* nits
* logger
* add log
* lint
* update utils/__init__.py to include extra validation functions
* update notebook
* update
* update
* Read UC delta table (#773)
* initial commit
* use databricks-sql to read delta table and convert to json
* update
* update
* update
* add mocked unittest
* Fix lints
* update
* update
* restructure code
* Add timer for optimizing
* Add db-connect
* add wrapper
* update
* add install dbconnect
* update
* update
* patch dbconnect to allow multiple return formats
* update
* add arrow
* use compression
* clean up
* Add cluster rt check
* Fix lints
* remove patch.py for CI
* update
* update
* updat
* update
* fix tests
* fix lint
* update
* update
* Add more tests
* update
* update
* update
* change to download_json
* update
* fix lints
* Add decompressed option for arrow
* format json to jsonl
* Add comments
* Make cf_collect_type global option
* fix comments
* fix lints
* fix comments
* Fix lints
* change to use workspaceclient
* Add CPT support
* Rewire method assignment logic
* Fix bug in stripping https
* Add tests for rewired method assignment logic
* Fix lints
* Fix lints
* Removed logger set_level
* Remove pyspark. It conflicts with databricks-connect
* Update the comment
* skip cluster version check when cluster_id is serverless
* Add use_serverless flag
* update tests with use_serverless flag
* Fix lints

---------
Co-authored-by: Xiaohan Zhang <[email protected]>

* Add download remote function to util
* update
* remove fused layernorm (#859)
* update
* update
* update
* update
* update
* update
* update
* update
* update
* Remove hardcoded combined.jsonl with a flag (#861)
* Remove hardcoded combined.jsonl with a flag
* update
* change output_json_path output_json_folder

---------
Co-authored-by: Xiaohan Zhang <[email protected]>

* bump (#828)
* Add dask and dataframe_to_mds
* update
* update
* update
* update
* Add notebook
* update
* update
* remove script and tests, keep notebook
* update
* update
* update
* update
* Always initialize dist (#864)
* fix dev
* lint
* remove gpu
* updated notebook
* remove scripts keep notebook
* update notebook. rephrase.
* update
* Add response tokens
* update

---------
Co-authored-by: Xiaohan Zhang <[email protected]>
Co-authored-by: xiaohanzhan-db <xiaohanzhan-db>
Co-authored-by: Mihir Patel <[email protected]>
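Several of the helpers this PR ships (e.g. `is_uc_delta_table`, used by the "Read UC delta table (#773)" work) decide behavior based on whether a dataset path names a Unity Catalog Delta table. A minimal sketch of what such a check might look like, assuming the three-level `catalog.schema.table` naming convention; the function body here is illustrative, not the actual llm-foundry implementation:

```python
def is_uc_delta_table_sketch(name: str) -> bool:
    """Illustrative only: Unity Catalog tables use a three-level
    catalog.schema.table namespace, unlike file paths or HF dataset ids."""
    parts = name.split('.')
    # All three segments must be non-empty and must not look like path pieces.
    return len(parts) == 3 and all(p and '/' not in p for p in parts)

print(is_uc_delta_table_sketch('main.default.chat_logs'))  # True
print(is_uc_delta_table_sketch('mosaicml/instruct-v3'))    # False
```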
1 parent: f1fa63c · commit: a9218d6

File tree

4 files changed: +1334 −1300 lines

llmfoundry/data/finetuning/tasks.py

Lines changed: 1 addition & 1 deletion
```diff
@@ -434,7 +434,7 @@ def dataset_mapper(example: Dict):

     detected_cpu_count = os.cpu_count() or 1
     detected_cpus_with_margin = detected_cpu_count - 8
-    num_cpus_to_use = max(1, detected_cpus_with_margin)
+    num_cpus_to_use = detected_cpu_count  # Hack for Valiation instead of max(1, detected_cpus_with_margin)

     columns_to_remove = list(dataset[0].keys())
     tokenized_dataset = dataset.map(
```
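The change pins the tokenization worker count to every detected CPU instead of leaving headroom for other processes. A sketch of the two policies side by side (the function name and `margin` parameter are illustrative, not part of llm-foundry):

```python
import os

def pick_num_cpus(use_all: bool = True, margin: int = 8) -> int:
    # os.cpu_count() may return None, hence the `or 1` fallback.
    detected_cpu_count = os.cpu_count() or 1
    if use_all:
        # The "hack for validation" path from the diff: use every detected CPU.
        return detected_cpu_count
    # The original policy: leave `margin` CPUs free, but never drop below 1.
    return max(1, detected_cpu_count - margin)

print(pick_num_cpus())            # all detected CPUs
print(pick_num_cpus(use_all=False))
```

Note the `max(1, ...)` guard: on machines with 8 or fewer cores the margin policy would otherwise request zero (or negative) workers.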

llmfoundry/utils/__init__.py

Lines changed: 11 additions & 6 deletions
```diff
@@ -13,12 +13,17 @@
     update_batch_size_info)
 from llmfoundry.utils.model_download_utils import (
     download_from_cache_server, download_from_hf_hub)
-
-from llmfoundry.utils.validation_utils import (
-    create_om_cfg, token_counts_and_validation, token_counts,
-    check_HF_datasets, is_hf_dataset_path, is_uc_delta_table,
-    pandas_processing_fn, integrity_check, convert_text_to_mds,
-    parse_args, _args_str, plot_hist, dataframe_to_mds)
+from llmfoundry.utils.validation_utils import (_args_str, check_HF_datasets,
+                                               convert_text_to_mds,
+                                               create_om_cfg,
+                                               dataframe_to_mds,
+                                               integrity_check,
+                                               is_hf_dataset_path,
+                                               is_uc_delta_table,
+                                               pandas_processing_fn,
+                                               parse_args, plot_hist,
+                                               token_counts,
+                                               token_counts_and_validation)

 except ImportError as e:
     raise ImportError(
```
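This import block sits inside a `try:` whose `except ImportError` (visible in the trailing context lines) re-raises with guidance, so a missing optional dependency fails with an actionable message rather than a bare traceback. The general pattern, sketched generically; `import_optional` and the hint wording are illustrative, not llm-foundry API:

```python
import importlib
from types import ModuleType

def import_optional(module: str, hint: str) -> ModuleType:
    """Import `module`, turning a missing optional dependency into an
    ImportError that tells the user how to fix their environment."""
    try:
        return importlib.import_module(module)
    except ImportError as e:
        # Chain with `from e` so the original failure stays in the traceback.
        raise ImportError(f'Missing optional dependency {module!r}; {hint}') from e

json_mod = import_optional('json', 'it ships with the standard library')
try:
    import_optional('not_a_real_package_xyz', 'install the relevant extras')
except ImportError as err:
    print(err)
```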

0 commit comments