Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Fix outdated verification_mode values #5607

Merged
22 changes: 12 additions & 10 deletions src/datasets/builder.py
Original file line number Diff line number Diff line change
Expand Up @@ -357,10 +357,11 @@ def __init__(
os.makedirs(self._cache_dir_root, exist_ok=True)
lock_path = os.path.join(self._cache_dir_root, self._cache_dir.replace(os.sep, "_") + ".lock")
with FileLock(lock_path):
if os.path.exists(self._cache_dir): # check if data exist
if len(os.listdir(self._cache_dir)) > 0:
logger.info("Overwrite dataset info from restored data version.")
self.info = DatasetInfo.from_directory(self._cache_dir)
if os.path.exists(self._cache_dir) > 0: # check if data exist
if len(os.listdir(self._cache_dir)):
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
if os.path.exists(self._cache_dir) > 0: # check if data exist
if len(os.listdir(self._cache_dir)):
if os.path.exists(self._cache_dir): # check if data exist
if len(os.listdir(self._cache_dir)) > 0:

logger.info("Overwrite dataset info from restored data version if exists.")
if os.path.exists(path_join(self._cache_dir, config.DATASET_INFO_FILENAME)):
self.info = DatasetInfo.from_directory(self._cache_dir)
else: # dir exists but no data, remove the empty dir as data aren't available anymore
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think we should remove the directory only if it's completely empty - but with your change it would remove it if the dataset info file is not there. This is in case some data files are still left somehow

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

thanks for noticing, fixed it, can I merge?

logger.warning(
f"Old caching folder {self._cache_dir} for dataset {self.name} exists but no data were found. Removing it. "
Expand All @@ -374,7 +375,7 @@ def __init__(
# Set download manager
self.dl_manager = None

# Record infos even if verification_mode="none"; used by "datasets-cli test" to generate file checksums for (deprecated) dataset_infos.json
# Set to True by "datasets-cli test" to generate file checksums for (deprecated) dataset_infos.json independently of verification_mode value
self._record_infos = False

# Enable streaming (e.g. it patches "open" to work with remote files)
Expand Down Expand Up @@ -718,10 +719,10 @@ def download_and_prepare(
```
"""
if ignore_verifications != "deprecated":
verification_mode = "none" if ignore_verifications else "full"
verification_mode = VerificationMode.NO_CHECKS if ignore_verifications else VerificationMode.ALL_CHECKS
warnings.warn(
"'ignore_verifications' was deprecated in favor of 'verification_mode' in version 2.9.1 and will be removed in 3.0.0.\n"
f"You can remove this warning by passing 'verification_mode={verification_mode}' instead.",
f"You can remove this warning by passing 'verification_mode={verification_mode.value}' instead.",
FutureWarning,
)
if use_auth_token != "deprecated":
Expand Down Expand Up @@ -880,7 +881,8 @@ def incomplete_dir(dirname):
self.info.download_checksums = dl_manager.get_recorded_sizes_checksums()
self.info.size_in_bytes = self.info.dataset_size + self.info.download_size
# Save info
self._save_info()
if verification_mode is not VerificationMode.NO_CHECKS:
self._save_info()
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

We should always save the info. For example it stores the feature types and the arrow shards lengths.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

hm true...
what should we do then? I don't think it's fine that we get different results running the same command, like:

load_dataset("ds_name")  # error - failed verifications
# then
load_dataset("ds_name", verification_mode="no_checks")  # successfully loaded
# then
load_dataset("ds_name")  # successfully loaded despite it was an error before

am I missing something?

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I don't think we can do anything tbh - e.g. reloading a cached dataset works even if you don't have the downloaded raw files anymore so we can't check for their checksums

Copy link
Contributor Author

@polinaeterna polinaeterna Mar 8, 2023

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

okay reverted it.

But I also changed incorrect values of verification_mode in two places, from "none" -> "no_checks", "all" -> "all_checks" (they weren't updated in the previous verification PR #5303), do you agree with this change?


# Download post processing resources
self.download_post_processing_resources(dl_manager)
Expand Down Expand Up @@ -1078,10 +1080,10 @@ def as_dataset(
```
"""
if ignore_verifications != "deprecated":
verification_mode = "none" if ignore_verifications else "full"
verification_mode = VerificationMode.NO_CHECKS if ignore_verifications else VerificationMode.ALL_CHECKS
warnings.warn(
"'ignore_verifications' was deprecated in favor of 'verification' in version 2.9.1 and will be removed in 3.0.0.\n"
f"You can remove this warning by passing 'verification_mode={verification_mode}' instead.",
f"You can remove this warning by passing 'verification_mode={verification_mode.value}' instead.",
FutureWarning,
)
is_local = not is_remote_filesystem(self._fs)
Expand Down