From 00a7a7367eb69221b6ff395151a392080cef32c8 Mon Sep 17 00:00:00 2001
From: Bjoern Ludwig <bjoern.ludwig@ptb.de>
Date: Fri, 30 Dec 2022 12:47:09 -0500
Subject: [PATCH] fix(dataset): remove strict hash checking to drastically
 increase performance

---
 src/zema_emc_annotated/dataset.py | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/src/zema_emc_annotated/dataset.py b/src/zema_emc_annotated/dataset.py
index af8f699..e246384 100644
--- a/src/zema_emc_annotated/dataset.py
+++ b/src/zema_emc_annotated/dataset.py
@@ -4,7 +4,6 @@ __all__ = [
     "ExtractionDataType",
     "LOCAL_ZEMA_DATASET_PATH",
     "ZeMASamples",
-    "ZEMA_DATASET_HASH",
     "ZEMA_DATASET_URL",
     "ZEMA_QUANTITIES",
 ]
@@ -27,9 +26,6 @@ from pooch import retrieve
 from zema_emc_annotated.data_types import RealMatrix, RealVector, UncertainArray
 
 LOCAL_ZEMA_DATASET_PATH = Path(dirname(__file__), "datasets")
-ZEMA_DATASET_HASH = (
-    "sha256:fb0e80de4e8928ae8b859ad9668a1b6ea6310028a6690bb8d4c1abee31cb8833"
-)
 ZEMA_DATASET_URL = "https://zenodo.org/record/5185953/files/axis11_2kHz_ZeMA_PTB_SI.h5"
 ZEMA_QUANTITIES = (
     "Acceleration",
@@ -104,7 +100,7 @@ class ZeMASamples:
     def _extract_data(self, normalize: bool) -> UncertainArray:
         dataset_full_path = retrieve(
             url=ZEMA_DATASET_URL,
-            known_hash=ZEMA_DATASET_HASH,
+            known_hash=None,
             path=LOCAL_ZEMA_DATASET_PATH,
             progressbar=True,
         )
-- 
GitLab