encode path only for old versions of hfh

huggingface · Nov 14, 2022 · 67a6122 · 67a6122 · github-actions · Nov 14, 2022
1 parent 1b81805
commit 67a6122
Showing 1 changed file with 5 additions and 1 deletion.
diff --git a/src/datasets/utils/hub.py b/src/datasets/utils/hub.py
@@ -2,7 +2,11 @@
 from urllib.parse import quote
 
 import huggingface_hub as hfh
+from packaging import version
 
 
 def hf_hub_url(repo_id: str, path: str, revision: Optional[str] = None) -> str:
-    return hfh.hf_hub_url(repo_id, quote(path), repo_type="dataset", revision=revision)
+    if version.parse(hfh.__version__) < version.parse("0.11.0"):
+        # huggingface_hub < 0.11.0 does not URL-encode the file path, so quote it here
+        path = quote(path)
+    return hfh.hf_hub_url(repo_id, path, repo_type="dataset", revision=revision)