forked from eugr/spark-vllm-docker
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path: flashinfer_cache.patch
More file actions
18 lines (18 loc) · 826 Bytes
/
flashinfer_cache.patch
File metadata and controls
18 lines (18 loc) · 826 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
--- a/flashinfer/artifacts.py
+++ b/flashinfer/artifacts.py
@@ -203,8 +203,12 @@
with ThreadPoolExecutor(num_threads) as pool:
futures = []
- for name, _ in cubin_files:
- source = safe_urljoin(FLASHINFER_CUBINS_REPOSITORY, name)
- local_path = FLASHINFER_CUBIN_DIR / name
+ for name, checksum in cubin_files:
+ local_path = FLASHINFER_CUBIN_DIR / name
+ if local_path.exists() and verify_cubin(str(local_path), checksum):
+ pbar.update(1)
+ continue
+
+ source = safe_urljoin(FLASHINFER_CUBINS_REPOSITORY, name)
# Ensure parent directory exists
local_path.parent.mkdir(parents=True, exist_ok=True)
fut = pool.submit(