Skip to content

Commit 3c7bd48

Browse files
committed
Get rid of some more HF (Hugging Face) bloat
1 parent 1df0230 commit 3c7bd48

File tree

5 files changed: 6 additions and 82 deletions

5 files changed

+6
-82
lines changed

exo/download/test_new_shard_download.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
from exo.download.hf.new_shard_download import download_shard, NewShardDownloader
1+
from exo.download.new_shard_download import download_shard, NewShardDownloader
22
from exo.inference.shard import Shard
33
from exo.models import get_model_id
44
from pathlib import Path

exo/inference/mlx/test_non_blocking.py

+2-2
Original file line numberDiff line numberDiff line change
@@ -2,15 +2,15 @@
22
import time
33
import numpy as np
44
from exo.inference.mlx.sharded_inference_engine import MLXDynamicShardInferenceEngine
5-
from exo.download.hf.hf_shard_download import HFShardDownloader
5+
from exo.download.new_shard_download import NewShardDownloader
66
from exo.inference.shard import Shard
77
from exo.models import build_base_shard
88
from collections import deque
99
from statistics import mean, median
1010

1111
async def test_non_blocking():
1212
# Setup
13-
shard_downloader = HFShardDownloader()
13+
shard_downloader = NewShardDownloader()
1414
engine = MLXDynamicShardInferenceEngine(shard_downloader)
1515
_shard = build_base_shard("llama-3.1-8b", "MLXDynamicShardInferenceEngine")
1616
shard = Shard(_shard.model_id, _shard.start_layer, _shard.n_layers - 1, _shard.n_layers)

exo/inference/test_inference_engine.py

+3-3
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
from exo.inference.mlx.sharded_inference_engine import MLXDynamicShardInferenceEngine
2-
from exo.download.hf.hf_shard_download import HFShardDownloader
32
from exo.inference.inference_engine import InferenceEngine
3+
from exo.download.new_shard_download import NewShardDownloader
44
from exo.inference.shard import Shard
55
from exo.helpers import DEBUG
66
import os
@@ -44,13 +44,13 @@ async def test_inference_engine(inference_engine_1: InferenceEngine, inference_e
4444
assert np.array_equal(next_resp_full, resp4)
4545

4646

47-
asyncio.run(test_inference_engine(MLXDynamicShardInferenceEngine(HFShardDownloader()), MLXDynamicShardInferenceEngine(HFShardDownloader()), "llama-3.2-1b", 16))
47+
asyncio.run(test_inference_engine(MLXDynamicShardInferenceEngine(NewShardDownloader()), MLXDynamicShardInferenceEngine(NewShardDownloader()), "llama-3.2-1b", 16))
4848

4949
if os.getenv("RUN_TINYGRAD", default="0") == "1":
5050
import tinygrad
5151
import os
5252
from exo.inference.tinygrad.inference import TinygradDynamicShardInferenceEngine
5353
tinygrad.helpers.DEBUG.value = int(os.getenv("TINYGRAD_DEBUG", default="0"))
5454
asyncio.run(
55-
test_inference_engine(TinygradDynamicShardInferenceEngine(HFShardDownloader()), TinygradDynamicShardInferenceEngine(HFShardDownloader()), "llama-3-8b", 32)
55+
test_inference_engine(TinygradDynamicShardInferenceEngine(NewShardDownloader()), TinygradDynamicShardInferenceEngine(NewShardDownloader()), "llama-3-8b", 32)
5656
)

extra/download_hf.py

-50
This file was deleted.

test/test_hf.py

-26
This file was deleted.

0 commit comments

Comments
 (0)