Skip to content

Commit 652c5ed

Browse files
authored
Revert #358 and #325 (#366)
Reverted because they broke CI.
1 parent e4c7c20 commit 652c5ed

File tree

4 files changed

+2
-451
lines changed

4 files changed

+2
-451
lines changed

shortfin/python/shortfin_apps/llm/components/service.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -73,7 +73,7 @@ def start(self):
7373
)
7474
]
7575
+ self.inference_modules,
76-
devices=self.sysman.ls.devices,
76+
fiber=self.main_fiber,
7777
trace_execution=False,
7878
)
7979
# Resolve prefill entrypoints.
@@ -393,7 +393,7 @@ async def run(self):
393393
"".join([f"\n {i}: {ary.shape}" for i, ary in enumerate(args)]),
394394
)
395395
# Invoke. Logits are of shape [bs, bsl, d].
396-
(logits,) = await fn(*args, fiber=self.fiber)
396+
(logits,) = await fn(*args)
397397

398398
# Return results.
399399
for i in range(req_count):

shortfin/requirements-tests.txt

-2
Original file line number | Diff line number | Diff line change
@@ -11,8 +11,6 @@ wheel
1111
# Deps needed for shortfin_apps.llm
1212
dataclasses-json
1313
tokenizers
14-
numpy
15-
sentencepiece
1614

1715
# Deps needed for shortfin_apps.sd
1816
pillow

shortfin/tests/apps/llm/cpu_llm_server_test.py

-173
This file was deleted.

0 commit comments

Comments
 (0)