Skip to content

Commit

Permalink
fix
Browse files (browse the repository at this point in the history)
  • Loading branch information
sunggg committed Jan 8, 2024
1 parent d58c75e commit 58a1720
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions serve/mlc_serve/utils.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -56,24 +56,24 @@ def create_mlc_engine(args: argparse.Namespace):
"max_decode_steps": args.max_decode_steps,
}
)

# type: off
if args.use_staging_engine:
engine = StagingInferenceEngine(
tokenizer_module=HfTokenizerModule(args.model_artifact_path),
model_module_loader=PagedCacheModelModule,
model_module_loader=PagedCacheModelModule,
model_module_loader_kwargs={
"model_artifact_path": args.model_artifact_path,
"engine_config": engine_config,
},
)
engine.start()
else:
engine = SynchronousInferenceEngine(
PagedCacheModelModule(
engine = SynchronousInferenceEngine(
PagedCacheModelModule(
model_artifact_path=args.model_artifact_path,
engine_config=engine_config,
)
)

# type: on
return engine

0 comments on commit 58a1720

Please sign in to comment.