Skip to content

Commit

Permalink
Merge pull request #157 from runpod-workers/m-c
Browse files Browse the repository at this point in the history
Enabling model caching.
  • Loading branch information
pandyamarut authored Feb 6, 2025
2 parents 9e8d919 + 3f0a20d commit 6fc7704
Showing 1 changed file with 3 additions and 0 deletions.
3 changes: 3 additions & 0 deletions src/engine.py
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,10 @@ class vLLMEngine:
def __init__(self, engine = None):
load_dotenv() # For local development
self.engine_args = get_engine_args()
if os.getenv("MODEL_CACHE_ENABLE"):
self.engine_args.model = f"/runpod/cache/model/{os.getenv('MODEL_NAME')}/main"
logging.info(f"Engine args: {self.engine_args}")

self.tokenizer = TokenizerWrapper(self.engine_args.tokenizer or self.engine_args.model,
self.engine_args.tokenizer_revision,
self.engine_args.trust_remote_code)
Expand Down

0 comments on commit 6fc7704

Please sign in to comment.