We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 9e8d919 + 3f0a20d, commit 6fc7704. Copy full SHA for 6fc7704
src/engine.py
@@ -24,7 +24,10 @@ class vLLMEngine:
24
def __init__(self, engine = None):
25
load_dotenv() # For local development
26
self.engine_args = get_engine_args()
27
+ if os.getenv("MODEL_CACHE_ENABLE"):
28
+ self.engine_args.model = f"/runpod/cache/model/{os.getenv('MODEL_NAME')}/main"
29
logging.info(f"Engine args: {self.engine_args}")
30
+
31
self.tokenizer = TokenizerWrapper(self.engine_args.tokenizer or self.engine_args.model,
32
self.engine_args.tokenizer_revision,
33
self.engine_args.trust_remote_code)
0 commit comments