Skip to content

Commit

Permalink
Disable model caching
Browse files (browse the repository at this point in the history)
  • Loading branch information
cornzz committed Sep 9, 2024
1 parent 61bdeef commit 867f94c
Showing 1 changed file with 9 additions and 9 deletions.
18 changes: 9 additions & 9 deletions kubernetes/deployment.yaml
Original file line number | Diff line number | Diff line change
Expand Up @@ -29,17 +29,17 @@ spec:
volumeMounts:
- name: flagged-data
mountPath: /demo/flagged
- name: cache
mountPath: /demo/cache
# - name: cache
# mountPath: /demo/cache
env:
- name: APP_PATH
value: /compress
- name: LLM_LIST
value: meta-llama/Meta-Llama-3.1-70B-Instruct, CohereForAI/c4ai-command-r-plus
- name: HF_HUB_CACHE
value: /demo/cache/huggingface
- name: TIKTOKEN_CACHE_DIR
value: /demo/cache/tiktoken
# - name: HF_HUB_CACHE
# value: /demo/cache/huggingface
# - name: TIKTOKEN_CACHE_DIR
# value: /demo/cache/tiktoken
- name: LLM_ENDPOINT
valueFrom:
secretKeyRef:
Expand All @@ -59,6 +59,6 @@ spec:
- name: flagged-data
persistentVolumeClaim:
claimName: llmlingua-demo-data
- name: cache
persistentVolumeClaim:
claimName: llmlingua-demo-cache
# - name: cache
# persistentVolumeClaim:
# claimName: llmlingua-demo-cache

0 comments on commit 867f94c

Please sign in to comment.