Browse Source

fixed failing node

tags/v0.3.11-rc1
ShashwatPatil 10 months ago
parent
commit
e06d8ea22f
1 changed file with 1 addition and 2 deletions
  1. +1
    -2
      node-hub/dora-transformer/dora_transformer/main.py

+ 1
- 2
node-hub/dora-transformer/dora_transformer/main.py View File

@@ -129,8 +129,7 @@ def generate_response(model, tokenizer, text: str, history, max_retries: int = 3
else:
# Final retry: Reduce token count
logging.info("Reducing token count for final attempt")
- global MAX_TOKENS
- MAX_TOKENS = max(32, MAX_TOKENS // 2)
+ MAX_TOKENS = 24
continue
else:
# For non-CUDA OOM errors, raise immediately


Loading…
Cancel
Save