Update app.py
Browse files
app.py
CHANGED
|
@@ -79,6 +79,11 @@ def safe_load_pretrained_model(model_path, model_base=None, model_name=None, **k
|
|
| 79 |
tokenizer.add_special_tokens({'pad_token': '[PAD]'})
|
| 80 |
print('[INFO] Added [PAD] token to tokenizer')
|
| 81 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 82 |
# Force all model components to CPU (keep original dtype if possible, fallback to float32)
|
| 83 |
print('[INFO] Ensuring all components are on CPU...')
|
| 84 |
try:
|
|
|
|
| 79 |
tokenizer.add_special_tokens({'pad_token': '[PAD]'})
|
| 80 |
print('[INFO] Added [PAD] token to tokenizer')
|
| 81 |
|
| 82 |
+
# Set padding_side to left for Llama 3 (prevents empty generation)
|
| 83 |
+
if hasattr(tokenizer, 'padding_side'):
|
| 84 |
+
tokenizer.padding_side = "left"
|
| 85 |
+
print('[INFO] Set tokenizer.padding_side to "left" for proper generation')
|
| 86 |
+
|
| 87 |
# Force all model components to CPU (keep original dtype if possible, fallback to float32)
|
| 88 |
print('[INFO] Ensuring all components are on CPU...')
|
| 89 |
try:
|