Update modeling_quiet.py
Browse files
- modeling_quiet.py +1 -1
modeling_quiet.py
CHANGED
@@ -1069,7 +1069,7 @@ class QuietModel(QuietPreTrainedModel):
|
|
1069 |
"You are attempting to perform batched generation with padding_side='right'"
|
1070 |
" this may lead to unexpected behaviour for Flash Attention version of Quiet. Make sure to "
|
1071 |
" call `tokenizer.padding_side = 'left'` before tokenizing the input. "
|
1072 |
-
|
1073 |
if self._attn_implementation == "flash_attention_2":
|
1074 |
# Convert 2D mask to 4D and adjust size
|
1075 |
attention_mask = _prepare_4d_causal_attention_mask(
|
|
|
1069 |
"You are attempting to perform batched generation with padding_side='right'"
|
1070 |
" this may lead to unexpected behaviour for Flash Attention version of Quiet. Make sure to "
|
1071 |
" call `tokenizer.padding_side = 'left'` before tokenizing the input. "
|
1072 |
+
)
|
1073 |
if self._attn_implementation == "flash_attention_2":
|
1074 |
# Convert 2D mask to 4D and adjust size
|
1075 |
attention_mask = _prepare_4d_causal_attention_mask(
|