Update server.py
Browse files
server.py
CHANGED
|
@@ -129,16 +129,12 @@ class SFTVisionT5Model(nn.Module):
|
|
| 129 |
encoder_hidden_states.size()[:2], device=pixel_values.device
|
| 130 |
)
|
| 131 |
|
| 132 |
-
# BUG FIX 3: repetition_penalty + no_repeat_ngram_size breaks
|
| 133 |
-
# the "Projection: Projection: Projection:" loop
|
| 134 |
generated_ids = self.t5.generate(
|
| 135 |
encoder_outputs=encoder_outputs,
|
| 136 |
attention_mask=attn,
|
| 137 |
max_length=max_length,
|
| 138 |
num_beams=4,
|
| 139 |
early_stopping=True,
|
| 140 |
-
no_repeat_ngram_size=3,
|
| 141 |
-
repetition_penalty=1.3,
|
| 142 |
)
|
| 143 |
|
| 144 |
reports = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)
|
|
@@ -186,8 +182,6 @@ class PPOVisionT5Model(nn.Module):
|
|
| 186 |
max_length=max_length,
|
| 187 |
num_beams=4,
|
| 188 |
early_stopping=True,
|
| 189 |
-
no_repeat_ngram_size=3,
|
| 190 |
-
repetition_penalty=1.3,
|
| 191 |
)
|
| 192 |
|
| 193 |
reports = tokenizer.batch_decode(generated, skip_special_tokens=True)
|
|
|
|
| 129 |
encoder_hidden_states.size()[:2], device=pixel_values.device
|
| 130 |
)
|
| 131 |
|
|
|
|
|
|
|
| 132 |
generated_ids = self.t5.generate(
|
| 133 |
encoder_outputs=encoder_outputs,
|
| 134 |
attention_mask=attn,
|
| 135 |
max_length=max_length,
|
| 136 |
num_beams=4,
|
| 137 |
early_stopping=True,
|
|
|
|
|
|
|
| 138 |
)
|
| 139 |
|
| 140 |
reports = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)
|
|
|
|
| 182 |
max_length=max_length,
|
| 183 |
num_beams=4,
|
| 184 |
early_stopping=True,
|
|
|
|
|
|
|
| 185 |
)
|
| 186 |
|
| 187 |
reports = tokenizer.batch_decode(generated, skip_special_tokens=True)
|