Spaces:
Sleeping
Sleeping
Update training/train_agent.py
Browse files- training/train_agent.py +1 -1
training/train_agent.py
CHANGED
|
@@ -328,7 +328,7 @@ def generate_plots(trainer):
|
|
| 328 |
|
| 329 |
fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(13, 5))
|
| 330 |
fig.suptitle("GRPO Training — SQL Database Engineer Agent\n"
|
| 331 |
-
"Qwen2.5-
|
| 332 |
fontsize=13, fontweight="bold")
|
| 333 |
|
| 334 |
# ── LEFT: Loss with smoothing ──────────────────────────────
|
|
|
|
| 328 |
|
| 329 |
fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(13, 5))
|
| 330 |
fig.suptitle("GRPO Training — SQL Database Engineer Agent\n"
|
| 331 |
+
"Qwen2.5-7B fine-tuned with Unsloth + TRL",
|
| 332 |
fontsize=13, fontweight="bold")
|
| 333 |
|
| 334 |
# ── LEFT: Loss with smoothing ──────────────────────────────
|