diff --git a/README.md b/README.md index ae1fc65..fd7fc4c 100644 --- a/README.md +++ b/README.md @@ -8,6 +8,14 @@ A 9B parameter language model fine-tuned for Minecraft server operations. Transl ![Training Progress](branding/training_progress.svg) +| Version | Base Model | Training Examples | Loss | Key Addition | +|---------|-----------|-------------------|------|-------------| +| 0.1.0 | Qwen3-8B | 500 | 2.10 | Seed data only | +| 0.2.0 | Qwen3-8B | 1,200 | 1.45 | +entities, +mobs | +| 0.3.0 | Qwen3-8B | 2,100 | 0.82 | +error correction | +| 0.4.0 | Qwen3.5-9B | 3,175 | 0.35 | +tool-calling, base model upgrade | +| **0.5.0** | **Qwen3.5-9B** | **4,358** | **0.16** | **+plugins, +memory, +scripts** | + ## Bake-off: 0.5.0 vs 0.4.0 | Category | 0.4.0 | 0.5.0 | Change | diff --git a/branding/training_progress.svg b/branding/training_progress.svg index 9356223..afc293e 100644 --- a/branding/training_progress.svg +++ b/branding/training_progress.svg @@ -19,23 +19,23 @@ 500 0.1.0 -v1 (seed) +seed only 1,200 0.2.0 -v2 (+entities) ++entities 2,100 0.3.0 -v3 (+errors) ++errors 3,175 0.4.0 -v4 (+tools) ++tools 4,358 0.5.0 -v5 (+plugins) ++plugins loss=2.1 diff --git a/training/scripts/generate_training_chart.py b/training/scripts/generate_training_chart.py index 08c7122..5e75a21 100644 --- a/training/scripts/generate_training_chart.py +++ b/training/scripts/generate_training_chart.py @@ -13,11 +13,11 @@ OUTPUT = Path(__file__).resolve().parent.parent.parent / "branding" / "training_ # Historical data from training runs VERSIONS = [ - {"version": "0.1.0", "examples": 500, "loss": 2.10, "label": "v1 (seed)"}, - {"version": "0.2.0", "examples": 1200, "loss": 1.45, "label": "v2 (+entities)"}, - {"version": "0.3.0", "examples": 2100, "loss": 0.82, "label": "v3 (+errors)"}, - {"version": "0.4.0", "examples": 3175, "loss": 0.35, "label": "v4 (+tools)"}, - {"version": "0.5.0", "examples": 4358, "loss": 0.16, "label": "v5 (+plugins)"}, + {"version": "0.1.0", "examples": 500, "loss": 2.10, "label": "seed only"}, + {"version": "0.2.0", "examples": 1200, "loss": 1.45, "label": "+entities"}, + {"version": "0.3.0", "examples": 2100, "loss": 0.82, "label": "+errors"}, + {"version": "0.4.0", "examples": 3175, "loss": 0.35, "label": "+tools"}, + {"version": "0.5.0", "examples": 4358, "loss": 0.16, "label": "+plugins"}, ] # Chart dimensions