הבעיה

איך מודל שפה עובר מייצור טקסט לעשייה בעולם האמיתי?

המודל יכול לחשוב, לתכנן ולייצר קוד — אבל אין לו ידיים. הוא לא יכול להריץ פקודה, לקרוא קובץ או לבדוק תוצאה. הוא מוח בצנצנת.

הפתרון

לולאה אחת. כלי אחד. זו כל הארכיטקטורה.

while True:
  response = LLM(messages, tools)
  if stop_reason != "tool_use": return
  execute tools
  append results
  loop back

המודל מחליט מתי לקרוא לכלים ומתי לעצור. הקוד רק מבצע את מה שהמודל מבקש.

הלולאה המרכזית

def agent_loop(messages):
    """Run the model/tool exchange until the model stops requesting tools.

    ``messages`` is the conversation history and is mutated in place: each
    assistant reply is appended, followed by a ``user`` message carrying the
    results of any tools the model asked for. Returns ``None`` as soon as a
    reply's ``stop_reason`` is anything other than ``"tool_use"``.

    Handlers are looked up by tool name in ``TOOL_HANDLERS`` and called with
    the tool input expanded as keyword arguments.
    """
    while True:
        reply = client.messages.create(
            model=MODEL,
            system=SYSTEM,
            messages=messages,
            tools=TOOLS,
            max_tokens=8000,
        )
        # The assistant turn is recorded before the stop check, so the final
        # answer also ends up in the history.
        messages.append({"role": "assistant", "content": reply.content})

        if reply.stop_reason != "tool_use":
            return

        # One tool_result per tool_use block, tied back to it by id.
        tool_results = [
            {
                "type": "tool_result",
                "tool_use_id": call.id,
                "content": TOOL_HANDLERS[call.name](**call.input),
            }
            for call in reply.content
            if call.type == "tool_use"
        ]
        messages.append({"role": "user", "content": tool_results})

ארבעה שלבים — הראשון מתבצע פעם אחת לכל פנייה של המשתמש, ושלושת האחרים חוזרים על עצמם עד שהמודל מסיים:

1. הוסף את ההנחיה של המשתמש להיסטוריית ההודעות
2. שלח הודעות + הגדרות כלים ל-LLM
3. בדוק stop_reason — אם זה לא tool_use, המודל סיים
4. בצע כל קריאת כלי, הוסף את התוצאות, חזור ללולאה (שלב 2)

כלי ה-Bash

# JSON Schema for the bash tool's arguments: an object with exactly one
# required string field, "command".
_BASH_INPUT_SCHEMA = {
    "type": "object",
    "properties": {"command": {"type": "string"}},
    "required": ["command"],
}

# Tool definitions passed to the model on every request. There is a single
# tool, "bash".
TOOLS = [
    {
        "name": "bash",
        "description": "Run a shell command.",
        "input_schema": _BASH_INPUT_SCHEMA,
    },
]

def run_bash(command: str) -> str:
    """Run *command* through the shell and return its output as text.

    Args:
        command: The shell command line to execute. It is passed to the
            shell as-is (``shell=True``) and runs in the current working
            directory.

    Returns:
        stdout followed by stderr, stripped of surrounding whitespace and
        truncated to 50000 characters; ``"(no output)"`` when both streams
        are empty; or an ``"Error: ..."`` string when the command is blocked
        or exceeds the 120-second timeout.
    """
    # Best-effort guard only: a plain substring match against a few obviously
    # destructive patterns. It is not a sandbox and is easy to bypass.
    dangerous = ["rm -rf /", "sudo", "shutdown", "reboot", "> /dev/"]
    if any(d in command for d in dangerous):
        return "Error: Dangerous command blocked"
    try:
        # errors="replace" keeps commands that emit non-text bytes (e.g.
        # `cat` on a binary file) from raising UnicodeDecodeError.
        r = subprocess.run(command, shell=True, cwd=os.getcwd(),
                           capture_output=True, text=True, errors="replace",
                           timeout=120)
    except subprocess.TimeoutExpired:
        # Report the timeout to the caller as text instead of raising.
        return "Error: Timeout (120s)"
    out = (r.stdout + r.stderr).strip()
    return out[:50000] if out else "(no output)"

הגדרת כלי אחת. handler אחד. כעת יש למודל ידיים — הוא יכול להריץ פקודות shell (למעט אלה שנחסמות ברשימת הפקודות המסוכנות) ולקרוא את הפלט.

המימוש המלא

#!/usr/bin/env python3
"""s01_agent_loop.py - The Agent Loop"""

import os, subprocess
from anthropic import Anthropic
from dotenv import load_dotenv

# Load variables from a .env file before anything below reads the environment.
# override=True: per python-dotenv, values from .env replace variables that
# are already set in the process environment.
load_dotenv(override=True)
# SDK client built with no explicit arguments; credentials presumably come
# from the environment (e.g. ANTHROPIC_API_KEY) -- confirm against SDK docs.
client = Anthropic()
# Mandatory setting: indexing os.environ raises KeyError at import time when
# MODEL_ID is not defined.
MODEL = os.environ["MODEL_ID"]
# System prompt; the working directory is captured once, at module load.
SYSTEM = f"You are a coding agent at {os.getcwd()}. Use bash to solve tasks."

# JSON Schema for the bash tool's arguments: an object with exactly one
# required string field, "command".
_BASH_INPUT_SCHEMA = {
    "type": "object",
    "properties": {"command": {"type": "string"}},
    "required": ["command"],
}

# Tool definitions passed to the model on every request. There is a single
# tool, "bash".
TOOLS = [
    {
        "name": "bash",
        "description": "Run a shell command.",
        "input_schema": _BASH_INPUT_SCHEMA,
    },
]

def run_bash(command: str) -> str:
    """Run *command* through the shell and return its output as text.

    Args:
        command: The shell command line to execute. It is passed to the
            shell as-is (``shell=True``) and runs in the current working
            directory.

    Returns:
        stdout followed by stderr, stripped of surrounding whitespace and
        truncated to 50000 characters; ``"(no output)"`` when both streams
        are empty; or an ``"Error: ..."`` string when the command is blocked
        or exceeds the 120-second timeout.
    """
    # Best-effort guard only: a plain substring match against a few obviously
    # destructive patterns. It is not a sandbox and is easy to bypass.
    dangerous = ["rm -rf /", "sudo", "shutdown", "reboot", "> /dev/"]
    if any(d in command for d in dangerous):
        return "Error: Dangerous command blocked"
    try:
        # errors="replace" keeps commands that emit non-text bytes (e.g.
        # `cat` on a binary file) from raising UnicodeDecodeError.
        r = subprocess.run(command, shell=True, cwd=os.getcwd(),
                           capture_output=True, text=True, errors="replace",
                           timeout=120)
    except subprocess.TimeoutExpired:
        # Report the timeout to the model as text instead of raising.
        return "Error: Timeout (120s)"
    out = (r.stdout + r.stderr).strip()
    return out[:50000] if out else "(no output)"

def agent_loop(messages: list):
    """Run the model/bash exchange until the model stops requesting tools.

    ``messages`` is the conversation history and is mutated in place: each
    assistant reply is appended, followed by a ``user`` message holding one
    ``tool_result`` per ``tool_use`` block. Every command is echoed to the
    terminal together with the first 200 characters of its output. Returns
    ``None`` once a reply's ``stop_reason`` is not ``"tool_use"``.
    """
    while True:
        reply = client.messages.create(
            model=MODEL,
            system=SYSTEM,
            messages=messages,
            tools=TOOLS,
            max_tokens=8000,
        )
        # The assistant turn is recorded before the stop check, so the final
        # answer also ends up in the history.
        messages.append({"role": "assistant", "content": reply.content})
        if reply.stop_reason != "tool_use":
            return

        tool_results = []
        for call in (b for b in reply.content if b.type == "tool_use"):
            command = call.input["command"]
            print(f"\033[33m$ {command}\033[0m")
            output = run_bash(command)
            # Only a preview is printed; the model receives the full output.
            print(output[:200])
            tool_results.append(
                {"type": "tool_result", "tool_use_id": call.id, "content": output}
            )
        messages.append({"role": "user", "content": tool_results})

if __name__ == "__main__":
    # Interactive prompt: each line typed by the user is appended to a single
    # shared history, so context carries over between queries.
    EXIT_WORDS = ("q", "exit", "")
    conversation = []
    while True:
        try:
            line = input("\033[36ms01 >> \033[0m")
        except (EOFError, KeyboardInterrupt):
            # Ctrl-D / Ctrl-C at the prompt ends the session quietly.
            break
        if line.strip().lower() in EXIT_WORDS:
            break
        conversation.append({"role": "user", "content": line})
        agent_loop(conversation)

מסקנה מרכזית

הסוד השלם של סוכן קוד מבוסס AI הוא הלולאה הזו. המודל הוא הבינה — הוא מחליט מה לעשות. הקוד הוא הרתמה — הוא נותן למודל כלי ומזין חזרה תוצאות. בסשן הבא (שימוש בכלים), נוסיף עוד כלים מבלי לשנות את הלולאה כלל.

1. לולאת הסוכן

מה זה API?

מה זה 'while True'?

מה זה קריאת כלי (tool call)?