mirror of
https://github.com/microsoft/SkillOpt.git
synced 2026-07-05 07:11:18 +08:00
- Rename teacher -> optimizer, student -> target across all code, configs, docs, prompts - CLI: --teacher_model -> --optimizer_model, --student_model -> --target_model - Remove best_skill files, keep only initial skills - Fix slow update gate (force write into skill) - Fix SLOW_UPDATE marker stripping - Remove deep_reflect and meta_reflect mechanisms - Update .env.example with export prefix and azure_cli docs - Add endpoint empty validation in azure_openai.py Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
165 lines
5.8 KiB
Python
165 lines
5.8 KiB
Python
"""ReflACT skill operations — edit application and patch processing.
|
|
|
|
The Update stage (⑤) of the ReflACT pipeline: apply a ranked set of
|
|
edits to the current skill document, producing an updated candidate.
|
|
Analogous to optimizer.step() in neural network training.
|
|
"""
|
|
from __future__ import annotations
|
|
|
|
from typing import TYPE_CHECKING
|
|
|
|
if TYPE_CHECKING:
|
|
from skillopt.types import Edit as EditType, Patch as PatchType
|
|
|
|
SLOW_UPDATE_START = "<!-- SLOW_UPDATE_START -->"
|
|
SLOW_UPDATE_END = "<!-- SLOW_UPDATE_END -->"
|
|
|
|
|
|
def _is_in_slow_update_region(skill: str, target: str) -> bool:
|
|
"""Check if *target* text falls within the protected slow update region."""
|
|
start_idx = skill.find(SLOW_UPDATE_START)
|
|
end_idx = skill.find(SLOW_UPDATE_END)
|
|
if start_idx == -1 or end_idx == -1:
|
|
return False
|
|
target_idx = skill.find(target)
|
|
if target_idx == -1:
|
|
return False
|
|
region_end = end_idx + len(SLOW_UPDATE_END)
|
|
return start_idx <= target_idx < region_end
|
|
|
|
|
|
def _strip_slow_update_markers(text: str) -> str:
|
|
"""Remove any SLOW_UPDATE markers from edit content to prevent duplication."""
|
|
return (
|
|
text.replace(SLOW_UPDATE_START, "")
|
|
.replace(SLOW_UPDATE_END, "")
|
|
)
|
|
|
|
|
|
def _edit_fields(edit: EditType | dict) -> tuple[str, str, str]:
|
|
op = edit.op if hasattr(edit, "op") else edit.get("op", "")
|
|
content = _strip_slow_update_markers(
|
|
(edit.content if hasattr(edit, "content") else edit.get("content", "")).strip()
|
|
)
|
|
target = edit.target if hasattr(edit, "target") else edit.get("target", "")
|
|
return op, content, target
|
|
|
|
|
|
def _apply_edit_with_report(skill: str, edit: EditType | dict) -> tuple[str, dict]:
|
|
op, content, target = _edit_fields(edit)
|
|
report = {
|
|
"op": op,
|
|
"target": target[:200],
|
|
"content_preview": content[:200],
|
|
"status": "unknown",
|
|
}
|
|
|
|
if target and _is_in_slow_update_region(skill, target):
|
|
report["status"] = "skipped_protected_slow_update_region"
|
|
return skill, report
|
|
|
|
if op == "append":
|
|
su_start = skill.find(SLOW_UPDATE_START)
|
|
if su_start != -1:
|
|
before = skill[:su_start].rstrip()
|
|
after = skill[su_start:]
|
|
report["status"] = "applied_append_before_slow_update"
|
|
return before + "\n\n" + content + "\n\n" + after, report
|
|
report["status"] = "applied_append"
|
|
return skill.rstrip() + "\n\n" + content + "\n", report
|
|
|
|
if op == "insert_after":
|
|
if not target or target not in skill:
|
|
su_start = skill.find(SLOW_UPDATE_START)
|
|
if su_start != -1:
|
|
before = skill[:su_start].rstrip()
|
|
after = skill[su_start:]
|
|
report["status"] = "applied_insert_after_fallback_before_slow_update"
|
|
return before + "\n\n" + content + "\n\n" + after, report
|
|
report["status"] = "applied_insert_after_fallback_append"
|
|
return skill.rstrip() + "\n\n" + content + "\n", report
|
|
idx = skill.index(target) + len(target)
|
|
newline = skill.find("\n", idx)
|
|
insert_at = newline + 1 if newline != -1 else len(skill)
|
|
report["status"] = "applied_insert_after"
|
|
return skill[:insert_at] + "\n" + content + "\n" + skill[insert_at:], report
|
|
|
|
if op == "replace":
|
|
if not target:
|
|
report["status"] = "skipped_replace_missing_target"
|
|
return skill, report
|
|
if target not in skill:
|
|
report["status"] = "skipped_replace_target_not_found"
|
|
return skill, report
|
|
report["status"] = "applied_replace"
|
|
return skill.replace(target, content, 1), report
|
|
|
|
if op == "delete":
|
|
if not target:
|
|
report["status"] = "skipped_delete_missing_target"
|
|
return skill, report
|
|
if target not in skill:
|
|
report["status"] = "skipped_delete_target_not_found"
|
|
return skill, report
|
|
report["status"] = "applied_delete"
|
|
return skill.replace(target, "", 1), report
|
|
|
|
report["status"] = "skipped_unknown_op"
|
|
return skill, report
|
|
|
|
|
|
def apply_edit(skill: str, edit: EditType | dict) -> str:
|
|
"""Apply a single edit operation to the skill document.
|
|
|
|
Parameters
|
|
----------
|
|
skill : str
|
|
Current skill document content.
|
|
edit : Edit | dict
|
|
An :class:`~skillopt.types.Edit` instance or a plain dict with
|
|
keys ``op``, ``content``, ``target``.
|
|
|
|
Edits targeting the protected slow-update region are silently skipped.
|
|
"""
|
|
updated_skill, _ = _apply_edit_with_report(skill, edit)
|
|
return updated_skill
|
|
|
|
|
|
def apply_patch_with_report(
|
|
skill: str,
|
|
patch: PatchType | dict,
|
|
) -> tuple[str, list[dict]]:
|
|
"""Apply a patch and return a per-edit report for observability."""
|
|
edits = patch.edits if hasattr(patch, "edits") else patch.get("edits", [])
|
|
reports: list[dict] = []
|
|
for idx, edit in enumerate(edits, 1):
|
|
try:
|
|
skill, report = _apply_edit_with_report(skill, edit)
|
|
report["index"] = idx
|
|
except Exception as exc: # noqa: BLE001
|
|
report = {
|
|
"index": idx,
|
|
"op": "",
|
|
"target": "",
|
|
"content_preview": "",
|
|
"status": "error",
|
|
"error": str(exc),
|
|
}
|
|
reports.append(report)
|
|
return skill, reports
|
|
|
|
|
|
def apply_patch(skill: str, patch: PatchType | dict) -> str:
|
|
"""Apply a patch (list of edits) to the skill document sequentially.
|
|
|
|
Parameters
|
|
----------
|
|
skill : str
|
|
Current skill document content.
|
|
patch : Patch | dict
|
|
A :class:`~skillopt.types.Patch` instance or a plain dict with
|
|
key ``edits`` containing a list of edit operations.
|
|
"""
|
|
updated_skill, _ = apply_patch_with_report(skill, patch)
|
|
return updated_skill
|