Update content
This commit is contained in:
parent
5e8d901a18
commit
6ab2aec57e
121
.autograde/aggregate_llm_grades.py
Normal file
121
.autograde/aggregate_llm_grades.py
Normal file
@ -0,0 +1,121 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
聚合多个 LLM 评分结果
|
||||||
|
"""
|
||||||
|
import json
|
||||||
|
import argparse
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
|
||||||
|
def load_grade(filepath):
    """Load a single grade JSON file.

    Returns the parsed dict, or None when the file is missing or is not
    valid JSON (a warning is printed in either case).
    """
    try:
        handle = open(filepath, 'r', encoding='utf-8')
    except FileNotFoundError:
        print(f"Warning: {filepath} not found")
        return None
    with handle:
        try:
            return json.load(handle)
        except json.JSONDecodeError as e:
            print(f"Error parsing {filepath}: {e}")
            return None
|
||||||
|
|
||||||
|
|
||||||
|
def aggregate_grades(input_files, output_file, summary_file):
    """Aggregate several per-question LLM grade files.

    Parameters
    ----------
    input_files : list[str]
        Paths to per-question grade JSON files (files that fail to load
        are skipped with a warning from load_grade).
    output_file : str
        Path of the aggregated JSON result to write.
    summary_file : str
        Path of the Markdown summary to write.

    Side effects: writes both output files and prints a short report.
    (Fix: removed the unused local `q_name` that was computed per question
    but never used anywhere.)
    """
    grades = []
    total_score = 0
    max_score = 0
    need_review_count = 0

    for input_file in input_files:
        grade = load_grade(input_file)
        if grade:
            grades.append(grade)
            # Support both formats: 'total' (llm_grade.py) or 'score' (legacy).
            score = grade.get('total', grade.get('score', 0))
            total_score += score
            # Default to 10 points per question when max_score is absent.
            max_score += grade.get('max_score', 10)
            # Count questions flagged for manual review (either flag style).
            if 'need_review' in grade.get('flags', []) or grade.get('need_review', False):
                need_review_count += 1

    # Overall score (0 when nothing was graded).
    final_score = total_score if max_score > 0 else 0
    final_max_score = max_score

    # Aggregated JSON result.
    result = {
        'total_score': final_score,
        'max_score': final_max_score,
        'questions': len(grades),
        'need_review': need_review_count > 0,
        'details': grades
    }

    # Persist the JSON result.
    with open(output_file, 'w', encoding='utf-8') as f:
        json.dump(result, f, indent=2, ensure_ascii=False)

    # Build the Markdown summary.
    summary_lines = [
        '# LLM 简答题评分汇总',
        '',
        f'**总分**: {final_score:.1f} / {final_max_score:.1f}',
        f'**题目数**: {len(grades)}',
        f'**需要人工审核**: {"是" if result["need_review"] else "否"}',
        '',
        '## 各题详情',
        ''
    ]

    for i, grade in enumerate(grades, 1):
        # Support both formats: 'total' (llm_grade.py) or 'score' (legacy).
        score = grade.get('total', grade.get('score', 0))
        max_q_score = grade.get('max_score', 10)
        # Review flag may live in 'flags' or as a top-level boolean.
        need_review = 'need_review' in grade.get('flags', []) or grade.get('need_review', False)
        confidence = grade.get('confidence', 1.0)

        summary_lines.append(f'### SA{i}')
        summary_lines.append(f'- **得分**: {score:.2f} / {max_q_score:.1f}')
        summary_lines.append(f'- **置信度**: {confidence:.2f}')
        if need_review:
            summary_lines.append('- ⚠️ **需要人工审核**')

        # Per-criterion breakdown, when present.
        if 'criteria' in grade:
            summary_lines.append('- **分项**:')
            for criterion in grade['criteria']:
                crit_id = criterion.get('id', '')
                crit_score = criterion.get('score', 0)
                crit_reason = criterion.get('reason', '')
                summary_lines.append(f' - {crit_id}: {crit_score:.1f} - {crit_reason}')

        summary_lines.append('')

    with open(summary_file, 'w', encoding='utf-8') as f:
        f.write('\n'.join(summary_lines))

    print(f"✅ Aggregated {len(grades)} grades")
    print(f" Total: {final_score:.1f} / {final_max_score:.1f}")
    print(f" Output: {output_file}")
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry point: parse arguments and run the aggregation."""
    parser = argparse.ArgumentParser(description='Aggregate LLM grading results')
    parser.add_argument('--inputs', nargs='+', required=True, help='Input grade JSON files')
    parser.add_argument('--out', required=True, help='Output aggregated JSON file')
    parser.add_argument('--summary', required=True, help='Output summary Markdown file')

    opts = parser.parse_args()
    aggregate_grades(opts.inputs, opts.out, opts.summary)


if __name__ == '__main__':
    main()
|
||||||
372
.autograde/create_minimal_metadata.py
Normal file
372
.autograde/create_minimal_metadata.py
Normal file
@ -0,0 +1,372 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
创建完整的成绩元数据文件
|
||||||
|
|
||||||
|
从 grade.json / final_grade.json / llm_grade.json 生成 metadata.json
|
||||||
|
包含所有详细信息:未通过的测试、各题详情等
|
||||||
|
"""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import re
|
||||||
|
from datetime import datetime
|
||||||
|
|
||||||
|
|
||||||
|
def extract_student_id():
    """Resolve the student ID.

    Order of precedence: the STUDENT_ID environment variable, then a
    `stu_xxx` / `stu-xxx` fragment of the REPO environment variable.
    Returns None when neither yields an ID.
    """
    explicit = os.getenv("STUDENT_ID")
    if explicit:
        return explicit

    repo = os.getenv("REPO", "")
    if not repo:
        return None

    # Try the strict suffix form (org/assignment-stu_xxx) first, then a
    # looser match anywhere in the repo string.
    for pattern in (r'-stu[_-]([a-zA-Z0-9_]+)$', r'stu[_-]([a-zA-Z0-9_]+)'):
        hit = re.search(pattern, repo)
        if hit:
            return hit.group(1)

    return None
|
||||||
|
|
||||||
|
|
||||||
|
def extract_assignment_id():
    """Resolve the assignment ID.

    Uses the ASSIGNMENT_ID environment variable when set; otherwise strips
    the `-stu_xxx` / `-template` suffix from the REPO name. Falls back to
    "unknown".
    """
    explicit = os.getenv("ASSIGNMENT_ID")
    if explicit:
        return explicit

    repo = os.getenv("REPO", "")
    if repo:
        # Keep only the repository part (drop the organisation prefix).
        repo_name = repo.split("/")[-1] if "/" in repo else repo

        # Strip the per-student or template suffix.
        candidate = re.sub(r'-stu[_-][a-zA-Z0-9_]+$', '', repo_name)
        candidate = re.sub(r'-template$', '', candidate)
        if candidate:
            return candidate

    return "unknown"
|
||||||
|
|
||||||
|
|
||||||
|
def create_final_metadata(final_grade_file='final_grade.json'):
    """Build the metadata dict from final_grade.json (final-project grading).

    Reads the total/max score and the per-part "breakdown" section, and turns
    the programming, report and frontend parts into a components list.
    Returns {} (and logs to stderr) on any error.
    """
    try:
        with open(final_grade_file, 'r', encoding='utf-8') as f:
            final_data = json.load(f)

        assignment_id = extract_assignment_id()
        student_id = extract_student_id()

        total_score = final_data.get("total_score", 0)
        max_score = final_data.get("max_score", 100)
        breakdown = final_data.get("breakdown", {})

        # Build the individual score components.
        components = []

        # Programming-test part.
        prog = breakdown.get("programming", {})
        if prog:
            prog_component = {
                "type": "programming_java",
                "score": prog.get("score", 0),
                "max_score": prog.get("max_score", 80),
                "details": {
                    "groups": prog.get("groups", {})
                }
            }
            components.append(prog_component)

        # REPORT.md part.
        report = breakdown.get("report", {})
        if report:
            report_component = {
                "type": "llm_report",
                "score": report.get("score", 0),
                "max_score": report.get("max_score", 10),
                "details": {
                    "flags": report.get("flags", []),
                    "confidence": report.get("confidence"),
                    "criteria": report.get("criteria", [])  # per-criterion LLM scores and reasons
                }
            }
            components.append(report_component)

        # FRONTEND.md part.
        frontend = breakdown.get("frontend", {})
        if frontend:
            frontend_component = {
                "type": "llm_frontend",
                "score": frontend.get("score", 0),
                "max_score": frontend.get("max_score", 10),
                "details": {
                    "flags": frontend.get("flags", []),
                    "confidence": frontend.get("confidence"),
                    "criteria": frontend.get("criteria", [])  # per-criterion LLM scores and reasons
                }
            }
            components.append(frontend_component)

        metadata = {
            "version": "1.0",
            "assignment": assignment_id,
            "student_id": student_id,
            "components": components,
            "total_score": round(total_score, 2),
            "total_max_score": max_score,
            "timestamp": datetime.now().isoformat(),
            "generator": "gitea-autograde"
        }

        return metadata
    except Exception as e:
        print(f"Error creating final metadata: {e}", file=sys.stderr)
        return {}
|
||||||
|
|
||||||
|
|
||||||
|
def create_grade_metadata(grade_file='grade.json'):
    """Build the metadata dict from grade.json, including all details.

    Tolerates several historical key spellings for the score fields.
    Returns {} (and logs to stderr) on any error.

    Fix: `coverage`/`raw_score` of exactly 0.0 were previously collapsed to
    None by a truthiness check; they are now preserved.
    """
    try:
        with open(grade_file, 'r') as f:
            grade_data = json.load(f)

        assignment_id = extract_assignment_id()
        student_id = extract_student_id()
        language = os.getenv("LANGUAGE", "java")

        # Extract all relevant fields, accepting old key names as fallbacks.
        final_score = grade_data.get("final_score", grade_data.get("total_score", grade_data.get("score", 0)))
        base_score = grade_data.get("base_score", final_score)
        penalty = grade_data.get("penalty", 0)
        passed = grade_data.get("passed", 0)
        total = grade_data.get("total", 0)
        fails = grade_data.get("fails", [])
        max_score = grade_data.get("max_score", 100)
        test_framework = grade_data.get("test_framework", "junit")
        coverage = grade_data.get("coverage")
        raw_score = grade_data.get("raw_score")
        groups = grade_data.get("groups", {})

        # Derive the component type from the language.
        type_map = {
            "python": "programming_python",
            "java": "programming_java",
            "r": "programming_r"
        }
        component_type = type_map.get(language, f"programming_{language}")

        component = {
            "type": component_type,
            "language": language,
            "score": round(final_score, 2),
            "max_score": max_score,
            "details": {
                "passed": passed,
                "total": total,
                "base_score": round(base_score, 2),
                "penalty": round(penalty, 2),
                # `is not None` keeps a legitimate 0.0 instead of turning it
                # into null (the old truthiness check lost zero values).
                "coverage": round(coverage, 2) if coverage is not None else None,
                "raw_score": round(raw_score, 2) if raw_score is not None else None,
                "failed_tests": fails,
                "test_framework": test_framework,
                "groups": groups
            }
        }

        metadata = {
            "version": "1.0",
            "assignment": assignment_id,
            "student_id": student_id,
            "components": [component],
            "total_score": round(final_score, 2),
            "total_max_score": max_score,
            "timestamp": datetime.now().isoformat(),
            "generator": "gitea-autograde"
        }

        return metadata
    except Exception as e:
        print(f"Error creating grade metadata: {e}", file=sys.stderr)
        return {}
|
||||||
|
|
||||||
|
|
||||||
|
def create_llm_metadata(llm_grade_file='artifacts/llm_grade.json'):
    """Build the metadata dict from llm_grade.json, including all details.

    Accepts either the aggregated format (total_score / details) or the
    older format (total / questions). Returns {} on any error.
    """
    try:
        with open(llm_grade_file, 'r') as f:
            llm_data = json.load(f)

        assignment_id = extract_assignment_id()
        student_id = extract_student_id()

        # Aggregated totals (support both key spellings).
        total_score = llm_data.get("total_score", llm_data.get("total", 0))
        max_score = llm_data.get("max_score", 30)
        need_review = llm_data.get("need_review", False)
        questions_data = llm_data.get("details", llm_data.get("questions", []))

        # Build the per-question detail records.
        question_details = []
        for i, q_data in enumerate(questions_data, 1):
            q_score = q_data.get("total", q_data.get("score", 0))
            q_max = q_data.get("max_score", 10)
            q_confidence = q_data.get("confidence", 1.0)
            q_flags = q_data.get("flags", [])
            q_need_review = "need_review" in q_flags or q_data.get("need_review", False)
            q_criteria = q_data.get("criteria", [])

            # Normalize the criteria format (id / score / reason only).
            formatted_criteria = []
            for crit in q_criteria:
                formatted_criteria.append({
                    "id": crit.get("id", ""),
                    "score": round(float(crit.get("score", 0)), 2),
                    "reason": crit.get("reason", "")
                })

            question_detail = {
                "question_id": f"SA{i}",
                "question_name": q_data.get("question", f"SA{i}"),
                "score": round(float(q_score), 2),
                "max_score": q_max,
                "confidence": round(float(q_confidence), 2),
                "need_review": q_need_review,
                "flags": q_flags,
                "criteria": formatted_criteria
            }
            question_details.append(question_detail)

        component = {
            "type": "llm_essay",
            "score": round(float(total_score), 2),
            "max_score": max_score,
            "details": {
                "questions": len(question_details),
                "need_review": need_review,
                "question_details": question_details
            }
        }

        metadata = {
            "version": "1.0",
            "assignment": assignment_id,
            "student_id": student_id,
            "components": [component],
            "total_score": round(float(total_score), 2),
            "total_max_score": max_score,
            "timestamp": datetime.now().isoformat(),
            "generator": "gitea-autograde"
        }

        return metadata
    except Exception as e:
        print(f"Error creating LLM metadata: {e}", file=sys.stderr)
        return {}
|
||||||
|
|
||||||
|
|
||||||
|
def create_objective_metadata(objective_file='objective_grade.json'):
    """Build the metadata dict from objective_grade.json.

    Re-labels each component type as "objective_<type>"; when the file has
    no component list, a single "objective_total" component is synthesised
    from the overall score. Returns {} on any error.
    """
    try:
        with open(objective_file, 'r', encoding='utf-8') as f:
            objective_data = json.load(f)

        assignment_id = extract_assignment_id()
        student_id = extract_student_id()

        total_score = objective_data.get("score", 0)
        max_score = objective_data.get("max_score", 0)
        components = objective_data.get("components", [])

        formatted_components = []
        for comp in components:
            comp_type = comp.get("type", "objective")
            formatted_components.append({
                "type": f"objective_{comp_type}",
                "score": comp.get("score", 0),
                "max_score": comp.get("max_score", 0),
                "details": comp.get("details", {})
            })

        # Fall back to a single summary component when none were listed.
        if not formatted_components:
            formatted_components.append({
                "type": "objective_total",
                "score": total_score,
                "max_score": max_score,
                "details": {}
            })

        metadata = {
            "version": "1.0",
            "assignment": assignment_id,
            "student_id": student_id,
            "components": formatted_components,
            "total_score": total_score,
            "total_max_score": max_score,
            "timestamp": datetime.now().isoformat(),
            "generator": "gitea-autograde"
        }

        return metadata
    except Exception as e:
        print(f"Error creating objective metadata: {e}", file=sys.stderr)
        return {}
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """Entry point: pick the grade source by GRADE_TYPE and print metadata.

    GRADE_TYPE selects the input format (final / llm / objective / default
    programming); GRADE_FILE optionally overrides the input path. The
    resulting metadata JSON is written to stdout.
    """
    # Configuration comes from environment variables.
    grade_type = os.getenv("GRADE_TYPE", "programming").lower()
    grade_file_override = os.getenv("GRADE_FILE")

    if grade_type == "final":
        # Final-project grade (programming + reports combined).
        final_file = grade_file_override or "final_grade.json"
        if os.path.exists(final_file):
            metadata = create_final_metadata(final_file)
        else:
            print(f"Error: {final_file} not found", file=sys.stderr)
            metadata = {}
    elif grade_type == "llm":
        # LLM essay grade; falls back to a repo-root llm_grade.json.
        llm_file = grade_file_override or "artifacts/llm_grade.json"
        if os.path.exists(llm_file):
            metadata = create_llm_metadata(llm_file)
        elif os.path.exists("llm_grade.json"):
            metadata = create_llm_metadata("llm_grade.json")
        else:
            print(f"Error: {llm_file} not found", file=sys.stderr)
            metadata = {}
    elif grade_type == "objective":
        objective_file = grade_file_override or "objective_grade.json"
        if os.path.exists(objective_file):
            metadata = create_objective_metadata(objective_file)
        else:
            print(f"Error: {objective_file} not found", file=sys.stderr)
            metadata = {}
    else:
        # Programming grade (the default).
        grade_file = grade_file_override or "grade.json"
        if os.path.exists(grade_file):
            metadata = create_grade_metadata(grade_file)
        else:
            print(f"Error: {grade_file} not found", file=sys.stderr)
            metadata = {}

    # Emit the metadata JSON on stdout.
    print(json.dumps(metadata, ensure_ascii=False, indent=2))


if __name__ == "__main__":
    main()
|
||||||
187
.autograde/grade.py
Normal file
187
.autograde/grade.py
Normal file
@ -0,0 +1,187 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
编程题评分脚本
|
||||||
|
|
||||||
|
解析 JUnit XML 报告,计算分数,考虑迟交扣分,生成 grade.json 和 summary.md
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import xml.etree.ElementTree as ET
|
||||||
|
import json
|
||||||
|
import subprocess
|
||||||
|
import os
|
||||||
|
import time
|
||||||
|
import sys
|
||||||
|
from pathlib import Path
|
||||||
|
from dotenv import load_dotenv
|
||||||
|
|
||||||
|
# 加载环境变量(支持从 .env 文件或环境变量读取)
|
||||||
|
load_dotenv()
|
||||||
|
|
||||||
|
|
||||||
|
def commit_ts():
    """Return the Unix timestamp of the most recent git commit.

    Falls back to the current time when git is unavailable or the working
    directory is not a repository.
    """
    cmd = ["git", "log", "-1", "--format=%ct"]
    try:
        raw = subprocess.check_output(cmd, stderr=subprocess.DEVNULL)
        return int(raw.decode().strip())
    except Exception:
        # No git / not a repo: best effort with "now".
        return int(time.time())
|
||||||
|
|
||||||
|
|
||||||
|
def parse_junit(junit_path):
    """
    Parse a JUnit XML report.

    A testcase counts as not-passed when it has a failure, error or skipped
    child element. (Fix: the old check treated ANY child element — e.g.
    <system-out> or <properties> — as a failure.)

    Returns
    -------
    passed : int
        Number of passing tests.
    total : int
        Total number of tests.
    fails : list
        Names of non-passing tests ("classname.name" when a classname exists).
    """
    if not os.path.exists(junit_path):
        return (0, 0, [])

    try:
        root = ET.parse(junit_path).getroot()
        total = 0
        passed = 0
        fails = []

        for testsuite in root.iter("testsuite"):
            for testcase in testsuite.iter("testcase"):
                total += 1
                # Only these child tags mark a non-pass; other children such
                # as <system-out> must not be counted against the test.
                if any(child.tag in ("failure", "error", "skipped") for child in testcase):
                    classname = testcase.get("classname", "")
                    name = testcase.get("name", "")
                    full_name = f"{classname}.{name}" if classname else name
                    fails.append(full_name)
                else:
                    passed += 1

        return (passed, total, fails)
    except Exception as e:
        print(f"Error parsing JUnit XML: {e}", file=sys.stderr)
        return (0, 0, [])
|
||||||
|
|
||||||
|
|
||||||
|
def calculate_late_penalty(deadline_str):
    """
    Compute the late-submission penalty.

    Parameters
    ----------
    deadline_str : str
        Deadline in ISO-ish format (e.g. "2025-03-15T23:59:59+08:00").

    Returns
    -------
    penalty : float
        Points to deduct (0-30); 0.0 when no deadline is set or on error.
    """
    if not deadline_str:
        return 0.0

    try:
        text = deadline_str.strip()
        # Crude timezone strip. NOTE(review): negative offsets like "-05:00"
        # are not split here, but the [:19] slice below drops them anyway —
        # the deadline is effectively interpreted in local time; confirm
        # that matches the course policy.
        if '+' in text:
            text = text.split('+')[0]
        elif 'Z' in text:
            text = text.replace('Z', '')

        # Accept both "T"-separated and space-separated date/time forms.
        fmt = "%Y-%m-%dT%H:%M:%S" if 'T' in text else "%Y-%m-%d %H:%M:%S"
        deadline_epoch = time.mktime(time.strptime(text[:19], fmt))

        overdue_sec = max(0, commit_ts() - deadline_epoch)
        days = overdue_sec / 86400

        # Penalty rule: 10 points for the first day, 5 per day after,
        # capped at 30.
        penalty = min(30.0, 10.0 + 5.0 * days) if days > 0 else 0.0
        return round(penalty, 2)
    except Exception as e:
        print(f"Error calculating late penalty: {e}", file=sys.stderr)
        return 0.0
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """Grade a programming assignment from a JUnit XML report.

    Computes the pass-rate score, applies the late penalty from the
    DEADLINE environment variable, and writes grade.json plus summary.md.
    """
    parser = argparse.ArgumentParser(description="Grade programming assignments from JUnit XML")
    parser.add_argument("--junit", required=True, help="Path to JUnit XML file")
    parser.add_argument("--out", default="grade.json", help="Output JSON file")
    parser.add_argument("--summary", default="summary.md", help="Output summary markdown file")
    parser.add_argument("--bonus", default=None, help="Optional bonus file (e.g., lintr.rds)")
    args = parser.parse_args()

    # Parse the JUnit XML report.
    passed, total, fails = parse_junit(args.junit)

    # Base score: proportional to the pass rate (0 when no tests ran).
    if total > 0:
        base_score = 100.0 * (passed / total)
    else:
        base_score = 0.0

    # Late penalty from the DEADLINE environment variable.
    deadline = os.getenv("DEADLINE", "")
    penalty = calculate_late_penalty(deadline)

    # Final score, floored at zero.
    final_score = max(0.0, round(base_score - penalty, 2))

    # Write grade.json.
    grade_data = {
        "score": final_score,
        "base_score": round(base_score, 2),
        "penalty": penalty,
        "passed": passed,
        "total": total,
        "fails": fails,
        "timestamp": int(time.time())
    }

    with open(args.out, "w", encoding="utf-8") as f:
        json.dump(grade_data, f, ensure_ascii=False, indent=2)

    # Write summary.md (student-facing Markdown report).
    with open(args.summary, "w", encoding="utf-8") as f:
        f.write("# 成绩报告\n\n")
        f.write(f"- **通过用例**:{passed}/{total}\n")
        f.write(f"- **原始分**:{base_score:.2f}/100\n")
        if penalty > 0:
            f.write(f"- **迟交扣分**:-{penalty:.2f}\n")
        f.write(f"- **最终分**:**{final_score:.2f}/100**\n\n")

        if fails:
            f.write("## 未通过的测试\n\n")
            for fail in fails:
                f.write(f"- {fail}\n")
            f.write("\n")

        if deadline:
            f.write(f"## 截止时间\n\n")
            f.write(f"- 截止时间:{deadline}\n")
            commit_time_str = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(commit_ts()))
            f.write(f"- 提交时间:{commit_time_str}\n")

    print(f"Grading complete: {final_score:.2f}/100 ({passed}/{total} tests passed)")


if __name__ == "__main__":
    main()
|
||||||
|
|
||||||
|
|
||||||
249
.autograde/llm_grade.py
Normal file
249
.autograde/llm_grade.py
Normal file
@ -0,0 +1,249 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
LLM 简答题评分脚本
|
||||||
|
|
||||||
|
调用 LLM API,按评分量表对简答题进行评分,输出 JSON 格式结果
|
||||||
|
"""
|
||||||
|
|
||||||
|
import os
|
||||||
|
import json
|
||||||
|
import argparse
|
||||||
|
import requests
|
||||||
|
import sys
|
||||||
|
from pathlib import Path
|
||||||
|
from dotenv import load_dotenv
|
||||||
|
|
||||||
|
# 加载环境变量(支持从 .env 文件或环境变量读取)
|
||||||
|
load_dotenv()
|
||||||
|
|
||||||
|
|
||||||
|
def read_file(path):
    """Return the file's text content, or "" when the file does not exist.

    Fix: the handle is now opened with a context manager so it is closed
    deterministically (the old code leaked the open file object).
    """
    if os.path.exists(path):
        with open(path, 'r', encoding='utf-8') as f:
            return f.read()
    return ""
|
||||||
|
|
||||||
|
|
||||||
|
def read_file_or_string(value):
    """
    If *value* is a path to an existing file, return the file's contents;
    otherwise return *value* itself as a literal string.

    Fix: the handle is now opened with a context manager so it is closed
    deterministically (the old code leaked the open file object).
    """
    if os.path.exists(value):
        with open(value, 'r', encoding='utf-8') as f:
            return f.read()
    return value  # treat as a literal string
|
||||||
|
|
||||||
|
|
||||||
|
PROMPT_TEMPLATE = """你是严格且一致的助教,按提供的评分量表为学生的简答题评分。
|
||||||
|
|
||||||
|
评分规则:
|
||||||
|
- 严格依据量表中各评分项的 scoring_guide 进行评分
|
||||||
|
- 每个评分项只能给出 scoring_guide 中定义的整数分值(如 0, 1, 2, 3, 4)
|
||||||
|
- 不输出任何解释性文本;只输出 JSON
|
||||||
|
|
||||||
|
输出格式:
|
||||||
|
{{
|
||||||
|
"total": number (各项分数之和),
|
||||||
|
"criteria": [
|
||||||
|
{{"id": "评分项id", "score": 整数(必须是scoring_guide中定义的分值), "reason": "简短评语"}},
|
||||||
|
...
|
||||||
|
],
|
||||||
|
"flags": [],
|
||||||
|
"confidence": number(0-1, 评分置信度)
|
||||||
|
}}
|
||||||
|
|
||||||
|
重要:
|
||||||
|
- score 必须是整数,只能是 scoring_guide 中定义的分值(如 0/1/2/3/4)
|
||||||
|
- 不要给出 2.5, 3.5 这样的中间值
|
||||||
|
- total 必须等于所有 criteria 的 score 之和
|
||||||
|
- 如果答案与题目无关或为空,total=0,并加 flag "need_review"
|
||||||
|
|
||||||
|
【题目】
|
||||||
|
<<<{question}>>>
|
||||||
|
|
||||||
|
【评分量表】
|
||||||
|
<<<{rubric}>>>
|
||||||
|
|
||||||
|
【学生答案】
|
||||||
|
<<<{answer}>>>
|
||||||
|
"""
|
||||||
|
|
||||||
|
|
||||||
|
def call_llm(url, key, model, prompt):
    """
    POST a chat-completion request to the LLM API and return its verdict.

    Parameters
    ----------
    url : str
        API endpoint.
    key : str
        API key (sent as a Bearer token).
    model : str
        Model identifier.
    prompt : str
        Fully rendered grading prompt.

    Returns
    -------
    dict
        The JSON object parsed from the model's message content.

    Raises on timeout, HTTP error, other request failures, or when the
    model's content is not valid JSON (each case is logged to stderr first).
    """
    headers = {
        "Authorization": f"Bearer {key}",
        "Content-Type": "application/json"
    }
    payload = {
        "model": model,
        "temperature": 0,
        "top_p": 1,
        "messages": [{"role": "user", "content": prompt}],
        "response_format": {"type": "json_object"}
    }

    try:
        # Timeouts: 10 s to connect, 60 s to read.
        response = requests.post(url, headers=headers, json=payload, timeout=(10, 60))
        response.raise_for_status()
        body = response.json()
        content = body.get("choices", [{}])[0].get("message", {}).get("content", "{}")
        return json.loads(content)
    except requests.exceptions.Timeout as e:
        print(f"LLM API request timeout: {e}", file=sys.stderr)
        raise
    except requests.exceptions.HTTPError as e:
        print(f"LLM API HTTP error: {e} (status: {response.status_code})", file=sys.stderr)
        raise
    except requests.exceptions.RequestException as e:
        print(f"LLM API request failed: {e}", file=sys.stderr)
        raise
    except json.JSONDecodeError as e:
        print(f"Failed to parse LLM response as JSON: {e}", file=sys.stderr)
        raise
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """Grade one short-answer question with the LLM and write the results.

    Reads question/answer/rubric, calls the LLM (or produces a zero grade
    with review flags on empty input or API failure), normalises scores,
    applies the borderline/low-confidence review rules, then writes the
    grade JSON and a Markdown summary.
    """
    parser = argparse.ArgumentParser(description="Grade short answer questions using LLM")
    parser.add_argument("--question", required=True, help="Path to question file")
    parser.add_argument("--answer", required=True, help="Path to answer file")
    parser.add_argument("--rubric", required=True, help="Path to rubric JSON file")
    parser.add_argument("--out", default="grade.json", help="Output JSON file")
    parser.add_argument("--summary", default="summary.md", help="Output summary markdown file")
    parser.add_argument("--model", default=os.getenv("LLM_MODEL", "deepseek-chat"))
    parser.add_argument("--api_url", default=os.getenv("LLM_API_URL", "https://api.deepseek.com/chat/completions"))
    parser.add_argument("--api_key", default=os.getenv("LLM_API_KEY", ""))
    args = parser.parse_args()

    # Validate required configuration.
    if not args.api_key:
        print("Warning: LLM_API_KEY not set. LLM grading may fail.", file=sys.stderr)

    # Read inputs.
    # question may be a file path or the question text itself.
    question = read_file_or_string(args.question).strip()
    # answer and rubric must be file paths.
    answer = read_file(args.answer).strip()
    rubric_text = read_file(args.rubric).strip()

    if not question or not answer:
        # Empty input: zero grade flagged for review, no API call.
        print(f"Warning: Empty question or answer file", file=sys.stderr)
        resp = {
            "total": 0,
            "criteria": [],
            "flags": ["need_review", "empty_answer"],
            "confidence": 0.0
        }
    else:
        # Call the LLM; fall back to a flagged zero grade on any failure.
        try:
            prompt = PROMPT_TEMPLATE.format(
                question=question,
                rubric=rubric_text,
                answer=answer
            )
            resp = call_llm(args.api_url, args.api_key, args.model, prompt)
        except Exception as e:
            print(f"LLM grading failed: {e}", file=sys.stderr)
            resp = {
                "total": 0,
                "criteria": [],
                "flags": ["need_review", "llm_error"],
                "confidence": 0.0
            }

    # Force integer per-criterion scores and recompute the total.
    criteria = resp.get("criteria", [])
    if criteria:
        for c in criteria:
            # The LLM may return fractional scores; round to the integer scale.
            score = c.get("score", 0)
            c["score"] = round(float(score))

        # total is redefined as the sum of the criterion scores.
        calculated_total = sum(c.get("score", 0) for c in criteria)
        resp["total"] = calculated_total

    # Auto-flag borderline totals for review.
    try:
        rubric_data = json.loads(rubric_text)
        lo, hi = rubric_data.get("borderline_band", [None, None])
        total = float(resp.get("total", 0))
        flags = set(resp.get("flags", []))

        if lo is not None and hi is not None and lo <= total <= hi:
            flags.add("need_review")

        # Low confidence also triggers review.
        confidence = resp.get("confidence", 1.0)
        if confidence < 0.7:
            flags.add("need_review")

        resp["flags"] = sorted(list(flags))
    except Exception:
        pass

    # Save the grade JSON.
    with open(args.out, "w", encoding="utf-8") as f:
        json.dump(resp, f, ensure_ascii=False, indent=2)

    # Build summary.md; max_score comes from the rubric when parseable.
    try:
        rubric_data = json.loads(rubric_text)
        max_score = rubric_data.get("max_score", 10)
    except Exception:
        max_score = 10

    lines = [
        f"# 简答题评分",
        f"",
        f"- **总分**:**{resp.get('total', 0):.2f} / {max_score}**",
        f"- **置信度**:{resp.get('confidence', 0):.2f}",
        f"- **标记**:{', '.join(resp.get('flags', [])) or '无'}",
        f"",
        f"## 分项评分"
    ]

    for criterion in resp.get("criteria", []):
        criterion_id = criterion.get("id", "")
        score = criterion.get("score", 0)
        reason = criterion.get("reason", "")
        lines.append(f"- **{criterion_id}**: {score} 分")
        if reason:
            lines.append(f" - {reason}")

    with open(args.summary, "w", encoding="utf-8") as f:
        f.write("\n".join(lines))

    print(f"LLM grading complete: {resp.get('total', 0):.2f}/{max_score}")


if __name__ == "__main__":
    main()
|
||||||
|
|
||||||
|
|
||||||
444
.autograde/objective_grade.py
Normal file
444
.autograde/objective_grade.py
Normal file
@ -0,0 +1,444 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
选择题/判断题评分脚本
|
||||||
|
|
||||||
|
读取学生答案和标准答案,生成成绩 JSON 文件
|
||||||
|
"""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import argparse
|
||||||
|
import sys
|
||||||
|
from datetime import datetime
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
|
||||||
|
def load_answers(answer_file):
    """Load a student answer file (JSON or simple line-based text).

    JSON example::

        {"MC1": "A", "MC2": "B", "TF1": true, "TF2": false}

    Text example (one answer per line; blank lines and ``#`` comments
    are ignored)::

        A
        B
        true
        false

    Text answers are auto-numbered per type: boolean-looking lines
    become TF1, TF2, ...; everything else becomes MC1, MC2, ...
    (upper-cased).

    Returns a dict mapping question ids to answers, or an empty dict on
    any read/parse error (the error is printed to stderr).
    """
    try:
        with open(answer_file, 'r', encoding='utf-8') as fh:
            raw = fh.read().strip()

        # A JSON payload starts with an object brace.
        if raw.startswith('{'):
            return json.loads(raw)

        # Plain-text fallback: one answer per line, with per-type counters
        # instead of rescanning the dict keys for every line.
        answers = {}
        tf_count = 0
        mc_count = 0
        for entry in raw.split('\n'):
            entry = entry.strip()
            if not entry or entry.startswith('#'):
                continue
            lowered = entry.lower()
            if lowered in ('true', 'false', 't', 'f'):
                tf_count += 1
                answers[f"TF{tf_count}"] = lowered in ('true', 't')
            else:
                mc_count += 1
                answers[f"MC{mc_count}"] = entry.upper()
        return answers
    except Exception as e:
        print(f"Error loading answers: {e}", file=sys.stderr)
        return {}
|
||||||
|
|
||||||
|
|
||||||
|
def load_standard_answers(std_file):
    """Load the standard (reference) answers from a JSON file.

    Returns the parsed dict, or an empty dict when the file cannot be
    read or parsed (an error message goes to stderr).
    """
    try:
        with open(std_file, 'r', encoding='utf-8') as fh:
            return json.load(fh)
    except Exception as e:
        print(f"Error loading standard answers: {e}", file=sys.stderr)
        return {}
|
||||||
|
|
||||||
|
|
||||||
|
def grade_multiple_choice(student_answers, standard_answers, question_texts=None):
    """Grade single-answer multiple-choice (MC*) questions.

    Parameters
    ----------
    student_answers : dict
        Student answers, e.g. {"MC1": "A", "MC2": "B", ...}.
    standard_answers : dict
        Reference answers in the same format; only keys starting with
        'MC' are considered.
    question_texts : dict, optional
        Question texts keyed by question id.

    Returns
    -------
    dict
        Grade data: one point per question, case-insensitive comparison,
        with per-question detail records.
    """
    graded = []
    n_correct = 0

    for qid, expected in standard_answers.items():
        if not qid.startswith('MC'):
            continue

        given = student_answers.get(qid, "")
        # Case-insensitive exact match on the letter choice.
        hit = str(given).upper() == str(expected).upper()
        n_correct += int(hit)

        graded.append({
            "question_id": qid,
            "question_text": question_texts.get(qid, "") if question_texts else "",
            "correct_answer": str(expected).upper(),
            "student_answer": str(given).upper(),
            "correct": hit,
            "score": 1 if hit else 0,
            "max_score": 1
        })

    return {
        "type": "multiple_choice",
        "score": n_correct,
        "max_score": len(graded),
        "details": {
            "correct": n_correct,
            "total": len(graded),
            "questions": graded
        }
    }
|
||||||
|
|
||||||
|
|
||||||
|
def grade_true_false(student_answers, standard_answers, question_texts=None):
    """Grade true/false (TF*) questions.

    Parameters
    ----------
    student_answers : dict
        Student answers, e.g. {"TF1": true, "TF2": "false", ...}; string
        values are normalized ('true'/'t'/'1'/'yes' -> True, else False).
    standard_answers : dict
        Reference answers; only keys starting with 'TF' are graded.
    question_texts : dict, optional
        Question texts keyed by question id.

    Returns
    -------
    dict
        Grade data with per-question details (one point per question).

    Notes
    -----
    Bug fix: a missing answer (None) used to be coerced via ``bool(None)``
    to False and was therefore counted as CORRECT whenever the standard
    answer was False. Unanswered questions now always score 0.
    """
    questions = []
    correct_count = 0

    for question_id, std_answer in standard_answers.items():
        if not question_id.startswith('TF'):
            continue

        student_answer = student_answers.get(question_id, None)

        # Normalize string answers to booleans.
        if isinstance(student_answer, str):
            student_answer = student_answer.lower() in ('true', 't', '1', 'yes')

        # An unanswered question is never correct (see Notes).
        is_correct = (student_answer is not None
                      and bool(student_answer) == bool(std_answer))

        if is_correct:
            correct_count += 1
            score = 1
        else:
            score = 0

        questions.append({
            "question_id": question_id,
            "question_text": question_texts.get(question_id, "") if question_texts else "",
            "correct_answer": bool(std_answer),
            "student_answer": bool(student_answer) if student_answer is not None else None,
            "correct": is_correct,
            "score": score,
            "max_score": 1
        })

    total_count = len(questions)

    return {
        "type": "true_false",
        "score": correct_count,
        "max_score": total_count,
        "details": {
            "correct": correct_count,
            "total": total_count,
            "questions": questions
        }
    }
|
||||||
|
|
||||||
|
|
||||||
|
def grade_multiple_select(student_answers, standard_answers, question_texts=None):
    """Grade multiple-select (MS*) questions with all-or-nothing scoring.

    Parameters
    ----------
    student_answers : dict
        Student answers, e.g. {"MS1": ["A", "B"], "MS2": "C", ...}; a
        bare string counts as a one-element selection, anything that is
        not a string or list counts as no answer.
    standard_answers : dict
        Reference answers; only keys starting with 'MS' are graded.
    question_texts : dict, optional
        Question texts keyed by question id.

    Returns
    -------
    dict
        Grade data; a question scores 1 only when the selected set
        matches the reference set exactly (case-insensitive).
    """
    graded = []
    n_correct = 0

    for qid, expected in standard_answers.items():
        if not qid.startswith('MS'):
            continue

        given = student_answers.get(qid, [])
        # Normalize the student's selection into a list.
        if isinstance(given, str):
            given = [given]
        elif not isinstance(given, list):
            given = []

        expected_set = {str(a).upper() for a in expected}
        given_set = {str(a).upper() for a in given}

        # All-or-nothing: the whole set must match.
        hit = expected_set == given_set
        n_correct += int(hit)

        graded.append({
            "question_id": qid,
            "question_text": question_texts.get(qid, "") if question_texts else "",
            "correct_answer": sorted(expected_set),
            "student_answer": sorted(given_set) if given_set else [],
            "correct": hit,
            "score": 1 if hit else 0,
            "max_score": 1
        })

    return {
        "type": "multiple_select",
        "score": n_correct,
        "max_score": len(graded),
        "details": {
            "correct": n_correct,
            "total": len(graded),
            "questions": graded
        }
    }
|
||||||
|
|
||||||
|
|
||||||
|
def grade_fill_blank(student_answers, standard_answers, question_texts=None):
    """Grade fill-in-the-blank (FB*) questions.

    Answers are compared case-insensitively with surrounding whitespace
    stripped. List answers must match element-by-element in order, and a
    string never matches a list (or vice versa).

    Parameters
    ----------
    student_answers : dict
        Student answers, e.g. {"FB1": "answer", "FB2": ["a1", "a2"], ...}.
    standard_answers : dict
        Reference answers in the same format; only 'FB' keys are graded.
    question_texts : dict, optional
        Question texts keyed by question id.

    Returns
    -------
    dict
        Grade data with per-question details (one point per question).
    """
    def _norm(value):
        # Strip and lower-case strings; apply the same to list elements.
        if isinstance(value, str):
            return value.strip().lower()
        if isinstance(value, list):
            return [item.strip().lower() for item in value]
        return value

    def _matches(given, expected):
        # Types must agree (both str or both list) for a match.
        g, e = _norm(given), _norm(expected)
        if isinstance(e, list) and isinstance(g, list):
            return g == e
        if isinstance(e, str) and isinstance(g, str):
            return g == e
        return False

    graded = []
    n_correct = 0

    for qid, expected in standard_answers.items():
        if not qid.startswith('FB'):
            continue

        given = student_answers.get(qid, "")
        hit = _matches(given, expected)
        n_correct += int(hit)

        graded.append({
            "question_id": qid,
            "question_text": question_texts.get(qid, "") if question_texts else "",
            "correct_answer": expected,
            "student_answer": given,
            "correct": hit,
            "score": 1 if hit else 0,
            "max_score": 1
        })

    return {
        "type": "fill_blank",
        "score": n_correct,
        "max_score": len(graded),
        "details": {
            "correct": n_correct,
            "total": len(graded),
            "questions": graded
        }
    }
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry point: load answers, grade the requested question types,
    and write grade.json plus a Markdown summary.

    Improvements over the original: a normal function-scope
    ``import time`` replaces the ``__import__('time')`` hack, the four
    copy-pasted per-type grading branches are driven by one dispatch
    table, and the loop-invariant type-name map is built once instead of
    on every iteration.

    Returns 0 on success; exits with status 1 when answers cannot be
    loaded.
    """
    import time

    parser = argparse.ArgumentParser(description="Grade objective questions")
    parser.add_argument("--answers", required=True, help="Student answers file (JSON or text)")
    parser.add_argument("--standard", required=True, help="Standard answers file (JSON)")
    parser.add_argument("--questions", help="Question texts file (JSON, optional)")
    parser.add_argument("--out", default="grade.json", help="Output grade JSON file")
    parser.add_argument("--summary", default="summary.md", help="Output summary markdown file")
    parser.add_argument("--type", choices=['mc', 'tf', 'ms', 'fb', 'all'], default='all',
                        help="Question type to grade")

    args = parser.parse_args()

    # Load input files.
    student_answers = load_answers(args.answers)
    standard_answers = load_standard_answers(args.standard)
    question_texts = None

    if args.questions:
        try:
            with open(args.questions, 'r', encoding='utf-8') as f:
                question_texts = json.load(f)
        except Exception as e:
            # Question texts are optional; degrade gracefully.
            print(f"Warning: Could not load question texts: {e}", file=sys.stderr)

    if not student_answers or not standard_answers:
        print("Error: Could not load answers", file=sys.stderr)
        sys.exit(1)

    # Grade each requested type via a dispatch table; a grader only
    # contributes when it actually found questions of its type.
    components = []
    total_score = 0
    total_max_score = 0

    graders = [
        ('mc', grade_multiple_choice),
        ('tf', grade_true_false),
        ('ms', grade_multiple_select),
        ('fb', grade_fill_blank),
    ]
    for type_key, grader in graders:
        if args.type not in (type_key, 'all'):
            continue
        component = grader(student_answers, standard_answers, question_texts)
        if component['details']['total'] > 0:
            components.append(component)
            total_score += component['score']
            total_max_score += component['max_score']

    # Write grade.json.
    grade_data = {
        "score": total_score,
        "max_score": total_max_score,
        "components": components,
        "timestamp": int(time.time())
    }

    with open(args.out, 'w', encoding='utf-8') as f:
        json.dump(grade_data, f, ensure_ascii=False, indent=2)

    # Write summary.md (user-facing strings kept verbatim).
    summary_lines = [
        "# 客观题评分\n",
        f"- **总分**:{total_score} / {total_max_score}\n",
        f"- **组件数**:{len(components)}\n",
        ""
    ]

    # Human-readable name for each component type (loop-invariant).
    type_names = {
        'multiple_choice': '选择题',
        'true_false': '判断题',
        'multiple_select': '多选题',
        'fill_blank': '填空题'
    }

    for comp in components:
        correct = comp['details']['correct']
        total = comp['details']['total']
        type_name = type_names.get(comp['type'], comp['type'])
        summary_lines.append(f"## {type_name}\n")
        summary_lines.append(f"- **正确**:{correct} / {total}\n")
        summary_lines.append("")

    with open(args.summary, 'w', encoding='utf-8') as f:
        f.write("\n".join(summary_lines))

    print(f"Grading complete: {total_score}/{total_max_score}")
    return 0
|
||||||
|
|
||||||
|
|
||||||
|
# Script entry point: exit with main()'s return code.
if __name__ == "__main__":
    sys.exit(main())
|
||||||
|
|
||||||
155
.autograde/post_comment.py
Normal file
155
.autograde/post_comment.py
Normal file
@ -0,0 +1,155 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
发送评论到 Gitea PR
|
||||||
|
|
||||||
|
从环境变量读取配置,发送评论到指定的 PR
|
||||||
|
支持在 Markdown 评论中嵌入 JSON 数据,便于后续结构化提取
|
||||||
|
"""
|
||||||
|
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import json
|
||||||
|
import requests
|
||||||
|
from datetime import datetime
|
||||||
|
|
||||||
|
|
||||||
|
def create_comment_with_metadata(summary, commit_sha, comment_type='grade', metadata=None):
    """Build the PR comment body: human-readable Markdown plus optional
    machine-readable JSON metadata.

    Parameters
    ----------
    summary : str
        Human-readable Markdown summary.
    commit_sha : str
        Commit SHA; shortened to 7 characters in the footer, 'unknown'
        when empty.
    comment_type : str
        One of 'grade', 'llm', 'combined'; selects title/footer wording.
    metadata : dict, optional
        Structured grade data embedded as a fenced JSON block. Note: the
        dict is updated in place — missing 'version' and 'timestamp'
        keys are filled in.

    Returns
    -------
    str
        Complete comment content (Markdown + embedded JSON).
    """
    commit_short = commit_sha[:7] if commit_sha else 'unknown'

    # Title and footer per comment type (user-facing strings verbatim).
    if comment_type == 'llm':
        title = "🤖 LLM 简答题评分结果"
        footer = "*此评论由 Gitea Actions 自动生成(使用 DeepSeek API) | Commit: `{}`*"
    elif comment_type == 'combined':
        title = "📊 综合评分结果"
        footer = "*此评论由 Gitea Actions 自动生成 | Commit: `{}`*"
    else:
        title = "🤖 自动评分结果"
        footer = "*此评论由 Gitea Actions 自动生成 | Commit: `{}`*"

    parts = [f"## {title}", "", summary, ""]

    if metadata:
        # Stamp version/timestamp so downstream extractors can rely on them.
        metadata.setdefault('version', '1.0')
        metadata.setdefault('timestamp', datetime.now().isoformat())

        # Embed the JSON in a fenced code block at the end of the comment:
        # Gitea preserves it reliably and it stays unobtrusive for students.
        parts += [
            "",
            "---",
            "",
            "<!-- GRADE_METADATA -->",
            "```json",
            json.dumps(metadata, ensure_ascii=False, indent=2),
            "```",
            ""
        ]

    parts.append(footer.format(commit_short))
    return "\n".join(parts)
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """Read configuration from environment variables and post a grading
    comment (with optional embedded metadata) to a Gitea PR.

    Required env vars: API_URL, REPO, PR_NUMBER, GITEA_TOKEN, SUMMARY.
    Optional: COMMIT_SHA, COMMENT_TYPE (default 'grade'), GRADE_METADATA
    (a JSON string). Returns 0 on success, 1 on failure; exits with
    status 1 when required variables are missing.
    """
    # Read configuration from the CI environment.
    api_url = os.environ.get('API_URL', '')
    repo = os.environ.get('REPO', '')
    pr_number = os.environ.get('PR_NUMBER', '')
    token = os.environ.get('GITEA_TOKEN', '')
    summary = os.environ.get('SUMMARY', '')
    commit_sha = os.environ.get('COMMIT_SHA', '')
    comment_type = os.environ.get('COMMENT_TYPE', 'grade')

    # Optional: structured JSON metadata passed via the environment.
    # A malformed value is only a warning — the comment still posts.
    metadata_str = os.environ.get('GRADE_METADATA', '')
    metadata = None
    if metadata_str:
        try:
            metadata = json.loads(metadata_str)
        except json.JSONDecodeError as e:
            print(f"Warning: Failed to parse GRADE_METADATA: {e}", file=sys.stderr)

    # Validate required parameters (COMMIT_SHA is intentionally optional).
    if not all([api_url, repo, pr_number, token, summary]):
        print("Error: Missing required environment variables", file=sys.stderr)
        print(f"API_URL: {api_url}", file=sys.stderr)
        print(f"REPO: {repo}", file=sys.stderr)
        print(f"PR_NUMBER: {pr_number}", file=sys.stderr)
        print(f"GITEA_TOKEN: {'set' if token else 'not set'}", file=sys.stderr)
        print(f"SUMMARY: {'set' if summary else 'not set'}", file=sys.stderr)
        sys.exit(1)

    # Build the comment body (Markdown summary + embedded metadata).
    comment_body = create_comment_with_metadata(
        summary=summary,
        commit_sha=commit_sha,
        comment_type=comment_type,
        metadata=metadata
    )

    # Gitea treats PRs as issues for the comments endpoint.
    comment_url = f"{api_url}/repos/{repo}/issues/{pr_number}/comments"

    # Build and send the authenticated request.
    headers = {
        "Authorization": f"token {token}",
        "Content-Type": "application/json"
    }

    data = {"body": comment_body}

    try:
        print(f"Posting comment to: {comment_url}")
        if metadata:
            print("✓ Comment includes structured metadata")
        response = requests.post(comment_url, headers=headers, json=data, timeout=30)
        response.raise_for_status()
        print("✅ Comment posted successfully to PR")
        return 0
    except requests.exceptions.Timeout:
        print("⚠️ Request timeout", file=sys.stderr)
        return 1
    except requests.exceptions.HTTPError as e:
        # 'response' is always bound here: HTTPError is raised by
        # raise_for_status(), which runs after the assignment above.
        print(f"⚠️ HTTP error: {e}", file=sys.stderr)
        print(f"Response: {response.text}", file=sys.stderr)
        return 1
    except Exception as e:
        print(f"⚠️ Failed to post comment: {e}", file=sys.stderr)
        return 1
|
||||||
|
|
||||||
|
|
||||||
|
# Script entry point: exit with main()'s return code.
if __name__ == "__main__":
    sys.exit(main())
|
||||||
164
.autograde/run_tests.py
Normal file
164
.autograde/run_tests.py
Normal file
@ -0,0 +1,164 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
通用测试运行器 - 根据语言配置运行测试并生成 JUnit XML
|
||||||
|
|
||||||
|
支持的语言:
|
||||||
|
- python: pytest
|
||||||
|
- java: maven (mvn test)
|
||||||
|
- r: testthat (通过 JUnit Reporter)
|
||||||
|
|
||||||
|
环境变量:
|
||||||
|
- LANGUAGE: 编程语言 (python/java/r)
|
||||||
|
- TEST_DIR: 测试目录路径
|
||||||
|
- SOURCE_DIR: 源代码目录路径
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
import os
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
|
||||||
|
def run_python_tests(test_dir, output_xml, **kwargs):
    """Run pytest on *test_dir*, emitting a JUnit XML report.

    When ``kwargs['source_dir']`` is set, coverage collection for that
    directory is enabled (terminal report plus coverage.json).

    Returns the CompletedProcess from subprocess.run (output streams to
    the console).
    """
    cmd = [
        "pytest", test_dir,
        f"--junit-xml={output_xml}",
        "-v", "--tb=short",
    ]

    # Optional coverage flags.
    src = kwargs.get('source_dir')
    if src:
        cmd += [
            f"--cov={src}",
            "--cov-report=term-missing",
            "--cov-report=json:coverage.json",
        ]

    print(f"Running: {' '.join(cmd)}")
    return subprocess.run(cmd, capture_output=False)
|
||||||
|
|
||||||
|
|
||||||
|
def run_java_tests(test_dir, output_xml, **kwargs):
    """Run Java tests via Maven and collect a JUnit XML report.

    Maven writes per-class reports to target/surefire-reports/; this
    function copies a single report to *output_xml*, or wraps multiple
    reports under one <testsuites> root when there are several.

    NOTE(review): *test_dir* and **kwargs are unused here — Maven
    discovers tests from the project's pom.xml; confirm callers expect
    that.

    Returns the CompletedProcess from ``mvn test``.
    """
    cmd = ["mvn", "test", "-B"]

    print(f"Running: {' '.join(cmd)}")
    result = subprocess.run(cmd, capture_output=False)

    # Maven auto-generates XML under target/surefire-reports/;
    # copy/merge it to the requested output location.
    surefire_dir = Path("target/surefire-reports")
    if surefire_dir.exists():
        # Merge all TEST-*.xml files.
        import xml.etree.ElementTree as ET

        xml_files = list(surefire_dir.glob("TEST-*.xml"))
        if xml_files:
            # Simple case: a single report just gets copied.
            import shutil
            if len(xml_files) == 1:
                shutil.copy(xml_files[0], output_xml)
            else:
                # Merge multiple XML files (simplified: append each
                # report's root element under a shared <testsuites>).
                root = ET.Element("testsuites")
                for xml_file in xml_files:
                    tree = ET.parse(xml_file)
                    root.append(tree.getroot())

                tree = ET.ElementTree(root)
                tree.write(output_xml, encoding='utf-8', xml_declaration=True)

    return result
|
||||||
|
|
||||||
|
|
||||||
|
def run_r_tests(test_dir, output_xml, **kwargs):
    """Run R testthat tests and write a JUnit XML report.

    Requires testthat >= 3.0.0 (for JunitReporter). The R driver script
    is generated on the fly, written to a temporary file, executed with
    Rscript, and removed afterwards.

    NOTE(review): *test_dir* and *output_xml* are interpolated into the
    R source inside single quotes without escaping — a path containing a
    single quote would break the generated script; confirm callers only
    pass safe paths.

    Returns the CompletedProcess from subprocess.run.
    """
    # R script using testthat's JUnit reporter.
    # Note: requires testthat (>= 3.0.0).

    r_script = f"""
library(testthat)

# 配置 JUnit reporter
reporter <- JunitReporter$new(file = '{output_xml}')

# 运行测试
test_dir(
    path = '{test_dir}',
    reporter = reporter,
    stop_on_failure = FALSE
)
"""

    # Write the generated script to a temporary file.
    import tempfile
    with tempfile.NamedTemporaryFile(mode='w', suffix='.R', delete=False) as f:
        f.write(r_script)
        script_path = f.name

    try:
        cmd = ["Rscript", script_path]
        print(f"Running: {' '.join(cmd)}")
        result = subprocess.run(cmd, capture_output=False)
        return result
    finally:
        # Clean up the temporary script.
        if os.path.exists(script_path):
            os.remove(script_path)
|
||||||
|
|
||||||
|
|
||||||
|
def main():
    """CLI entry: parse arguments, dispatch to the language-specific
    test runner, and exit with the runner's return code."""
    parser = argparse.ArgumentParser(
        description="通用测试运行器 - 支持 Python/Java/R"
    )
    parser.add_argument(
        "--language",
        required=True,
        choices=["python", "java", "r"],
        help="编程语言"
    )
    parser.add_argument(
        "--test-dir",
        required=True,
        help="测试目录路径"
    )
    parser.add_argument(
        "--output-xml",
        default="test-results.xml",
        help="JUnit XML 输出文件路径"
    )
    parser.add_argument(
        "--source-dir",
        help="源代码目录(用于覆盖率)"
    )

    args = parser.parse_args()

    # Map each language to its runner function.
    runners = {
        "python": run_python_tests,
        "java": run_java_tests,
        "r": run_r_tests,
    }

    # Defensive check; unreachable in practice because argparse already
    # restricts --language via choices= above.
    if args.language not in runners:
        print(f"❌ Unsupported language: {args.language}", file=sys.stderr)
        sys.exit(1)

    # Run the tests and propagate the runner's exit status.
    result = runners[args.language](
        args.test_dir,
        args.output_xml,
        source_dir=args.source_dir
    )

    sys.exit(result.returncode)
|
||||||
|
|
||||||
|
|
||||||
|
# Script entry point (main() calls sys.exit itself).
if __name__ == "__main__":
    main()
|
||||||
|
|
||||||
95
.autograde/test_objective_grade.sh
Normal file
95
.autograde/test_objective_grade.sh
Normal file
@ -0,0 +1,95 @@
|
|||||||
|
#!/bin/bash
# End-to-end tests for the objective-question grading script.
#
# Fix: objective_grade.py's --type option accepts {mc,tf,ms,fb,all};
# the previous value "both" was rejected by argparse (exit code 2) and,
# combined with `set -e`, aborted this script. Use "all" instead.

set -e

echo "=== 测试客观题评分脚本 ==="

# Run from the repository root regardless of where the script lives.
cd "$(dirname "$0")/.."

# Test 1: JSON answers identical to the standard answers (full marks).
echo ""
echo "测试 1: JSON 格式答案(全对)"
python3 ./.autograde/objective_grade.py \
    --answers objective_questions/standard_answers.json \
    --standard objective_questions/standard_answers.json \
    --questions objective_questions/question_texts.json \
    --out test_grade1.json \
    --summary test_summary1.md \
    --type all

echo "分数:"
python3 -c "import json; data=json.load(open('test_grade1.json')); print(f\"{data['score']}/{data['max_score']}\")"

echo ""
echo "摘要:"
cat test_summary1.md

# Test 2: partially wrong answers.
echo ""
echo "测试 2: 部分错误答案"
cat > test_answers2.json << 'EOF'
{
  "MC1": "A",
  "MC2": "A",
  "MC3": "C",
  "MC4": "B",
  "MC5": "C",
  "TF1": true,
  "TF2": false,
  "TF3": true,
  "TF4": true,
  "TF5": false
}
EOF

python3 ./.autograde/objective_grade.py \
    --answers test_answers2.json \
    --standard objective_questions/standard_answers.json \
    --questions objective_questions/question_texts.json \
    --out test_grade2.json \
    --summary test_summary2.md \
    --type all

echo "分数:"
python3 -c "import json; data=json.load(open('test_grade2.json')); print(f\"{data['score']}/{data['max_score']}\")"

echo ""
echo "摘要:"
cat test_summary2.md

# Test 3: grade multiple-choice questions only.
echo ""
echo "测试 3: 只评选择题"
python3 ./.autograde/objective_grade.py \
    --answers objective_questions/standard_answers.json \
    --standard objective_questions/standard_answers.json \
    --questions objective_questions/question_texts.json \
    --out test_grade3.json \
    --summary test_summary3.md \
    --type mc

echo "分数:"
python3 -c "import json; data=json.load(open('test_grade3.json')); print(f\"{data['score']}/{data['max_score']}\")"

# Test 4: grade true/false questions only.
echo ""
echo "测试 4: 只评判断题"
python3 ./.autograde/objective_grade.py \
    --answers objective_questions/standard_answers.json \
    --standard objective_questions/standard_answers.json \
    --questions objective_questions/question_texts.json \
    --out test_grade4.json \
    --summary test_summary4.md \
    --type tf

echo "分数:"
python3 -c "import json; data=json.load(open('test_grade4.json')); print(f\"{data['score']}/{data['max_score']}\")"

# Clean up test artifacts.
rm -f test_grade*.json test_summary*.md test_answers*.json

echo ""
echo "✅ 所有测试通过!"
|
||||||
|
|
||||||
|
|
||||||
157
.autograde/upload_metadata.py
Normal file
157
.autograde/upload_metadata.py
Normal file
@ -0,0 +1,157 @@
|
|||||||
|
#!/usr/bin/env python3
|
||||||
|
"""
|
||||||
|
Upload metadata.json to teacher-only repository via Gitea API.
|
||||||
|
"""
|
||||||
|
|
||||||
|
import argparse
|
||||||
|
import base64
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import urllib.error
|
||||||
|
import urllib.request
|
||||||
|
from pathlib import Path
|
||||||
|
from urllib.parse import urlparse
|
||||||
|
|
||||||
|
|
||||||
|
def detect_host(server_url: str, external_host: str | None) -> str:
|
||||||
|
"""Detect the Gitea host to use for API calls.
|
||||||
|
|
||||||
|
If server_url uses internal name (like 'gitea'), use external_host instead.
|
||||||
|
"""
|
||||||
|
parsed = urlparse(server_url)
|
||||||
|
raw_host = parsed.netloc or parsed.path.split("/")[0]
|
||||||
|
host = raw_host
|
||||||
|
if raw_host.lower().startswith("gitea"):
|
||||||
|
if not external_host:
|
||||||
|
raise ValueError(
|
||||||
|
f"Server URL uses internal name '{raw_host}' but EXTERNAL_GITEA_HOST is not set. "
|
||||||
|
"Please configure EXTERNAL_GITEA_HOST in .env and run sync_runner_config.sh"
|
||||||
|
)
|
||||||
|
host = external_host
|
||||||
|
return host
|
||||||
|
|
||||||
|
|
||||||
|
def _infer_assignment_id(repo_name_part: str) -> str:
    """Derive the assignment id (e.g. 'hw1') from a repo name like 'hw1-stu_xxx'.

    Recognizes the '-stu_', '-template' and '-tests' naming conventions;
    falls back to 'unknown' when none of them match.
    """
    if "-stu_" in repo_name_part:
        return repo_name_part.split("-stu_")[0]
    if "-template" in repo_name_part:
        return repo_name_part.split("-template")[0]
    if "-tests" in repo_name_part:
        return repo_name_part.split("-tests")[0]
    return "unknown"


def main() -> int:
    """Upload a metadata JSON file to the teacher-only metadata repository.

    Reads the Gitea token from the METADATA_TOKEN environment variable,
    builds the target path ``{assignment_id}/{student_id}/{workflow}_{run_id}_{sha7}.json``
    and creates or updates that file through the Gitea contents API.

    Returns a process exit code: 0 on success (or a benign skip when the
    metadata file is missing), 1 on configuration or upload errors.
    """
    parser = argparse.ArgumentParser(description="Upload metadata.json to course metadata repo")
    parser.add_argument("--metadata-file", required=True)
    parser.add_argument("--metadata-repo", required=True, help="owner/repo of metadata store")
    parser.add_argument("--branch", default="main")
    parser.add_argument("--student-repo", required=True)
    parser.add_argument("--run-id", required=True)
    parser.add_argument("--commit-sha", required=True)
    parser.add_argument("--workflow", required=True, choices=["grade", "objective", "llm"])
    parser.add_argument("--server-url", required=True)
    parser.add_argument("--external-host")
    parser.add_argument("--assignment-id", help="Assignment ID (e.g., hw1)")
    args = parser.parse_args()

    token = os.environ.get("METADATA_TOKEN")
    if not token:
        print("METADATA_TOKEN is not set", file=sys.stderr)
        return 1

    path = Path(args.metadata_file)
    if not path.is_file():
        # Missing metadata is a no-op (exit 0) so grading workflows don't fail on it.
        print(f"metadata file not found: {path}", file=sys.stderr)
        return 0

    try:
        owner, repo_name = args.metadata_repo.split("/", 1)
    except ValueError:
        print(f"Invalid metadata repo: {args.metadata_repo}", file=sys.stderr)
        return 1

    # Student repo format: owner/hw1-stu_20250001 — the repo name doubles as the
    # student id in the metadata store's path layout.
    student_id = args.student_repo.split("/")[-1]

    # Auto-detect assignment ID from the student repo name if not provided.
    assignment_id = args.assignment_id or _infer_assignment_id(student_id)

    # Path structure: {assignment_id}/{student_id}/{workflow}_{run_id}_{sha}.json
    target_path = f"{assignment_id}/{student_id}/{args.workflow}_{args.run_id}_{args.commit_sha[:7]}.json"

    host = detect_host(args.server_url, args.external_host)
    api_url = f"http://{host}/api/v1/repos/{owner}/{repo_name}/contents/{target_path}"
    message = f"Upload {args.workflow} metadata for {args.student_repo} {args.commit_sha}"

    # Check if file exists to determine if we need to update (PUT) or create (POST)
    get_req = urllib.request.Request(
        api_url,
        headers={"Authorization": f"token {token}"},
        method="GET",
    )

    sha = None
    try:
        # timeout added: without it an unresponsive server hangs the CI job forever.
        with urllib.request.urlopen(get_req, timeout=30) as resp:
            existing_file = json.loads(resp.read().decode())
            # API may return a list (directory contents) or dict (single file)
            if isinstance(existing_file, dict):
                sha = existing_file.get("sha")
                print(f"File exists, updating (sha: {sha})")
            elif isinstance(existing_file, list):
                # Response is a directory listing, file doesn't exist at this exact path
                print("Path is a directory or file not found in expected format")
            else:
                print(f"Unexpected response type: {type(existing_file)}")
    except urllib.error.HTTPError as e:
        if e.code != 404:
            print(f"Error checking file existence: {e}", file=sys.stderr)
            return 1
        # 404: file doesn't exist yet, proceed with creation.

    content = base64.b64encode(path.read_bytes()).decode()
    payload = {
        "content": content,
        "message": message,
        "branch": args.branch,
    }
    if sha:
        # Gitea requires the current blob sha when overwriting an existing file.
        payload["sha"] = sha

    data = json.dumps(payload).encode()

    req = urllib.request.Request(
        api_url,
        data=data,
        headers={
            "Authorization": f"token {token}",
            "Content-Type": "application/json",
        },
        method="PUT" if sha else "POST",
    )

    try:
        with urllib.request.urlopen(req, timeout=30) as resp:
            print(resp.read().decode())
    except urllib.error.HTTPError as exc:
        print(f"Metadata upload failed: {exc.status} {exc.reason}", file=sys.stderr)
        print(exc.read().decode(), file=sys.stderr)
        return 1
    except urllib.error.URLError as exc:
        print(f"Metadata upload failed: {exc}", file=sys.stderr)
        return 1

    print(f"✅ Metadata stored at {args.metadata_repo}:{target_path}")
    return 0
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
    # SystemExit propagates main()'s int return value as the process exit code.
    raise SystemExit(main())
|
||||||
|
|
||||||
|
|
||||||
216
.autograde/workflow_templates/README.md
Normal file
216
.autograde/workflow_templates/README.md
Normal file
@ -0,0 +1,216 @@
|
|||||||
|
# Workflow 模板
|
||||||
|
|
||||||
|
本目录包含不同编程语言的 Gitea Actions workflow 模板。
|
||||||
|
|
||||||
|
## 可用模板
|
||||||
|
|
||||||
|
| 文件 | 语言 | 容器 | 测试框架 |
|
||||||
|
|------|------|------|----------|
|
||||||
|
| `python.yml` | Python | python:3.11 | pytest |
|
||||||
|
| `java.yml` | Java | maven:3.9-eclipse-temurin-17 | JUnit 5 |
|
||||||
|
| `r.yml` | R | r-base:4.3 | testthat |
|
||||||
|
|
||||||
|
## 使用方法
|
||||||
|
|
||||||
|
### 1. 选择模板
|
||||||
|
|
||||||
|
根据你的编程语言选择对应的模板:
|
||||||
|
|
||||||
|
```bash
|
||||||
|
# 对于 Python 作业
|
||||||
|
cp .autograde/workflow_templates/python.yml .gitea/workflows/grade.yml
|
||||||
|
|
||||||
|
# 对于 Java 作业
|
||||||
|
cp .autograde/workflow_templates/java.yml .gitea/workflows/grade.yml
|
||||||
|
|
||||||
|
# 对于 R 作业
|
||||||
|
cp .autograde/workflow_templates/r.yml .gitea/workflows/grade.yml
|
||||||
|
```
|
||||||
|
|
||||||
|
### 2. 自定义配置
|
||||||
|
|
||||||
|
编辑 `.gitea/workflows/grade.yml` 根据需要修改:
|
||||||
|
|
||||||
|
- **容器版本**:修改 `container:` 字段
|
||||||
|
- **超时时间**:修改 `timeout-minutes:`
|
||||||
|
- **依赖安装**:修改 "Install dependencies" 步骤
|
||||||
|
- **测试命令**:修改测试运行步骤
|
||||||
|
|
||||||
|
### 3. 配置 Secrets
|
||||||
|
|
||||||
|
确保在 Gitea 仓库设置中配置了以下 Secrets:
|
||||||
|
|
||||||
|
- `TESTS_TOKEN`:用于访问隐藏测试仓库的 token(可选)
|
||||||
|
- `EXTERNAL_GITEA_HOST`:外部访问的 Gitea 地址(可选)
|
||||||
|
|
||||||
|
## Python 模板 (python.yml)
|
||||||
|
|
||||||
|
### 特点
|
||||||
|
- 使用 `python:3.11` 容器
|
||||||
|
- 自动安装 `requirements.txt` 中的依赖
|
||||||
|
- 使用 `run_tests.py` 运行 pytest
|
||||||
|
- 支持代码覆盖率
|
||||||
|
|
||||||
|
### 自定义选项
|
||||||
|
```yaml
|
||||||
|
# 修改 Python 版本
|
||||||
|
container: python:3.10 # 或 python:3.9
|
||||||
|
|
||||||
|
# 添加额外的依赖
|
||||||
|
- name: Install dependencies
|
||||||
|
run: |
|
||||||
|
pip install -r requirements.txt
|
||||||
|
pip install numpy pandas # 额外的包
|
||||||
|
```
|
||||||
|
|
||||||
|
## Java 模板 (java.yml)
|
||||||
|
|
||||||
|
### 特点
|
||||||
|
- 使用 `maven:3.9-eclipse-temurin-17` 容器
|
||||||
|
- Maven 自动管理依赖(通过 `pom.xml`)
|
||||||
|
- JUnit 5 测试框架
|
||||||
|
- 自动提取 Surefire 报告
|
||||||
|
|
||||||
|
### 自定义选项
|
||||||
|
```yaml
|
||||||
|
# 修改 JDK 版本
|
||||||
|
container: maven:3.9-eclipse-temurin-11 # Java 11
|
||||||
|
container: maven:3.9-eclipse-temurin-21 # Java 21
|
||||||
|
|
||||||
|
# 自定义 Maven 命令
|
||||||
|
run: |
|
||||||
|
mvn clean test -B -DskipTests=false
|
||||||
|
```
|
||||||
|
|
||||||
|
### Maven 配置提示
|
||||||
|
|
||||||
|
确保 `pom.xml` 中配置了 Surefire 插件:
|
||||||
|
|
||||||
|
```xml
|
||||||
|
<plugin>
|
||||||
|
<groupId>org.apache.maven.plugins</groupId>
|
||||||
|
<artifactId>maven-surefire-plugin</artifactId>
|
||||||
|
<version>3.2.2</version>
|
||||||
|
<configuration>
|
||||||
|
<reportsDirectory>${project.build.directory}/surefire-reports</reportsDirectory>
|
||||||
|
</configuration>
|
||||||
|
</plugin>
|
||||||
|
```
|
||||||
|
|
||||||
|
## R 模板 (r.yml)
|
||||||
|
|
||||||
|
### 特点
|
||||||
|
- 使用 `r-base:4.3` 容器
|
||||||
|
- 自动从 `DESCRIPTION` 安装依赖
|
||||||
|
- testthat 测试框架
|
||||||
|
- JUnitReporter 输出 XML
|
||||||
|
|
||||||
|
### 自定义选项
|
||||||
|
```yaml
|
||||||
|
# 修改 R 版本
|
||||||
|
container: r-base:4.2 # 或其他版本
|
||||||
|
|
||||||
|
# 修改 CRAN 镜像
|
||||||
|
run: |
|
||||||
|
Rscript -e "install.packages('testthat', repos='https://cran.r-project.org/')"
|
||||||
|
```
|
||||||
|
|
||||||
|
### R 项目结构要求
|
||||||
|
|
||||||
|
```
|
||||||
|
project/
|
||||||
|
├── DESCRIPTION # 包依赖定义
|
||||||
|
├── R/ # R 源代码
|
||||||
|
└── tests/
|
||||||
|
└── testthat/ # testthat 测试
|
||||||
|
```
|
||||||
|
|
||||||
|
## 通用 Workflow 流程
|
||||||
|
|
||||||
|
所有模板都遵循相同的流程:
|
||||||
|
|
||||||
|
1. **安装系统依赖**(git, rsync 等)
|
||||||
|
2. **检出代码** - 克隆学生仓库
|
||||||
|
3. **安装语言依赖** - 根据语言安装包
|
||||||
|
4. **获取隐藏测试**(可选)- 从私有仓库获取
|
||||||
|
5. **运行测试** - 生成 JUnit XML
|
||||||
|
6. **评分** - 解析 XML,计算分数
|
||||||
|
7. **生成元数据** - 创建 JSON metadata
|
||||||
|
8. **发布评论** - 在 PR 中发布结果
|
||||||
|
|
||||||
|
## 高级配置
|
||||||
|
|
||||||
|
### 添加代码质量检查
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
- name: Run linter
|
||||||
|
run: |
|
||||||
|
# Python: pylint, flake8
|
||||||
|
pip install pylint
|
||||||
|
pylint src/
|
||||||
|
|
||||||
|
# Java: checkstyle
|
||||||
|
mvn checkstyle:check
|
||||||
|
|
||||||
|
# R: lintr
|
||||||
|
Rscript -e "lintr::lint_package()"
|
||||||
|
```
|
||||||
|
|
||||||
|
### 自定义评分规则
|
||||||
|
|
||||||
|
修改 `grade.py` 的调用参数:
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
- name: Grade
|
||||||
|
run: |
|
||||||
|
python3 ./.autograde/grade.py \
|
||||||
|
--junit junit.xml \
|
||||||
|
--out grade.json \
|
||||||
|
--summary summary.md \
|
||||||
|
--bonus bonus.json # 可选的加分项
|
||||||
|
```
|
||||||
|
|
||||||
|
### 多个测试套件
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
- name: Run public tests
|
||||||
|
run: |
|
||||||
|
pytest tests_public/ --junit-xml=public.xml
|
||||||
|
|
||||||
|
- name: Run hidden tests
|
||||||
|
run: |
|
||||||
|
pytest tests_hidden/ --junit-xml=hidden.xml
|
||||||
|
|
||||||
|
- name: Merge test results
|
||||||
|
run: |
|
||||||
|
python3 ./.autograde/merge_junit.py public.xml hidden.xml -o junit.xml
|
||||||
|
```
|
||||||
|
|
||||||
|
## 故障排查
|
||||||
|
|
||||||
|
### 测试无法运行
|
||||||
|
- 检查测试目录路径是否正确
|
||||||
|
- 确认依赖是否正确安装
|
||||||
|
- 查看 Actions 日志中的错误信息
|
||||||
|
|
||||||
|
### JUnit XML 未生成
|
||||||
|
- Python: 确保 pytest 命令包含 `--junit-xml`
|
||||||
|
- Java: 检查 Surefire 插件配置
|
||||||
|
- R: 确认 testthat >= 3.0.0
|
||||||
|
|
||||||
|
### 元数据为空
|
||||||
|
- 检查 `grade.json` 是否生成
|
||||||
|
- 确认 `LANGUAGE` 环境变量设置正确
|
||||||
|
- 查看 `create_minimal_metadata.py` 的输出
|
||||||
|
|
||||||
|
## 相关文档
|
||||||
|
|
||||||
|
- [运行测试脚本](../run_tests.py) - 通用测试运行器
|
||||||
|
- [评分脚本](../grade.py) - JUnit XML 解析和评分
|
||||||
|
- [元数据生成](../create_minimal_metadata.py) - JSON 元数据
|
||||||
|
- [示例](../../examples/) - 各语言的完整示例
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
最后更新: 2025-11-13
|
||||||
|
|
||||||
200
.autograde/workflow_templates/java.yml
Normal file
200
.autograde/workflow_templates/java.yml
Normal file
@ -0,0 +1,200 @@
|
|||||||
|
# Gitea Actions workflow: autograde a Java (Gradle) assignment.
# Pipeline: install system deps -> checkout -> fetch private tests ->
# run Gradle tests -> parse the JUnit XML into a grade -> upload metadata
# to the teacher-only metadata repository.
name: autograde-java

on:
  push:
    branches:
      - main
  workflow_dispatch:

permissions:
  contents: read
  pull-requests: write

jobs:
  java:
    runs-on: docker
    container:
      image: gradle:9.0-jdk21
      # root is needed so the step below can chown the workspace.
      options: --user root
    timeout-minutes: 20

    steps:
      - name: Install dependencies (CN mirror)
        run: |
          set -e
          # Rewrite Debian/Ubuntu apt sources to the Tencent Cloud mirror.
          for f in /etc/apt/sources.list /etc/apt/sources.list.d/*.list /etc/apt/sources.list.d/*.sources; do
            [ -f "$f" ] || continue
            sed -i -E 's|https?://deb.debian.org|http://mirrors.cloud.tencent.com|g' "$f" || true
            sed -i -E 's|https?://security.debian.org|http://mirrors.cloud.tencent.com/debian-security|g' "$f" || true
            sed -i -E 's|https?://archive.ubuntu.com|http://mirrors.cloud.tencent.com|g' "$f" || true
            sed -i -E 's|https?://ports.ubuntu.com|http://mirrors.cloud.tencent.com|g' "$f" || true
          done
          apt-get -o Acquire::Check-Valid-Until=false -o Acquire::AllowInsecureRepositories=true update -y
          DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends git ca-certificates python3 python3-pip nodejs rsync
          pip3 install --break-system-packages python-dotenv requests -i https://mirrors.cloud.tencent.com/pypi/simple
          rm -rf /var/lib/apt/lists/*

      - name: Checkout code
        uses: actions/checkout@v3
        with:
          fetch-depth: 1

      - name: Fix permissions
        run: |
          # Ensure workspace is owned by current user
          chown -R $(whoami):$(whoami) ${{ github.workspace }} || true

      - name: Fetch hidden tests (if available)
        working-directory: ${{ github.workspace }}
        env:
          EXTERNAL_GITEA_HOST: ${{ secrets.EXTERNAL_GITEA_HOST }}
        run: |
          set -e

          TESTS_USERNAME="${RUNNER_TESTS_USERNAME:-}"
          TESTS_TOKEN="${RUNNER_TESTS_TOKEN:-}"

          # Missing credentials are tolerated here (exit 0): grading proceeds
          # with whatever public tests the student repo already contains.
          if [ -z "$TESTS_TOKEN" ] || [ -z "$TESTS_USERNAME" ]; then
            echo "Warning: RUNNER_TESTS_USERNAME / RUNNER_TESTS_TOKEN not set, skipping private tests"
            exit 0
          fi

          # Resolve Gitea Host
          if [ -n "$EXTERNAL_GITEA_HOST" ]; then
            HOST="$EXTERNAL_GITEA_HOST"
          elif [ -n "$GITEA_ROOT_URL" ]; then
            HOST=$(echo "$GITEA_ROOT_URL" | sed 's|https\?://||' | sed 's|/$||')
          else
            HOST=$(echo "${{ github.server_url }}" | sed 's|https\?://||' | cut -d'/' -f1)
          fi

          echo "📥 Fetching private tests repository..."
          echo " Gitea host: $HOST"

          # Infer organization and assignment ID from repository name
          ORG=$(echo "${{ github.repository }}" | cut -d'/' -f1)
          REPO_NAME=$(echo "${{ github.repository }}" | cut -d'/' -f2)

          # Extract assignment ID from repo name (e.g., hw2-stu_xxx -> hw2, hw2-template -> hw2)
          if echo "$REPO_NAME" | grep -q -- '-stu_'; then
            ASSIGNMENT_ID=$(echo "$REPO_NAME" | sed 's/-stu_.*//')
          elif echo "$REPO_NAME" | grep -q -- '-template'; then
            ASSIGNMENT_ID=$(echo "$REPO_NAME" | sed 's/-template.*//')
          else
            ASSIGNMENT_ID="hw1" # fallback
          fi

          echo " Organization: $ORG"
          echo " Assignment ID: $ASSIGNMENT_ID"

          # Clone private test repository
          AUTH_URL="http://${TESTS_USERNAME}:${TESTS_TOKEN}@${HOST}/${ORG}/${ASSIGNMENT_ID}-tests.git"

          if ! git -c http.sslVerify=false clone --depth=1 "$AUTH_URL" _priv_tests 2>&1; then
            echo "❌ Failed to clone ${ASSIGNMENT_ID}-tests repository!"
            exit 1
          fi

          # Verify test directory exists
          if [ ! -d "_priv_tests/java" ]; then
            echo "❌ java/ directory not found in ${ASSIGNMENT_ID}-tests!"
            exit 1
          fi

          if [ ! -d "_priv_tests/java/src/test" ]; then
            echo "❌ java/src/test/ not found in ${ASSIGNMENT_ID}-tests!"
            exit 1
          fi

          # Copy tests to src/test/
          rsync -a _priv_tests/java/src/test/ src/test/
          echo "✅ Private tests copied: _priv_tests/java/src/test/ → src/test/"

      - name: Run tests using Gradle
        working-directory: ${{ github.workspace }}
        env:
          LANGUAGE: java
        run: |
          # '|| true' keeps the job alive on test failures so grading can
          # still award partial credit from the JUnit report.
          gradle test --no-daemon || true

      - name: Extract test results
        working-directory: ${{ github.workspace }}
        run: |
          # Find JUnit XML report
          XML_REPORT=$(find build/test-results/test -name "TEST-*.xml" | head -n 1)
          if [ -n "$XML_REPORT" ]; then
            cp "$XML_REPORT" junit.xml
            echo "✅ Found JUnit report: $XML_REPORT"
          else
            # An empty junit.xml lets the grading step run and report zero.
            echo "⚠️ No JUnit report found!"
            touch junit.xml
          fi

      - name: Grade
        working-directory: ${{ github.workspace }}
        env:
          LANGUAGE: java
        run: |
          python3 ./.autograde/grade.py --junit junit.xml --out grade.json --summary summary.md

      - name: Prepare artifacts
        working-directory: ${{ github.workspace }}
        run: |
          mkdir -p artifacts
          cp junit.xml summary.md grade.json artifacts/ 2>/dev/null || true

      - name: Create grade metadata
        working-directory: ${{ github.workspace }}
        env:
          LANGUAGE: java
          REPO: ${{ github.repository }}
        run: |
          if [ ! -f grade.json ]; then
            echo "⚠️ grade.json not found, skipping metadata creation"
            exit 0
          fi

          # Generate JSON metadata, preferring the richer script when present.
          if [ -f ./.autograde/create_grade_metadata.py ]; then
            python3 ./.autograde/create_grade_metadata.py > metadata.json || echo "{}" > metadata.json
            echo "✅ Grade metadata created (using create_grade_metadata.py)"
          elif [ -f ./.autograde/create_minimal_metadata.py ]; then
            export GRADE_TYPE=programming
            python3 ./.autograde/create_minimal_metadata.py > metadata.json || echo "{}" > metadata.json
            echo "✅ Grade metadata created (using create_minimal_metadata.py)"
          else
            echo "⚠️ No metadata creation script found, skipping"
            echo "{}" > metadata.json
          fi

      - name: Upload metadata (teacher only)
        # Only runs when the runner is configured with the metadata repo/token.
        if: env.RUNNER_METADATA_REPO != '' && env.RUNNER_METADATA_TOKEN != ''
        working-directory: ${{ github.workspace }}
        shell: bash
        env:
          METADATA_REPO: ${{ env.RUNNER_METADATA_REPO }}
          METADATA_TOKEN: ${{ env.RUNNER_METADATA_TOKEN }}
          METADATA_BRANCH: ${{ env.RUNNER_METADATA_BRANCH }}
          STUDENT_REPO: ${{ github.repository }}
          RUN_ID: ${{ github.run_id }}
          COMMIT_SHA: ${{ github.sha }}
          SERVER_URL: ${{ github.server_url }}
        run: |
          set -e
          if [ ! -f metadata.json ]; then
            echo "No metadata.json found, skip uploading."
            exit 0
          fi

          python3 ./.autograde/upload_metadata.py \
            --metadata-file metadata.json \
            --metadata-repo "${METADATA_REPO}" \
            --branch "${METADATA_BRANCH:-main}" \
            --student-repo "${STUDENT_REPO}" \
            --run-id "${RUN_ID}" \
            --commit-sha "${COMMIT_SHA}" \
            --workflow grade \
            --server-url "${SERVER_URL}" \
            --external-host "${EXTERNAL_GITEA_HOST}"
          rm -f metadata.json
|
||||||
206
.autograde/workflow_templates/python.yml
Normal file
206
.autograde/workflow_templates/python.yml
Normal file
@ -0,0 +1,206 @@
|
|||||||
|
# Gitea Actions workflow: autograde a Python (pytest) assignment.
# Pipeline: install system + Python deps -> checkout -> fetch private tests
# (mandatory) -> run pytest into JUnit XML -> grade -> upload metadata.
name: autograde-python

on:
  push:
    branches:
      - main
  workflow_dispatch:

permissions:
  contents: read
  pull-requests: write

jobs:
  python:
    runs-on: docker
    container: python:3.11
    timeout-minutes: 15

    steps:
      - name: Install dependencies (CN mirror)
        run: |
          set -e
          # Rewrite Debian/Ubuntu apt sources to the Tencent Cloud mirror.
          for f in /etc/apt/sources.list /etc/apt/sources.list.d/*.list /etc/apt/sources.list.d/*.sources; do
            [ -f "$f" ] || continue
            sed -i -E 's|https?://deb.debian.org|http://mirrors.cloud.tencent.com|g' "$f" || true
            sed -i -E 's|https?://security.debian.org|http://mirrors.cloud.tencent.com/debian-security|g' "$f" || true
            sed -i -E 's|https?://archive.ubuntu.com|http://mirrors.cloud.tencent.com|g' "$f" || true
            sed -i -E 's|https?://ports.ubuntu.com|http://mirrors.cloud.tencent.com|g' "$f" || true
          done
          apt-get -o Acquire::Check-Valid-Until=false -o Acquire::AllowInsecureRepositories=true update -y
          DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends git ca-certificates python3 python3-pip nodejs rsync
          rm -rf /var/lib/apt/lists/*

      - name: Checkout code
        uses: actions/checkout@v3
        with:
          fetch-depth: 1

      - name: Fix permissions
        run: |
          # Ensure workspace is owned by current user
          chown -R $(whoami):$(whoami) ${{ github.workspace }} || true

      - name: Install Python deps
        working-directory: ${{ github.workspace }}
        run: |
          # Use the Tencent Cloud PyPI mirror to speed installs up.
          python -m pip install -U pip -i https://mirrors.cloud.tencent.com/pypi/simple
          if [ -f requirements.txt ]; then pip install -r requirements.txt -i https://mirrors.cloud.tencent.com/pypi/simple; fi
          if [ -f pyproject.toml ]; then pip install . -i https://mirrors.cloud.tencent.com/pypi/simple; fi
          pip install pytest pytest-cov junit-xml python-dotenv requests -i https://mirrors.cloud.tencent.com/pypi/simple

      - name: Fetch private tests
        working-directory: ${{ github.workspace }}
        env:
          EXTERNAL_GITEA_HOST: ${{ secrets.EXTERNAL_GITEA_HOST }}
        run: |
          set -e

          TESTS_USERNAME="${RUNNER_TESTS_USERNAME:-}"
          TESTS_TOKEN="${RUNNER_TESTS_TOKEN:-}"

          # Unlike the Java template, private tests are mandatory here: fail hard.
          if [ -z "$TESTS_TOKEN" ] || [ -z "$TESTS_USERNAME" ]; then
            echo "❌ RUNNER_TESTS_USERNAME / RUNNER_TESTS_TOKEN 未配置!"
            echo "测试必须从私有的 tests 仓库获取"
            exit 1
          fi

          # Resolve Gitea Host
          if [ -n "$EXTERNAL_GITEA_HOST" ]; then
            HOST="$EXTERNAL_GITEA_HOST"
          elif [ -n "$GITEA_ROOT_URL" ]; then
            HOST=$(echo "$GITEA_ROOT_URL" | sed 's|https\?://||' | sed 's|/$||')
          else
            HOST=$(echo "${{ github.server_url }}" | sed 's|https\?://||' | cut -d'/' -f1)
          fi

          echo "📥 Fetching private tests repository..."
          echo " Gitea host: $HOST"

          # Infer organization and assignment ID from repository name
          ORG=$(echo "${{ github.repository }}" | cut -d'/' -f1)
          REPO_NAME=$(echo "${{ github.repository }}" | cut -d'/' -f2)

          # Extract assignment ID from repo name (e.g., hw1-stu_xxx -> hw1, hw1-template -> hw1)
          if echo "$REPO_NAME" | grep -q -- '-stu_'; then
            ASSIGNMENT_ID=$(echo "$REPO_NAME" | sed 's/-stu_.*//')
          elif echo "$REPO_NAME" | grep -q -- '-template'; then
            ASSIGNMENT_ID=$(echo "$REPO_NAME" | sed 's/-template.*//')
          else
            ASSIGNMENT_ID="hw1" # fallback
          fi

          echo " Organization: $ORG"
          echo " Assignment ID: $ASSIGNMENT_ID"

          AUTH_URL="http://${TESTS_USERNAME}:${TESTS_TOKEN}@${HOST}/${ORG}/${ASSIGNMENT_ID}-tests.git"
          if ! git -c http.sslVerify=false clone --depth=1 "$AUTH_URL" _priv_tests 2>&1; then
            echo "❌ Failed to clone ${ASSIGNMENT_ID}-tests repository!"
            exit 1
          fi

          # Verify the expected test directories exist.
          if [ ! -d "_priv_tests/python" ]; then
            echo "❌ python/ directory not found in ${ASSIGNMENT_ID}-tests!"
            exit 1
          fi

          if [ ! -d "_priv_tests/python/tests" ]; then
            echo "❌ python/tests/ not found in ${ASSIGNMENT_ID}-tests!"
            exit 1
          fi

          # Copy tests into tests/.
          mkdir -p tests
          rsync -a _priv_tests/python/tests/ tests/
          echo "✅ Tests copied: _priv_tests/python/tests/ → tests/"

          # Copy data files if present.
          if [ -d "_priv_tests/python/data" ]; then
            mkdir -p tests/data
            rsync -a _priv_tests/python/data/ tests/data/
            echo "✅ Data files copied: _priv_tests/python/data/ → tests/data/"
          fi

          # Sanity-check that at least one test file made it over.
          if [ -z "$(find tests -name 'test_*.py' 2>/dev/null)" ]; then
            echo "❌ No test files found in tests/ directory!"
            exit 1
          fi

          echo "✅ Test suite ready:"
          find tests -name 'test_*.py'

      - name: Run tests
        working-directory: ${{ github.workspace }}
        run: |
          # Fix the hash seed so test ordering/results are reproducible.
          export PYTHONHASHSEED=2025
          # '|| true' keeps the job alive so the grading step can award partial credit.
          pytest -q --maxfail=0 --junitxml=junit.xml --tb=short || true

      - name: Grade
        working-directory: ${{ github.workspace }}
        run: |
          python ./.autograde/grade.py --junit junit.xml --out grade.json --summary summary.md

      - name: Prepare artifacts
        working-directory: ${{ github.workspace }}
        run: |
          mkdir -p artifacts
          cp junit.xml summary.md grade.json artifacts/ 2>/dev/null || true

      - name: Create grade metadata
        working-directory: ${{ github.workspace }}
        env:
          REPO: ${{ github.repository }}
        run: |
          if [ ! -f grade.json ]; then
            echo "⚠️ grade.json not found, skipping metadata creation"
            exit 0
          fi

          # Generate JSON metadata, preferring the richer script when present.
          if [ -f ./.autograde/create_grade_metadata.py ]; then
            python3 ./.autograde/create_grade_metadata.py > metadata.json || echo "{}" > metadata.json
            echo "✅ Grade metadata created (using create_grade_metadata.py)"
          elif [ -f ./.autograde/create_minimal_metadata.py ]; then
            export GRADE_TYPE=programming
            python3 ./.autograde/create_minimal_metadata.py > metadata.json || echo "{}" > metadata.json
            echo "✅ Grade metadata created (using create_minimal_metadata.py)"
          else
            echo "⚠️ No metadata creation script found, skipping"
            echo "{}" > metadata.json
          fi

      - name: Upload metadata (teacher only)
        # Only runs when the runner is configured with the metadata repo/token.
        if: env.RUNNER_METADATA_REPO != '' && env.RUNNER_METADATA_TOKEN != ''
        working-directory: ${{ github.workspace }}
        shell: bash
        env:
          METADATA_REPO: ${{ env.RUNNER_METADATA_REPO }}
          METADATA_TOKEN: ${{ env.RUNNER_METADATA_TOKEN }}
          METADATA_BRANCH: ${{ env.RUNNER_METADATA_BRANCH }}
          STUDENT_REPO: ${{ github.repository }}
          RUN_ID: ${{ github.run_id }}
          COMMIT_SHA: ${{ github.sha }}
          SERVER_URL: ${{ github.server_url }}
        run: |
          set -e
          if [ ! -f metadata.json ]; then
            echo "No metadata.json found, skip uploading."
            exit 0
          fi

          python ./.autograde/upload_metadata.py \
            --metadata-file metadata.json \
            --metadata-repo "${METADATA_REPO}" \
            --branch "${METADATA_BRANCH:-main}" \
            --student-repo "${STUDENT_REPO}" \
            --run-id "${RUN_ID}" \
            --commit-sha "${COMMIT_SHA}" \
            --workflow grade \
            --server-url "${SERVER_URL}" \
            --external-host "${EXTERNAL_GITEA_HOST}"
          rm -f metadata.json
|
||||||
200
.autograde/workflow_templates/r.yml
Normal file
200
.autograde/workflow_templates/r.yml
Normal file
@ -0,0 +1,200 @@
|
|||||||
|
# Gitea Actions workflow: autograde an R (testthat) assignment.
# Pipeline: install system deps + CRAN packages -> checkout -> fetch private
# tests (mandatory) -> run testthat into JUnit XML -> grade -> upload metadata.
name: autograde-r

on:
  push:
    branches:
      - main
  workflow_dispatch:

permissions:
  contents: read
  pull-requests: write

jobs:
  r:
    runs-on: docker
    container: r-base:4.3.1
    timeout-minutes: 15

    steps:
      - name: Install dependencies (CN mirror)
        run: |
          set -e
          # Rewrite Debian/Ubuntu apt sources to the Tencent Cloud mirror.
          for f in /etc/apt/sources.list /etc/apt/sources.list.d/*.list /etc/apt/sources.list.d/*.sources; do
            [ -f "$f" ] || continue
            sed -i -E 's|https?://deb.debian.org|http://mirrors.cloud.tencent.com|g' "$f" || true
            sed -i -E 's|https?://security.debian.org|http://mirrors.cloud.tencent.com/debian-security|g' "$f" || true
            sed -i -E 's|https?://archive.ubuntu.com|http://mirrors.cloud.tencent.com|g' "$f" || true
            sed -i -E 's|https?://ports.ubuntu.com|http://mirrors.cloud.tencent.com|g' "$f" || true
          done
          apt-get -o Acquire::Check-Valid-Until=false -o Acquire::AllowInsecureRepositories=true update -y
          # -dev headers are needed to compile testthat/covr/xml2 from source.
          DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends git ca-certificates python3 python3-pip nodejs rsync libcurl4-openssl-dev libssl-dev libxml2-dev
          pip3 install --break-system-packages python-dotenv requests -i https://mirrors.cloud.tencent.com/pypi/simple
          rm -rf /var/lib/apt/lists/*

      - name: Configure CRAN Mirror
        run: |
          echo 'options(repos = c(CRAN = "https://mirrors.tuna.tsinghua.edu.cn/CRAN/"))' >> ~/.Rprofile

      - name: Install R packages
        run: |
          Rscript -e 'install.packages(c("testthat", "covr", "xml2"))'

      - name: Checkout code
        uses: actions/checkout@v3
        with:
          fetch-depth: 1

      - name: Fix permissions
        run: |
          # Ensure workspace is owned by current user
          chown -R $(whoami):$(whoami) ${{ github.workspace }} || true

      - name: Fetch private tests
        working-directory: ${{ github.workspace }}
        env:
          EXTERNAL_GITEA_HOST: ${{ secrets.EXTERNAL_GITEA_HOST }}
        run: |
          set -e

          TESTS_USERNAME="${RUNNER_TESTS_USERNAME:-}"
          TESTS_TOKEN="${RUNNER_TESTS_TOKEN:-}"

          # Private tests are mandatory for R grading: fail hard without credentials.
          if [ -z "$TESTS_TOKEN" ] || [ -z "$TESTS_USERNAME" ]; then
            echo "❌ RUNNER_TESTS_USERNAME / RUNNER_TESTS_TOKEN 未配置!"
            echo "测试必须从私有的 tests 仓库获取"
            exit 1
          fi

          # Resolve Gitea Host
          if [ -n "$EXTERNAL_GITEA_HOST" ]; then
            HOST="$EXTERNAL_GITEA_HOST"
          elif [ -n "$GITEA_ROOT_URL" ]; then
            HOST=$(echo "$GITEA_ROOT_URL" | sed 's|https\?://||' | sed 's|/$||')
          else
            HOST=$(echo "${{ github.server_url }}" | sed 's|https\?://||' | cut -d'/' -f1)
          fi

          echo "📥 Fetching private tests repository..."
          echo " Gitea host: $HOST"

          # Infer organization and assignment ID from repository name
          ORG=$(echo "${{ github.repository }}" | cut -d'/' -f1)
          REPO_NAME=$(echo "${{ github.repository }}" | cut -d'/' -f2)

          # Extract assignment ID from repo name (e.g., hw1-stu_xxx -> hw1, hw1-template -> hw1)
          if echo "$REPO_NAME" | grep -q -- '-stu_'; then
            ASSIGNMENT_ID=$(echo "$REPO_NAME" | sed 's/-stu_.*//')
          elif echo "$REPO_NAME" | grep -q -- '-template'; then
            ASSIGNMENT_ID=$(echo "$REPO_NAME" | sed 's/-template.*//')
          else
            ASSIGNMENT_ID="hw1" # fallback
          fi

          echo " Organization: $ORG"
          echo " Assignment ID: $ASSIGNMENT_ID"

          AUTH_URL="http://${TESTS_USERNAME}:${TESTS_TOKEN}@${HOST}/${ORG}/${ASSIGNMENT_ID}-tests.git"
          if ! git -c http.sslVerify=false clone --depth=1 "$AUTH_URL" _priv_tests 2>&1; then
            echo "❌ Failed to clone ${ASSIGNMENT_ID}-tests repository!"
            exit 1
          fi

          # Verify the expected test directories exist.
          if [ ! -d "_priv_tests/r" ]; then
            echo "❌ r/ directory not found in ${ASSIGNMENT_ID}-tests!"
            exit 1
          fi

          if [ ! -d "_priv_tests/r/tests" ]; then
            echo "❌ r/tests/ not found in ${ASSIGNMENT_ID}-tests!"
            exit 1
          fi

          # Copy tests into tests/.
          mkdir -p tests
          rsync -a _priv_tests/r/tests/ tests/
          echo "✅ Tests copied: _priv_tests/r/tests/ → tests/"

          # Sanity-check that at least one test file made it over.
          if [ -z "$(find tests -name 'test_*.R' 2>/dev/null)" ]; then
            echo "❌ No test files found in tests/ directory!"
            exit 1
          fi

          echo "✅ Test suite ready:"
          find tests -name 'test_*.R'

      - name: Run tests
        working-directory: ${{ github.workspace }}
        run: |
          # JunitReporter writes junit.xml; '|| true' keeps the job alive so
          # the grading step can award partial credit.
          Rscript -e 'library(testthat); test_dir("tests", reporter = JunitReporter$new(file = "junit.xml"))' || true

      - name: Grade
        working-directory: ${{ github.workspace }}
        env:
          LANGUAGE: r
        run: |
          python3 ./.autograde/grade.py --junit junit.xml --out grade.json --summary summary.md

      - name: Prepare artifacts
        working-directory: ${{ github.workspace }}
        run: |
          mkdir -p artifacts
          cp junit.xml summary.md grade.json artifacts/ 2>/dev/null || true

      - name: Create grade metadata
        working-directory: ${{ github.workspace }}
        env:
          LANGUAGE: r
          REPO: ${{ github.repository }}
        run: |
          if [ ! -f grade.json ]; then
            echo "⚠️ grade.json not found, skipping metadata creation"
            exit 0
          fi

          # Generate JSON metadata, preferring the richer script when present.
          if [ -f ./.autograde/create_grade_metadata.py ]; then
            python3 ./.autograde/create_grade_metadata.py > metadata.json || echo "{}" > metadata.json
            echo "✅ Grade metadata created (using create_grade_metadata.py)"
          elif [ -f ./.autograde/create_minimal_metadata.py ]; then
            export GRADE_TYPE=programming
            python3 ./.autograde/create_minimal_metadata.py > metadata.json || echo "{}" > metadata.json
            echo "✅ Grade metadata created (using create_minimal_metadata.py)"
          else
            echo "⚠️ No metadata creation script found, skipping"
            echo "{}" > metadata.json
          fi

      - name: Upload metadata (teacher only)
        # Only runs when the runner is configured with the metadata repo/token.
        if: env.RUNNER_METADATA_REPO != '' && env.RUNNER_METADATA_TOKEN != ''
        working-directory: ${{ github.workspace }}
        shell: bash
        env:
          METADATA_REPO: ${{ env.RUNNER_METADATA_REPO }}
          METADATA_TOKEN: ${{ env.RUNNER_METADATA_TOKEN }}
          METADATA_BRANCH: ${{ env.RUNNER_METADATA_BRANCH }}
          STUDENT_REPO: ${{ github.repository }}
          RUN_ID: ${{ github.run_id }}
          COMMIT_SHA: ${{ github.sha }}
          SERVER_URL: ${{ github.server_url }}
        run: |
          set -e
          if [ ! -f metadata.json ]; then
            echo "No metadata.json found, skip uploading."
            exit 0
          fi

          python3 ./.autograde/upload_metadata.py \
            --metadata-file metadata.json \
            --metadata-repo "${METADATA_REPO}" \
            --branch "${METADATA_BRANCH:-main}" \
            --student-repo "${STUDENT_REPO}" \
            --run-id "${RUN_ID}" \
            --commit-sha "${COMMIT_SHA}" \
            --workflow grade \
            --server-url "${SERVER_URL}" \
            --external-host "${EXTERNAL_GITEA_HOST}"
          rm -f metadata.json
|
||||||
Loading…
Reference in New Issue
Block a user