From 66ed92cbea622604155f3b8ea3ce91bfc0b62111 Mon Sep 17 00:00:00 2001 From: feilong Date: Wed, 21 Jun 2023 15:37:28 +0800 Subject: [PATCH] refactor directories --- README.md | 20 +++++++++++++++++- ...\346\215\256\350\257\204\344\274\260.xlsx" | Bin {data => backup}/llm-codeing.json | 0 main.py | 0 requirements.txt | 0 5 files changed, 19 insertions(+), 1 deletion(-) rename "AIGC\346\225\260\346\215\256\350\257\204\344\274\260.xlsx" => "backup/AIGC\346\225\260\346\215\256\350\257\204\344\274\260.xlsx" (100%) rename {data => backup}/llm-codeing.json (100%) create mode 100644 main.py create mode 100644 requirements.txt diff --git a/README.md b/README.md index 80afa77..99f959d 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,21 @@ # llm-coding-eval -大模型写代码能力评测 \ No newline at end of file +大模型写代码能力评测 + +## 目录说明 + +* backup/ + * 最早版本的评测,测试例子来自真实的用户查询 + * 评测体系来自基本的分类 +* eval_set/ + * 体系化设计的评测用例 + * 从简单到复杂的编程粒度设计 +* llm_set/ + * 大模型配置列表,配置每一种大模型的元数据 +* src/ + * 评测源代码 +* main.py 程序入口 + +## 同类评测项目 + +1. 斯坦福大学的评测:AlpacaEval Logo Leaderboard diff --git "a/AIGC\346\225\260\346\215\256\350\257\204\344\274\260.xlsx" "b/backup/AIGC\346\225\260\346\215\256\350\257\204\344\274\260.xlsx" similarity index 100% rename from "AIGC\346\225\260\346\215\256\350\257\204\344\274\260.xlsx" rename to "backup/AIGC\346\225\260\346\215\256\350\257\204\344\274\260.xlsx" diff --git a/data/llm-codeing.json b/backup/llm-codeing.json similarity index 100% rename from data/llm-codeing.json rename to backup/llm-codeing.json diff --git a/main.py b/main.py new file mode 100644 index 0000000..e69de29 diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..e69de29 -- GitLab