Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion .github/workflows/pr-auto-label.yml
Original file line number Diff line number Diff line change
Expand Up @@ -37,7 +37,8 @@ jobs:
'dependabot': 'dependencies',
'upgrade': 'dependencies',
'security': 'security',
'ci': 'ci'
'ci': 'ci',
'refactor': 'maintenance'
};

// 提取标题的第一个单词(冒号前的部分)
Expand Down
8 changes: 1 addition & 7 deletions evaluate/base/evaluation.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
import re
import time
import uuid
from typing import Dict, Any, List

from bohrium import Bohrium
from dotenv import load_dotenv, find_dotenv
Expand Down Expand Up @@ -115,13 +116,6 @@ def multi_turn_evaluation_task(dataset_item):
return result


import asyncio
import json
import re
import time
from typing import Dict, Any, List


async def _run_conversation(dataset_item: Dict[str, Any], max_turn_count: int, save_mode: str = 'w') -> Dict[str, Any]:
"""
执行一次对话测试,并返回结果
Expand Down
Original file line number Diff line number Diff line change
@@ -1,16 +1,26 @@
#!/bin/bash
PYTHON=.venv/bin/python # your .venv

SCRIPT_PATH=$(realpath "$BASH_SOURCE")
MATMASTER_DIR=$(dirname $(dirname $(dirname $(dirname "$SCRIPT_PATH"))))
THREADS_DIR=$MATMASTER_DIR/evaluate/experiments/threads

if [ x"$1" == x ];then
echo "Please specify evaluation type...[$(ls -l $THREADS_DIR | grep '^d' | awk '{print $9}'| xargs)]"
exit 1
fi

PYTHON=$MATMASTER_DIR/.venv/bin/python # your .venv
set -a
source .env # your .env
source $MATMASTER_DIR/.env # your .env
set +a

export PYTHONPATH=/your/matmaster/path/MatMaster:$PYTHONPATH
export PYTHONPATH=$MATMASTER_DIR:$PYTHONPATH
export MAX_JOBS=3

TOTAL=$($PYTHON -c "
import os
import json
with open('database_search.json') as f:
with open('$THREADS_DIR/$1/$1.json') as f:
dataset_json = json.load(f)
print(len(dataset_json))
")
Expand All @@ -22,7 +32,7 @@ running_jobs=0
for ((i=0; i<$TOTAL; i++)); do
echo "🚀 提交任务: item $i"
sleep 3
$PYTHON database_search_bash.py \
$PYTHON $THREADS_DIR/$1/$1_bash.py \
--item_id $i > item_$i.log 2>&1 &

((running_jobs++))
Expand Down
39 changes: 0 additions & 39 deletions evaluate/experiments/threads/structure_generate/run.sh

This file was deleted.

Loading