ACL2026_Logibreak/api.py at main · Applied-Machine-Learning-Lab/ACL2026_Logibreak · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
from openai import OpenAI
import os
import logging
import time


class LLMCall:
    def __init__(self, model_name, API_key=None, max_tokens=256) -> None:
        super().__init__()
        self.API_key = ""
        self.model_name = model_name
        self.max_tokens = max_tokens  # ★★ 新增：最大生成 token 限制 默认 256

        # ====== API Base + Key 按模型类型自动选择 ======
        if self.model_name.lower().startswith("deepseek") and '7b' in self.model_name.lower():
            API_base = ""
        elif self.model_name.lower().startswith("deepseek") and '32b' in self.model_name.lower():
            API_base = ""
            self.API_key = ""
        elif self.model_name.lower().startswith("qwen") and '7b' in self.model_name.lower():
            API_base = ""
        elif self.model_name.lower().startswith("llama3") and '8b' in self.model_name.lower():
            API_base = ""
        elif self.model_name.lower().startswith('llama3') and '70b' in self.model_name.lower():
            API_base = ""
            self.API_key = ""
        elif self.model_name.lower().startswith('gpt'):
            API_base = ""
            self.API_key = ""
        elif self.model_name == 'r1-api':
            API_base = ""
            self.API_key = ""
        elif self.model_name == 'v3-api':
            API_base = ""
            self.API_key = ""

        self.client = OpenAI(api_key=self.API_key, base_url=API_base)

    # ====== 对外接口 ======
    def call(self, messages, seed=0, temperature=1.0):
        response = None

        while response is None:
            try:
                # ====== Deepseek 7B ======
                if self.model_name.lower().startswith("deepseek") and '7b' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model="/data/share_weight/DeepSeek-R1-Distill-Qwen-7B",
                        messages=messages,
                        temperature=temperature,
                        seed=seed,
                        max_tokens=self.max_tokens  # ★★ 新增
                    )

                # ====== Deepseek 32B ======
                elif self.model_name.lower().startswith("deepseek") and '32b' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model="deepseek-r1-distill-qwen-32b-250120",
                        messages=messages,
                        temperature=temperature,
                        seed=seed,
                        max_tokens=self.max_tokens
                    )

                # ====== Qwen ======
                elif self.model_name.lower().startswith("qwen") and '7b' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model="/data/share_weight/Qwen2.5-7B-Instruct",
                        messages=messages,
                        temperature=temperature,
                        seed=seed,
                        max_tokens=self.max_tokens
                    )

                # ====== Llama3 8B ======
                elif self.model_name.lower().startswith("llama3.1") and '8b' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model="/data/share_weight/Llama-3.1-8B-Instruct",
                        messages=messages,
                        temperature=temperature,
                        seed=seed,
                        max_tokens=self.max_tokens
                    )

                elif self.model_name.lower().startswith("llama3.2") and '11b' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model="/data/share_weight/Llama-3.2-11B-Vision-Instruct",
                        messages=messages,
                        temperature=temperature,
                        seed=seed,
                        max_tokens=self.max_tokens
                    )

                elif self.model_name.lower().startswith("llama3") and '8b' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model="/data/share_weight/Meta-Llama-3-8B-Instruct",
                        messages=messages,
                        temperature=temperature,
                        seed=seed,
                        max_tokens=self.max_tokens
                    )

                # ====== Llama3 70B ======
                elif self.model_name.lower().startswith('llama3') and '70b' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model="llama3-70b",
                        messages=messages,
                        temperature=temperature,
                        seed=seed,
                        max_tokens=self.max_tokens
                    )

                # ====== o3-mini ======
                elif 'o3-mini' in self.model_name.lower():
                    response = self.client.chat.completions.create(
                        model='o3-mini',
                        messages=messages,
                        temperature=temperature,
                        max_tokens=self.max_tokens
                    )

                # ====== GPT 系列 ======
                elif 'gpt' in self.model_name.lower():
                    if '4o-mini' in self.model_name:
                        response = self.client.chat.completions.create(
                            model='gpt-4o-mini',
                            messages=messages,
                            temperature=temperature,
                            max_tokens=self.max_tokens
                        )
                    elif 'gpt-4' in self.model_name:
                        response = self.client.chat.completions.create(
                            model='gpt-4-turbo',
                            messages=messages,
                            temperature=temperature,
                            max_tokens=self.max_tokens
                        )
                    elif 'gpt-3.5' in self.model_name:
                        response = self.client.chat.completions.create(
                            model='gpt-3.5-turbo',
                            messages=messages,
                            temperature=temperature,
                            max_tokens=self.max_tokens
                        )

                # ====== r1-api ======
                elif self.model_name == 'r1-api':
                    response = self.client.chat.completions.create(
                        model='deepseek-reasoner',
                        messages=messages,
                        temperature=temperature,
                        max_tokens=self.max_tokens
                    )

                # ====== v3-api ======
                elif self.model_name == 'v3-api':
                    response = self.client.chat.completions.create(
                        model='deepseek-v3-250324',
                        messages=messages,
                        temperature=temperature,
                        max_tokens=self.max_tokens
                    )

                else:
                    return "Unsupported model name."

            except Exception as e:
                logging.warning(e)
                return "Unable to reach the response due to some reasons."

        return response.choices[0].message.content