forked from vitrixLab/AIOpsLab
-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathgpt.py
More file actions
126 lines (96 loc) · 4.26 KB
/
gpt.py
File metadata and controls
126 lines (96 loc) · 4.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
"""Naive GPT4 client (with shell access) for AIOpsLab.
Achiam, Josh, Steven Adler, Sandhini Agarwal, Lama Ahmad, Ilge Akkaya, Florencia Leoni Aleman, Diogo Almeida et al.
"Gpt-4 technical report." arXiv preprint arXiv:2303.08774 (2023).
Code: https://openai.com/index/gpt-4-research/
Paper: https://arxiv.org/abs/2303.08774
"""
import os
import asyncio
import tiktoken
import wandb
from aiopslab.orchestrator import Orchestrator
from aiopslab.orchestrator.problems.registry import ProblemRegistry
from clients.utils.llm import GPTClient
from dotenv import load_dotenv
from clients.utils.templates import DOCS_SHELL_ONLY
# Load environment variables from the .env file
load_dotenv()
def count_message_tokens(message, enc):
# Each message format adds ~4 tokens of overhead
tokens = 4 # <|start|>role/name + content + <|end|>
tokens += len(enc.encode(message.get("content", "")))
return tokens
def trim_history_to_token_limit(history, max_tokens=120000, model="gpt-4"):
enc = tiktoken.encoding_for_model(model)
trimmed = []
total_tokens = 0
# Always include the last message
last_msg = history[-1]
last_msg_tokens = count_message_tokens(last_msg, enc)
if last_msg_tokens > max_tokens:
# If even the last message is too big, truncate its content
truncated_content = enc.decode(enc.encode(last_msg["content"])[:max_tokens - 4])
return [{"role": last_msg["role"], "content": truncated_content}]
trimmed.insert(0, last_msg)
total_tokens += last_msg_tokens
# Add earlier messages in reverse until limit is reached
for message in reversed(history[:-1]):
message_tokens = count_message_tokens(message, enc)
if total_tokens + message_tokens > max_tokens:
break
trimmed.insert(0, message)
total_tokens += message_tokens
return trimmed
class GPTAgent:
def __init__(self):
self.history = []
self.llm = GPTClient()
def test(self):
return self.llm.run([{"role": "system", "content": "hello"}])
def init_context(self, problem_desc: str, instructions: str, apis: str):
"""Initialize the context for the agent."""
self.shell_api = self._filter_dict(apis, lambda k, _: "exec_shell" in k)
self.submit_api = self._filter_dict(apis, lambda k, _: "submit" in k)
stringify_apis = lambda apis: "\n\n".join(
[f"{k}\n{v}" for k, v in apis.items()]
)
self.system_message = DOCS_SHELL_ONLY.format(
prob_desc=problem_desc,
shell_api=stringify_apis(self.shell_api),
submit_api=stringify_apis(self.submit_api),
)
self.task_message = instructions
self.history.append({"role": "system", "content": self.system_message})
self.history.append({"role": "user", "content": self.task_message})
async def get_action(self, input) -> str:
"""Wrapper to interface the agent with OpsBench.
Args:
input (str): The input from the orchestrator/environment.
Returns:
str: The response from the agent.
"""
self.history.append({"role": "user", "content": input})
trimmed_history = trim_history_to_token_limit(self.history)
response = self.llm.run(trimmed_history)
print(f"===== Agent (GPT-4o-mini) ====\n{response}")
self.history.append({"role": "assistant", "content": response[0]})
return response[0]
def _filter_dict(self, dictionary, filter_func):
return {k: v for k, v in dictionary.items() if filter_func(k, v)}
if __name__ == "__main__":
# Load use_wandb from environment variable with a default of False
use_wandb = os.getenv("USE_WANDB", "false").lower() == "true"
if use_wandb:
# Initialize wandb running
wandb.init(project="AIOpsLab", entity="AIOpsLab")
problems = ProblemRegistry().PROBLEM_REGISTRY
for pid in problems:
agent = GPTAgent()
orchestrator = Orchestrator()
orchestrator.register_agent(agent, name="gpt-w-shell")
problem_desc, instructs, apis = orchestrator.init_problem(pid)
agent.init_context(problem_desc, instructs, apis)
asyncio.run(orchestrator.start_problem(max_steps=30))
if use_wandb:
# Finish the wandb run
wandb.finish()