forked from jinhaoduan/GTBench
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathjson_example.jsonl
173 lines (172 loc) · 10.9 KB
/
json_example.jsonl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
{
"game_config":{
"game_name":"KuhnPoker"
},
"agents_config":[
{
"agent_name":"PromptAgent",
"num_generations":1,
"majority_vote":false
},
{
"agent_name":"PromptAgent",
"num_generations":1,
"majority_vote":false
}
],
"models_config":[
{
"llm_model_path":"codellama/CodeLlama-34b-Instruct-hf",
"max_tokens":1024,
"timeout":60,
"temperature":0.2,
"model_type":"LLMModel",
"nick_name":"Alice"
},
{
"llm_model_path":"codellama/CodeLlama-34b-Instruct-hf",
"max_tokens":1024,
"timeout":60,
"temperature":0.2,
"model_type":"LLMModel",
"nick_name":"Bob"
}
],
"win_rate":{
"PromptAgent_Bob":1.0
},
"matches":[
{
"winner":"PromptAgent_Bob",
"agents":[
"PromptAgent"
],
"steps":[
{
"agent":"PromptAgent",
"observation":{
"card":"1",
"moves":null,
"player_idx":0,
"openspiel_legal_actions":[
0,
1
],
"legal_moves":[
"<Pass>",
"<Bet>"
],
"env_name":"kuhn_poker"
},
"move":"<Pass>",
"queries":[
{
"messages":[
{
"role":"system",
"content":"You are a powerful gaming agent who can make proper decisions to beat the user in gaming tasks. You are a helpful assistant that strictly follows the user's instructions."
},
{
"role":"user",
"content":"You are currently playing Kuhn Poker, a simplified two-player zero-sum game characterized by imperfect information. The deck consists of only three cards: King (K), Queen (Q), and Jack (J). In this setup, one card is dealt to each player, with the third card set aside and unseen.\nYour card is Queen (Q).\nThis is the first round.\nThe game's betting dynamics are as follows:\nEach player's bet increases the pot by an amount equal to the bet size, typically set at 1 unit per bet.\nIf you <Bet>, you commit 1 unit to the pot, challenging your opponent to either match your bet or fold.\nIf you <Pass>, you avoid increasing the pot and the game proceeds based on the opponent's response.\nYour legal moves are:\n<Bet>: Place 1 unit into the pot, prompting your opponent to either call by matching the bet, increasing the pot further, or to fold, conceding the pot to you.\n<Pass>: Opt out of betting, which, if followed by your opponent's pass, leads to a showdown where the higher card wins the accumulated pot.\nThe objective is to strategically choose an action based on your card and the potential actions of your opponent, aiming to maximize the reward or minimize losses.\nChoose your action based on strategic considerations of your card strength, the opponent's potential card, and the betting history:\nYou should consider choose <Pass> when you have Jack (J) and <Bet> when you have King (K).\n\nPlease output your decision in the following format:\nAction:\n<Your chosen action here>\nEnsure that \"Your chosen action here\" is replaced with either <Pass> or <Bet>, reflecting your decision for this turn in the game. Please return your decision without additional explanation or commentary.\nYou must choose an legal action to set up advantages.\n\nYour output must be in the following format:\n\nAction:\nYour action wrapped with <>, <Pass|Bet> e.g., <Pass>\n\nPlease return your answer without explanation!\n"
}
],
"prompt_type":"move",
"llm_output":[
" Action: <Pass>"
],
"token_size":543
}
],
"token_size":543,
"model_name":"Alice"
},
{
"agent":"PromptAgent",
"observation":{
"card":"2",
"moves":"p",
"player_idx":1,
"openspiel_legal_actions":[
0,
1
],
"legal_moves":[
"<Pass>",
"<Bet>"
],
"env_name":"kuhn_poker"
},
"move":"<Bet>",
"queries":[
{
"messages":[
{
"role":"system",
"content":"You are a powerful gaming agent who can make proper decisions to beat the user in gaming tasks. You are a helpful assistant that strictly follows the user's instructions."
},
{
"role":"user",
"content":"You are currently playing Kuhn Poker, a simplified two-player zero-sum game characterized by imperfect information. The deck consists of only three cards: King (K), Queen (Q), and Jack (J). In this setup, one card is dealt to each player, with the third card set aside and unseen.\nYour card is King (K).\nHere are the past moves in this match:\nIn the 1-st round, the opponent chose to <Pass>.\nThe game's betting dynamics are as follows:\nEach player's bet increases the pot by an amount equal to the bet size, typically set at 1 unit per bet.\nIf you <Bet>, you commit 1 unit to the pot, challenging your opponent to either match your bet or fold.\nIf you <Pass>, you avoid increasing the pot and the game proceeds based on the opponent's response.\nYour legal moves are:\n<Bet>: Place 1 unit into the pot, prompting your opponent to either call by matching the bet, increasing the pot further, or to fold, conceding the pot to you.\n<Pass>: Opt out of betting, which, if followed by your opponent's pass, leads to a showdown where the higher card wins the accumulated pot.\nThe objective is to strategically choose an action based on your card and the potential actions of your opponent, aiming to maximize the reward or minimize losses.\nChoose your action based on strategic considerations of your card strength, the opponent's potential card, and the betting history:\nYou should consider choose <Pass> when you have Jack (J) and <Bet> when you have King (K).\n\nPlease output your decision in the following format:\nAction:\n<Your chosen action here>\nEnsure that \"Your chosen action here\" is replaced with either <Pass> or <Bet>, reflecting your decision for this turn in the game. Please return your decision without additional explanation or commentary.\nYou must choose an legal action to set up advantages.\n\nYour output must be in the following format:\n\nAction:\nYour action wrapped with <>, <Pass|Bet> e.g., <Pass>\n\nPlease return your answer without explanation!\n"
}
],
"prompt_type":"move",
"llm_output":[
" Action: <Bet>"
],
"token_size":564
}
],
"token_size":564,
"model_name":"Bob"
},
{
"agent":"PromptAgent",
"observation":{
"card":"1",
"moves":"pb",
"player_idx":0,
"openspiel_legal_actions":[
0,
1
],
"legal_moves":[
"<Pass>",
"<Bet>"
],
"env_name":"kuhn_poker"
},
"move":"<Bet>",
"queries":[
{
"messages":[
{
"role":"system",
"content":"You are a powerful gaming agent who can make proper decisions to beat the user in gaming tasks. You are a helpful assistant that strictly follows the user's instructions."
},
{
"role":"user",
"content":"You are currently playing Kuhn Poker, a simplified two-player zero-sum game characterized by imperfect information. The deck consists of only three cards: King (K), Queen (Q), and Jack (J). In this setup, one card is dealt to each player, with the third card set aside and unseen.\nYour card is Queen (Q).\nHere are the past moves in this match:\nIn the 1-st round, you chose to <Pass>.\nIn the 2-nd round, the opponent chose to <Bet>.\nThe game's betting dynamics are as follows:\nEach player's bet increases the pot by an amount equal to the bet size, typically set at 1 unit per bet.\nIf you <Bet>, you commit 1 unit to the pot, challenging your opponent to either match your bet or fold.\nIf you <Pass>, you avoid increasing the pot and the game proceeds based on the opponent's response.\nYour legal moves are:\n<Bet>: Place 1 unit into the pot, prompting your opponent to either call by matching the bet, increasing the pot further, or to fold, conceding the pot to you.\n<Pass>: Opt out of betting, which, if followed by your opponent's pass, leads to a showdown where the higher card wins the accumulated pot.\nThe objective is to strategically choose an action based on your card and the potential actions of your opponent, aiming to maximize the reward or minimize losses.\nChoose your action based on strategic considerations of your card strength, the opponent's potential card, and the betting history:\nYou should consider choose <Pass> when you have Jack (J) and <Bet> when you have King (K).\n\nPlease output your decision in the following format:\nAction:\n<Your chosen action here>\nEnsure that \"Your chosen action here\" is replaced with either <Pass> or <Bet>, reflecting your decision for this turn in the game. Please return your decision without additional explanation or commentary.\nYou must choose an legal action to set up advantages.\n\nYour output must be in the following format:\n\nAction:\nYour action wrapped with <>, <Pass|Bet> e.g., <Pass>\n\nPlease return your answer without explanation!\n"
}
],
"prompt_type":"move",
"llm_output":[
" Action: <Bet>"
],
"token_size":580
}
],
"token_size":580,
"model_name":"Alice"
}
],
"status":"Normal",
"agents_at_fault":[
],
"winner_score":2.0,
"loser_score":-2.0,
"token_size":1687
}
],
"token_size":1687
}