Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Blame
Revision Log

dreamteam109_agent.py@ 77

Last change on this file since 77 was 75, checked in by wouter, 2 years ago
#6 added ANAC2022 parties
File size: 16.0 KB

Line
1	import datetime
2	import json
3	import logging
4	from math import floor
5	from random import randint
6	import time
7	from decimal import Decimal
8	from os import path
9	from typing import TypedDict, cast
10
11	from geniusweb.actions.Accept import Accept
12	from geniusweb.actions.Action import Action
13	from geniusweb.actions.Offer import Offer
14	from geniusweb.actions.PartyId import PartyId
15	from geniusweb.bidspace.AllBidsList import AllBidsList
16	from geniusweb.inform.ActionDone import ActionDone
17	from geniusweb.inform.Finished import Finished
18	from geniusweb.inform.Inform import Inform
19	from geniusweb.inform.Settings import Settings
20	from geniusweb.inform.YourTurn import YourTurn
21	from geniusweb.issuevalue.Bid import Bid
22	from geniusweb.issuevalue.Domain import Domain
23	from geniusweb.party.Capabilities import Capabilities
24	from geniusweb.party.DefaultParty import DefaultParty
25	from geniusweb.issuevalue.Value import Value
26	from geniusweb.profile.utilityspace.LinearAdditiveUtilitySpace import (
27	LinearAdditiveUtilitySpace,
28	)
29	from geniusweb.profileconnection.ProfileConnectionFactory import (
30	ProfileConnectionFactory,
31	)
32	from geniusweb.progress.ProgressTime import ProgressTime
33	from geniusweb.references.Parameters import Parameters
34	from tudelft_utilities_logging.ReportToLogger import ReportToLogger
35	from .utils.logger import Logger
36
37	from .utils.opponent_model import OpponentModel
38	from .utils.utils import bid_to_string
39
class SessionData(TypedDict):
    """Record of one finished negotiation session, stored per opponent."""

    # Progress value read from the session's Progress object at the end.
    progressAtFinish: float
    # Our utility for the agreed bid; remains 0 when no agreement was made.
    utilityAtFinish: float
    # True when this agent created the Accept action.
    didAccept: bool
    # True when utilityAtFinish reached the agent's min_util.
    isGood: bool
    # top_bids_percentage that was in effect for the session.
    topBidsPercentage: float
    # force_accept_at_remaining_turns that was in effect for the session.
    forceAcceptAtRemainingTurns: float
47
class DataDict(TypedDict):
    """Top-level structure of the JSON data kept about one opponent."""

    # One record per finished session, in the order they were appended.
    sessions: list[SessionData]
50
51	class DreamTeam109Agent(DefaultParty):
52
def __init__(self):
    """Create the party with no session bound yet and default strategy values.

    Attributes that depend on a running session start as ``None`` and are
    assigned by the other methods once the corresponding information arrives.
    """
    super().__init__()
    self.logger: Logger = Logger(self.getReporter(), id(self))

    # Session context, assigned when the Settings message is handled.
    self.settings: Settings | None = None
    self.parameters: Parameters | None = None
    self.progress: ProgressTime | None = None
    self.profile: LinearAdditiveUtilitySpace | None = None
    self.domain: Domain | None = None
    self.storage_dir: str | None = None

    # Identities: our own id, and the opponent's id / name once it has acted.
    self.me: PartyId | None = None
    self.other: PartyId | None = None
    self.other_name: str | None = None

    # Stored knowledge about the current opponent (see attempt_load_data).
    self.data_dict: DataDict | None = None

    # Bidding state.
    self.last_received_bid: Bid | None = None
    self.opponent_best_bid: Bid | None = None
    self.opponent_model: OpponentModel | None = None
    self.all_bids: AllBidsList | None = None
    # Filled lazily by find_bid with (bid, utility) pairs, best first.
    self.bids_with_utilities: list[tuple[Bid, float]] | None = None
    self.num_of_top_bids: int = 1
    self.min_util: float = 0.9

    # Timing of our own turns; my_turn appends second differences here.
    self.round_times: list[float] = []
    self.last_time = None
    self.avg_time = None

    # Session outcome, written to the data dict when the session finishes.
    self.utility_at_finish: float = 0
    self.did_accept: bool = False

    # Strategy parameters that learn_from_past_sessions may override.
    self.top_bids_percentage: float = 1 / 300
    self.force_accept_at_remaining_turns: float = 1
    self.force_accept_at_remaining_turns_light: float = 1

    self.logger.log(logging.INFO, "party is initialized")
86
def notifyChange(self, data: Inform):
    """MUST BE IMPLEMENTED
    This is the entry point of all interaction with your agent after it has been initialised.
    How to handle the received data is based on its class type.

    Args:
        data (Inform): Contains either a request for action or information.
    """
    if isinstance(data, Settings):
        # a Settings message is the first message that will be sent to your
        # agent containing all the information about the negotiation session.
        self._on_settings(cast(Settings, data))
    elif isinstance(data, ActionDone):
        # ActionDone informs you of an action (an offer or an accept)
        # that is performed by one of the agents (including yourself).
        self._on_action_done(cast(ActionDone, data))
    elif isinstance(data, YourTurn):
        # YourTurn notifies you that it is your turn to act
        self.my_turn()
    elif isinstance(data, Finished):
        # Finished will be sent if the negotiation has ended (through agreement or deadline)
        self._on_finished(cast(Finished, data))
    else:
        self.logger.log(logging.WARNING, "Ignoring unknown info " + str(data))


def _on_settings(self, settings: Settings):
    """Store the session settings and load our profile, domain and bid space."""
    self.settings = settings
    self.me = self.settings.getID()

    # progress towards the deadline has to be tracked manually through the use of the Progress object
    self.progress = self.settings.getProgress()

    self.parameters = self.settings.getParameters()
    self.storage_dir = self.parameters.get("storage_dir")

    # the profile contains the preferences of the agent over the domain
    profile_connection = ProfileConnectionFactory.create(
        settings.getProfile().getURI(), self.getReporter()
    )
    try:
        self.profile = profile_connection.getProfile()
        self.domain = self.profile.getDomain()
        # compose a list of all possible bids
        self.all_bids = AllBidsList(self.domain)
    finally:
        # close the connection even when loading the profile fails
        profile_connection.close()


def _on_action_done(self, info: ActionDone):
    """Process an action performed by the opponent; our own actions are ignored."""
    action = info.getAction()
    actor = action.getActor()

    if actor != self.me:
        if self.other is None:
            self.other = actor
            # obtain the name of the opponent, cutting off the position ID.
            self.other_name = str(actor).rsplit("_", 1)[0]
            self.attempt_load_data()
            self.learn_from_past_sessions(self.data_dict["sessions"])

        # process action done by opponent
        self.opponent_action(action)


def _on_finished(self, info: Finished):
    """Record the session outcome, persist it, and always terminate the party."""
    try:
        agreement_map = info.getAgreements().getMap()
        if len(agreement_map) > 0:
            agreed_bid = agreement_map[self.me]
            self.logger.log(logging.INFO, "agreed_bid = " + bid_to_string(agreed_bid))
            self.utility_at_finish = float(self.profile.getUtility(agreed_bid))
        else:
            self.logger.log(logging.INFO, "no agreed bid (timeout? some agent crashed?)")

        if self.data_dict is None:
            # data_dict is only created on the opponent's first action; without
            # it there is nothing to append the session record to.
            self.logger.log(logging.WARNING, "No opponent data loaded; skipping session data update")
        else:
            self.update_data_dict()
        self.save_data()
    finally:
        # terminate the agent MUST BE CALLED, also when the bookkeeping above
        # raised; the exception (if any) still propagates afterwards.
        self.logger.log(logging.INFO, "party is terminating")
        super().terminate()
159
def getCapabilities(self) -> Capabilities:
    """MUST BE IMPLEMENTED
    Tells the protocol which behaviours and profile types this agent supports.
    Leave it as is for the ANL 2022 competition

    Returns:
        Capabilities: Capabilities representation class
    """
    supported_protocols = {"SAOP"}
    supported_profiles = {"geniusweb.profile.utilityspace.LinearAdditive"}
    return Capabilities(supported_protocols, supported_profiles)
172
def send_action(self, action: Action):
    """Hand an action of this agent to the party's connection.

    Args:
        action (Action): action of this agent
    """
    connection = self.getConnection()
    connection.send(action)
180
181	# give a description of your agent
def getDescription(self) -> str:
    """MUST BE IMPLEMENTED
    Gives a short (1 or 2 sentences) description of this agent.

    Returns:
        str: Agent description
    """
    description = "DreamTeam109 agent for the ANL 2022 competition"
    return description
190
def opponent_action(self, action):
    """Handle an action received from the opponent.

    Only offers are processed: the offered bid is fed to the opponent model,
    remembered as the last received bid, and kept as the opponent's best bid
    when it gives us strictly more utility than the best one seen so far.

    Args:
        action (Action): action of opponent
    """
    if not isinstance(action, Offer):
        return

    # the opponent model is created on the first offer
    if self.opponent_model is None:
        self.opponent_model = OpponentModel(self.domain, self.logger)

    offered_bid = cast(Offer, action).getBid()
    self.opponent_model.update(offered_bid)
    self.last_received_bid = offered_bid

    best_so_far = self.opponent_best_bid
    if best_so_far is None or self.profile.getUtility(offered_bid) > self.profile.getUtility(best_so_far):
        self.opponent_best_bid = offered_bid
214
def my_turn(self):
    """This method is called when it is our turn. It decides upon an action
    to perform and sends this action to the opponent.

    Before deciding, it records the time elapsed since our previous turn and
    refreshes ``self.avg_time`` with the mean of the most recent (at most
    three) round durations, in seconds.
    """
    # Read the clock once so the recorded duration and the new reference
    # point are based on the same instant.
    now = datetime.datetime.now()
    if self.last_time is not None:
        self.round_times.append(now.timestamp() - self.last_time.timestamp())
        recent_rounds = self.round_times[-3:]
        # Divide by the number of samples actually available; dividing by a
        # fixed 3 underestimates the average during the first two rounds.
        self.avg_time = sum(recent_rounds) / len(recent_rounds)
    self.last_time = now

    # check if the last received offer is good enough
    if self.accept_condition(self.last_received_bid):
        self.logger.log(logging.INFO, "accepting bid : " + bid_to_string(self.last_received_bid))
        # if so, accept the offer
        action = Accept(self.me, self.last_received_bid)
        self.did_accept = True
    else:
        # if not, find a bid to propose as counter offer
        bid = self.find_bid()
        self.logger.log(logging.INFO, "Offering bid : " + bid_to_string(bid))
        action = Offer(self.me, bid)

    # send the action
    self.send_action(action)
241
def get_data_file_path(self) -> str:
    """Return the path of the JSON file that holds data about the current opponent.

    The path is the storage directory, a forward slash, and the opponent
    name with a ``.json`` suffix.
    """
    return "{}/{}.json".format(self.storage_dir, self.other_name)
244
def attempt_load_data(self):
    """Load previously saved data about the current opponent into ``self.data_dict``.

    When the data file does not exist, cannot be read, is not valid JSON, or
    does not contain a ``"sessions"`` list, ``self.data_dict`` is set to an
    empty data dict (``{"sessions": []}``) and a warning is logged, so that
    callers can always index ``self.data_dict["sessions"]`` afterwards.
    """
    loaded = None
    try:
        # Open directly instead of checking for existence first: the check
        # and the open are then a single step and cannot disagree.
        with open(self.get_data_file_path(), encoding="utf-8") as f:
            loaded = json.load(f)
    except FileNotFoundError:
        self.logger.log(logging.WARN, "No previous data saved about opponent: " + self.other_name)
    except (OSError, ValueError) as err:
        # ValueError covers json.JSONDecodeError and UnicodeDecodeError.
        self.logger.log(
            logging.WARNING,
            "Could not read data about opponent " + self.other_name + ": " + str(err),
        )
    else:
        if isinstance(loaded, dict) and isinstance(loaded.get("sessions"), list):
            self.logger.log(logging.INFO, "Loaded previous data about opponent: " + self.other_name)
            self.logger.log(logging.INFO, "data_dict = " + str(loaded))
        else:
            self.logger.log(logging.WARNING, "Ignoring malformed data about opponent: " + self.other_name)
            loaded = None

    # initialize an empty data dict when nothing usable was loaded
    self.data_dict = loaded if loaded is not None else {"sessions": []}
257
def update_data_dict(self):
    """Append a record of the session that just finished to ``self.data_dict``.

    Does nothing (apart from logging a warning) when no data dict exists yet,
    which is the case when the session ends before any opponent action was
    seen.
    """
    # NOTE: We shouldn't do extensive calculations in this method (see note in save_data method)

    if self.data_dict is None:
        self.logger.log(logging.WARNING, "No data dict available; skipping session data update")
        return

    progress_at_finish = self.progress.get(time.time() * 1000)

    session_data: SessionData = {
        "progressAtFinish": progress_at_finish,
        "utilityAtFinish": self.utility_at_finish,
        "didAccept": self.did_accept,
        "isGood": self.utility_at_finish >= self.min_util,
        "topBidsPercentage": self.top_bids_percentage,
        "forceAcceptAtRemainingTurns": self.force_accept_at_remaining_turns,
    }

    self.logger.log(logging.INFO, "Updating data dict with session data: " + str(session_data))
    self.data_dict["sessions"].append(session_data)
274
def save_data(self):
    """This method is called after the negotiation is finished. It can be used to store data
    for learning capabilities. Note that no extensive calculations can be done within this method.
    Taking too much time might result in your agent being killed, so use it for storage only.

    Nothing is written when the opponent name was never set. A failure to
    write the file is logged as an error instead of being raised.
    """
    if self.other_name is None:
        self.logger.log(logging.WARNING, "Opponent name was not set; skipping save data")
        return

    # Serialize before opening the file so a serialization error cannot
    # leave a truncated file behind.
    json_data = json.dumps(self.data_dict, sort_keys=True, indent=4)
    try:
        with open(self.get_data_file_path(), "w", encoding="utf-8") as f:
            f.write(json_data)
    except OSError as err:
        self.logger.log(
            logging.ERROR,
            "Could not save data about opponent " + self.other_name + ": " + str(err),
        )
        return
    self.logger.log(logging.INFO, "Saved data about opponent: " + self.other_name)
287
def learn_from_past_sessions(self, sessions: list[SessionData]):
    """Choose strategy parameters from the stored sessions with this opponent.

    The number of failed sessions (see ``did_fail``) selects both forced-accept
    settings, and the number of low-utility sessions (see ``low_utility``)
    selects the top-bids percentage. Counts beyond a table's length select
    its last entry.

    Args:
        sessions (list[SessionData]): stored records of earlier sessions
    """
    def pick_level(levels, count):
        # clamp the count to the last available level
        return levels[min(len(levels) - 1, count)]

    failed_sessions = sum(1 for session in sessions if self.did_fail(session))
    low_utility_sessions = sum(1 for session in sessions if self.low_utility(session))

    self.force_accept_at_remaining_turns = pick_level([0, 0, 1, 1.1], failed_sessions)
    self.force_accept_at_remaining_turns_light = pick_level([0, 1, 1.1], failed_sessions)
    self.top_bids_percentage = pick_level([1 / 300, 1 / 100, 1 / 30], low_utility_sessions)
296
def did_fail(self, session: SessionData):
    """Tell whether a stored session ended with a utility of exactly 0 for us."""
    final_utility = session["utilityAtFinish"]
    return final_utility == 0
299
def low_utility(self, session: SessionData):
    """Tell whether a stored session ended with a utility below 0.5 for us."""
    final_utility = session["utilityAtFinish"]
    return final_utility < 0.5
302
def accept_condition(self, bid: Bid) -> bool:
    """Decide whether the given bid should be accepted.

    A bid is accepted when any of the following holds:

    * its utility for us is at least ``self.min_util``;
    * progress has reached the forced-accept threshold;
    * progress is past the light threshold and the bid's utility is at least
      that of the bid ranked at one fifth of our sorted bid list.

    Without timing information the thresholds are 0.98 and 0.95; otherwise
    they are derived from the average round time and the session duration.

    Args:
        bid (Bid): bid to judge; ``None`` is never accepted

    Returns:
        bool: True when the bid should be accepted
    """
    if bid is None:
        return False

    # progress of the negotiation session between 0 and 1 (1 is deadline)
    progress = self.progress.get(time.time() * 1000)
    threshold = 0.98
    light_threshold = 0.95

    if self.avg_time is not None:
        threshold = 1 - 1000 * self.force_accept_at_remaining_turns * self.avg_time / self.progress.getDuration()
        light_threshold = 1 - 5000 * self.force_accept_at_remaining_turns_light * self.avg_time / self.progress.getDuration()

    utility = self.profile.getUtility(bid)
    if utility >= self.min_util or progress >= threshold:
        return True

    # The ranked bid list is only built by find_bid; before that (or for an
    # empty list) the light condition cannot be evaluated.
    if progress > light_threshold and self.bids_with_utilities:
        # Clamp at 0: with fewer than 5 bids the raw index would be -1 and
        # select the worst bid instead of the best one.
        reference_rank = max(0, floor(len(self.bids_with_utilities) / 5) - 1)
        return utility >= self.bids_with_utilities[reference_rank][1]

    return False
322
def find_bid(self) -> Bid:
    """Choose the bid to offer next.

    On first use, every bid of the domain is paired with our utility and the
    pairs are cached in ``self.bids_with_utilities``, sorted best first.

    * Before any bid was received, our best bid is returned.
    * Past the light threshold, the opponent's best bid so far is returned.
    * Otherwise a bid is drawn uniformly at random from our top-ranked bids,
      and ``self.min_util`` is set to the utility of the lowest of them.

    Returns:
        Bid: the bid to offer
    """
    self.logger.log(logging.INFO, "finding bid...")

    num_of_bids = self.all_bids.size()

    if self.bids_with_utilities is None:
        self.logger.log(logging.INFO, "calculating bids_with_utilities...")
        start_time = time.time()

        # Build the list completely before storing it, so a failure part-way
        # cannot leave a partial list that later calls would take as final.
        ranked_bids = []
        for index in range(num_of_bids):
            bid = self.all_bids.get(index)
            ranked_bids.append((bid, float(self.profile.getUtility(bid))))
        ranked_bids.sort(key=lambda tup: tup[1], reverse=True)
        self.bids_with_utilities = ranked_bids

        end_time = time.time()
        self.logger.log(logging.INFO, "calculating bids_with_utilities took (in seconds): " + str(end_time - start_time))

    self.num_of_top_bids = max(5, num_of_bids * self.top_bids_percentage)

    if self.last_received_bid is None:
        return self.bids_with_utilities[0][0]

    progress = self.progress.get(time.time() * 1000)
    light_threshold = 0.95

    if self.avg_time is not None:
        light_threshold = 1 - 5000 * self.force_accept_at_remaining_turns_light * self.avg_time / self.progress.getDuration()

    if progress > light_threshold:
        return self.opponent_best_bid

    if num_of_bids < self.num_of_top_bids:
        self.num_of_top_bids = num_of_bids / 2

    # At least one bid must remain selectable: for a single-bid domain the
    # halved count floors to 0, which would make randint(0, -1) raise.
    top_count = max(1, floor(self.num_of_top_bids))

    self.min_util = self.bids_with_utilities[top_count - 1][1]
    self.logger.log(logging.INFO, "min_util = " + str(self.min_util))

    picked_ranking = randint(0, top_count - 1)

    return self.bids_with_utilities[picked_ranking][0]
366
def score_bid(self, bid: Bid, alpha: float = 0.95, eps: float = 0.1) -> float:
    """Compute a heuristic score for a bid.

    The score weighs our own utility by ``alpha * time_pressure`` and, when
    an opponent model exists, the predicted opponent utility by the
    complement of that weight.

    Args:
        bid (Bid): Bid to score
        alpha (float, optional): Trade-off factor between self interested and
            altruistic behaviour. Defaults to 0.95.
        eps (float, optional): Time pressure factor, balances between conceding
            and Boulware behaviour over time. Defaults to 0.1.

    Returns:
        float: score
    """
    progress = self.progress.get(time.time() * 1000)
    own_utility = float(self.profile.getUtility(bid))

    time_pressure = 1.0 - progress ** (1 / eps)
    own_weight = alpha * time_pressure
    total = own_weight * own_utility

    if self.opponent_model is None:
        return total

    predicted_utility = self.opponent_model.get_predicted_utility(bid)
    total += (1.0 - own_weight) * predicted_utility
    return total

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: ANL2022/dreamteam109_agent/dreamteam109_agent.py@ 77

Download in other formats: