Spaces:

ksort
/

K-Sort-Arena

Running on Zero

App Files Files Community

K-Sort-Arena / model /matchmaker.py

ksort

Update ssh

afa1318 3 months ago

raw

history blame

No virus

4.15 kB

	import numpy as np
	import json
	from trueskill import TrueSkill
	import paramiko
	import io, os
	import sys
	sys.path.append('../')
	from serve.constants import SSH_SERVER, SSH_PORT, SSH_USER, SSH_PASSWORD, SSH_SKILL
	# Shared TrueSkill environment built with the library's default parameters;
	# the rating helpers in this module use it to re-rate players and to rebuild
	# Rating objects from their stored mu/sigma values.
	trueskill_env = TrueSkill()

	# Module-level SSH and SFTP handles. They start unset, are populated by
	# create_ssh_matchmaker_client(), and are probed by is_connected().
	ssh_matchmaker_client = None
	sftp_matchmaker_client = None

	def create_ssh_matchmaker_client(server, port, user, password):
	    """Open the module-wide SSH connection and its SFTP session.

	    Any handles left over from a previous connection are closed first, so
	    calling this again to reconnect does not leak sockets or transport
	    threads. On success the module globals ``ssh_matchmaker_client`` and
	    ``sftp_matchmaker_client`` point at the new connection; if connecting
	    fails the exception propagates and the SSH handle is left as ``None``.

	    Args:
	        server: Host name or address of the SSH server.
	        port: TCP port of the SSH server.
	        user: Login user name.
	        password: Login password.
	    """
	    global ssh_matchmaker_client, sftp_matchmaker_client

	    # Release stale handles (SFTP session first, then the SSH client that
	    # owns it). Closing is best-effort: a dead connection may raise here.
	    for stale_handle in (sftp_matchmaker_client, ssh_matchmaker_client):
	        if stale_handle is None:
	            continue
	        try:
	            stale_handle.close()
	        except Exception as e:
	            print(f"Error closing stale SSH/SFTP handle: {e}")
	    ssh_matchmaker_client = None
	    sftp_matchmaker_client = None

	    client = paramiko.SSHClient()
	    client.load_system_host_keys()
	    # NOTE(review): AutoAddPolicy accepts host keys that are not already
	    # known, which skips host verification for new servers -- confirm this
	    # is acceptable for the deployment.
	    client.set_missing_host_key_policy(paramiko.AutoAddPolicy())
	    client.connect(server, port, user, password)

	    # Send a keepalive packet every 60 seconds.
	    transport = client.get_transport()
	    transport.set_keepalive(60)

	    # Publish the handles only once the connection is actually established.
	    ssh_matchmaker_client = client
	    sftp_matchmaker_client = client.open_sftp()
	def is_connected():
	    """Report whether the shared SSH and SFTP handles are currently usable.

	    Returns:
	        ``False`` if either handle is unset, if the SSH client has no
	        transport or the transport is inactive, or if a directory listing
	        over SFTP raises; ``True`` otherwise.
	    """
	    if ssh_matchmaker_client is None or sftp_matchmaker_client is None:
	        return False

	    # Check that the SSH connection is healthy. The client may have no
	    # transport at all (e.g. after it was closed), which must count as
	    # "not connected" rather than raise AttributeError.
	    transport = ssh_matchmaker_client.get_transport()
	    if transport is None or not transport.is_active():
	        return False

	    # Check that the SFTP session is healthy by listing the current
	    # remote directory.
	    try:
	        sftp_matchmaker_client.listdir('.')
	    except Exception as e:
	        print(f"Error checking SFTP connection: {e}")
	        return False
	    return True
	def ucb_score(trueskill_diff, t, n, exploration_weight=1.0):
	    """Compute an upper-confidence-bound score for candidate opponents.

	    The score rewards a small skill gap (``-trueskill_diff``) plus an
	    exploration bonus ``sqrt(2 * ln(t) / n)`` that is larger for candidates
	    that have been compared less often.

	    Args:
	        trueskill_diff: Skill gap to the pivot (scalar or NumPy array).
	        t: Total number of comparisons so far.
	        n: Per-candidate comparison counts (scalar or NumPy array).
	        exploration_weight: Multiplier on the exploration bonus.

	    Returns:
	        The UCB score, broadcast over the inputs.
	    """
	    # Clamp the log argument at 1 so the bonus is 0 (not NaN from the square
	    # root of a negative number) before any comparisons exist; for t >= 1
	    # this is exactly log(t + 1e-5).
	    log_total = np.log(np.maximum(t + 1e-5, 1.0))
	    # The 1e-5 in the denominator avoids division by zero for unseen pairs.
	    exploration_term = np.sqrt((2 * log_total) / (n + 1e-5))
	    return -trueskill_diff + exploration_weight * exploration_term

	def update_trueskill(ratings, ranks):
	    """Re-rate ``ratings`` according to ``ranks`` with the shared environment.

	    Both arguments are handed straight to ``trueskill_env.rate`` and its
	    result is returned unchanged.
	    """
	    return trueskill_env.rate(ratings, ranks)

	def serialize_rating(rating):
	    """Convert a rating into a plain dict holding its ``mu`` and ``sigma``."""
	    return dict(mu=rating.mu, sigma=rating.sigma)

	def deserialize_rating(rating_dict):
	    """Rebuild a rating in the shared environment from a ``mu``/``sigma`` dict."""
	    fields = ('mu', 'sigma')
	    return trueskill_env.Rating(**{name: rating_dict[name] for name in fields})

	def save_json_via_sftp(ratings, comparison_counts, total_comparisons):
	    """Write the matchmaker state as JSON to the remote ``SSH_SKILL`` file.

	    The SSH/SFTP connection is (re)established first when it is not usable.

	    Args:
	        ratings: Iterable of ratings; each is stored as its mu/sigma pair.
	        comparison_counts: Array of comparison counts; stored via ``tolist()``.
	        total_comparisons: Total number of comparisons; stored as given.
	    """
	    if not is_connected():
	        create_ssh_matchmaker_client(SSH_SERVER, SSH_PORT, SSH_USER, SSH_PASSWORD)

	    serialized_ratings = list(map(serialize_rating, ratings))
	    payload = json.dumps({
	        'ratings': serialized_ratings,
	        'comparison_counts': comparison_counts.tolist(),
	        'total_comparisons': total_comparisons,
	    })

	    with sftp_matchmaker_client.open(SSH_SKILL, 'w') as remote_file:
	        remote_file.write(payload)

	def load_json_via_sftp():
	    """Read the matchmaker state back from the remote ``SSH_SKILL`` JSON file.

	    The SSH/SFTP connection is (re)established first when it is not usable.

	    Returns:
	        A ``(ratings, comparison_counts, total_comparisons)`` tuple: the
	        ratings rebuilt from their stored mu/sigma pairs, the comparison
	        counts as a NumPy array, and the stored total.
	    """
	    if not is_connected():
	        create_ssh_matchmaker_client(SSH_SERVER, SSH_PORT, SSH_USER, SSH_PASSWORD)

	    with sftp_matchmaker_client.open(SSH_SKILL, 'r') as remote_file:
	        state = json.load(remote_file)

	    return (
	        [deserialize_rating(entry) for entry in state['ratings']],
	        np.array(state['comparison_counts']),
	        state['total_comparisons'],
	    )


	class RunningPivot:
	    """Holder for the history of recently selected pivot players."""

	    # Class-level list shared by every caller in the process; matchmaker()
	    # appends each selected pivot and keeps only the five most recent.
	    running_pivot = list()

	def matchmaker(num_players, k_group=4):
	    """Choose the group of players for the next comparison.

	    The pivot is the player with the fewest recorded comparisons that was
	    not a pivot in the last five calls. The remaining ``k_group - 1`` slots
	    go to the players with the highest UCB score relative to the pivot
	    (small skill gap, few comparisons against the pivot).

	    Args:
	        num_players: Only the first ``num_players`` stored players are
	            considered.
	        k_group: Size of the returned group, pivot included.

	    Returns:
	        A list of player indices (plain ints): the pivot first, followed by
	        its opponents in ascending UCB-score order. It is shorter than
	        ``k_group`` when fewer players are available.
	    """
	    ratings, comparison_counts, total_comparisons = load_json_via_sftp()

	    ratings = ratings[:num_players]
	    # Work on a float copy: the masking below stores +inf, which an integer
	    # array cannot hold.
	    comparison_counts = np.array(
	        comparison_counts[:num_players, :num_players], dtype=float
	    )

	    # Ignore remembered pivots that fall outside the current player range.
	    recent_pivots = [
	        p for p in RunningPivot.running_pivot if p < comparison_counts.shape[0]
	    ]

	    # Pick the least-compared player, skipping recent pivots. The totals are
	    # taken BEFORE any masking and the recent pivots are masked in the
	    # totals themselves; masking whole columns first would turn every row
	    # sum into inf and make argmin return player 0 on every call.
	    row_totals = comparison_counts.sum(axis=1)
	    row_totals[recent_pivots] = np.inf
	    selected_player = int(np.argmin(row_totals))

	    RunningPivot.running_pivot.append(selected_player)
	    RunningPivot.running_pivot = RunningPivot.running_pivot[-5:]

	    # Recent pivots get an infinite count so they earn no exploration bonus
	    # as opponents.
	    comparison_counts[:, recent_pivots] = np.inf

	    # Uses the module-level environment rather than building a new one on
	    # every call.
	    trueskill_scores = np.array([trueskill_env.expose(r) for r in ratings])
	    trueskill_diff = np.abs(trueskill_scores - trueskill_scores[selected_player])
	    n = comparison_counts[selected_player]
	    ucb_scores = ucb_score(trueskill_diff, total_comparisons, n)

	    # Rank candidates by UCB score and drop the pivot explicitly so it can
	    # never be returned as its own opponent, even with few players.
	    ucb_scores[selected_player] = -np.inf
	    ranking = np.argsort(ucb_scores)
	    ranking = ranking[ranking != selected_player]

	    # Guard the k_group <= 1 case: a slice of [-0:] would return everyone.
	    num_opponents = max(k_group - 1, 0)
	    opponents = ranking[-num_opponents:].tolist() if num_opponents else []

	    # Group players
	    return [selected_player] + opponents