Refinement

2020-05-13 13:08:00 -05:00 · 2020-05-13 13:08:00 -05:00 · 1a48af157d
parent 131607a3f9
commit 1a48af157d
3 changed files with 10 additions and 90 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -25,4 +25,4 @@ yarn-error.log*
 db.sqlite3
 __pycache__
 *.swp
-/uploaded_agents
+uploaded_agents
--- a/server/media/uploaded_agents/example_model.py
+++ b/server/media/uploaded_agents/example_model.py
@@ -1,84 +0,0 @@
-''' Leduc Hold 'em rule model
-'''
-import rlcard
-from rlcard.models.model import Model
-
-class LeducHoldemRuleAgentV2(object):
-    ''' Leduc Hold 'em Rule agent version 2
-    '''
-    def __init__(self):
-        self.use_raw = True
-
-    def step(self, state):
-        ''' Predict the action when given raw state. A simple rule-based AI.
-        Args:
-            state (dict): Raw state from the game
-
-        Returns:
-            action (str): Predicted action
-        '''
-        legal_actions = state['raw_legal_actions']
-        state = state['raw_obs']
-        hand = state['hand']
-        public_card = state['public_card']
-        action = 'fold'
-        '''
-        When having only 2 hand cards at the game start, choose fold to drop terrible cards:
-        Acceptable hand cards:
-        Pairs
-        AK, AQ, AJ, AT
-        A9s, A8s, ... A2s(s means flush)
-        KQ, KJ, QJ, JT
-        Fold all hand types except those mentioned above to save money
-        '''
-        if public_card:
-            if public_card[1] == hand[1]:
-                action = 'raise'
-            else:
-                action = 'fold'
-        else:
-            if hand[0] == 'K':
-                action = 'raise'
-            elif hand[0] == 'Q':
-                action = 'check'
-            else:
-                action = 'fold'
-
-        #return action
-        if action in legal_actions:
-            return action
-        else:
-            if action == 'raise':
-                return 'call'
-            if action == 'check':
-                return 'fold'
-            if action == 'call':
-                return 'raise'
-            else:
-                return action
-
-    def eval_step(self, state):
-        return self.step(state), []
-
-class LeducHoldemRuleModelV2(Model):
-    ''' Leduc holdem Rule Model version 2
-    '''
-
-    def __init__(self):
-        ''' Load pretrained model
-        '''
-        env = rlcard.make('leduc-holdem')
-        rule_agent = LeducHoldemRuleAgentV2()
-        self.rule_agents = [rule_agent for _ in range(env.player_num)]
-
-    @property
-    def agents(self):
-        ''' Get a list of agents for each position in a the game
-
-        Returns:
-            agents (list): A list of agents
-
-        Note: Each agent should be just like RL agent with step and eval_step
-              functioning well.
-        '''
-        return self.rule_agents
--- a/server/tournament/views.py
+++ b/server/tournament/views.py
@@ -16,7 +16,7 @@ from .models import Game, Payoff, UploadedAgent

 from .tournament import Tournament

-def reset_model_ids():
+def _reset_model_ids():
    from .rlcard_wrap import rlcard, MODEL_IDS
    agents = UploadedAgent.objects.all()
    for agent in agents:
@@ -69,8 +69,12 @@ def query_payoff(request):
 @transaction.atomic
 def launch(request):
    if request.method == 'GET':
+        try:
            eval_num = int(request.GET['eval_num'])
            game = request.GET['name']
+        except:
+            return HttpResponse(json.dumps({'value': -1, 'info': 'parameters error'}))
+
        games_data, payoffs_data = Tournament(game, MODEL_IDS[game], eval_num).launch()
        Game.objects.filter(name=game).delete()
        Payoff.objects.filter(name=game).delete()
@@ -103,7 +107,7 @@ def upload_agent(request):

        a = UploadedAgent(name=name, game=game, f=f, entry=entry)
        a.save()
-        reset_model_ids()
+        _reset_model_ids()
        return HttpResponse(json.dumps({'value': 0, 'info': 'success'}))

 def delete_agent(request):
@@ -113,7 +117,7 @@ def delete_agent(request):
            return HttpResponse(json.dumps({'value': -1, 'info': 'name not exists'}))

        UploadedAgent.objects.filter(name=name).delete()
-        reset_model_ids()
+        _reset_model_ids()
        return HttpResponse(json.dumps({'value': 0, 'info': 'success'}))

 def list_agents(request):