Aimbot-PPO/Aimbot-PPO-Python/Tensorflow/rewardAIClass.py
Koha9 742529ccd7 Archive all tensorflow agents and env
archive all TF py&ipynb
turn face to pytorch.
2022-10-26 03:15:37 +09:00

58 lines
1.5 KiB
Python

import numpy as np
class rewardAI(object):
def __init__(
self,
nonReward,
shootReward,
shootWithoutReadyReward,
hitReward,
winReward,
loseReward,
killReward,
):
self.nonReward = nonReward
self.shootReward = shootReward
self.shootWithoutReadyReward = shootWithoutReadyReward
self.hitReward = hitReward
self.winReward = winReward
self.loseReward = loseReward
self.killReward = killReward
def getRewards(self, remainTime):
nonR = self.getnonReward()
shootR = self.getshootReward()
shootWithoutReadyR = self.getshootWithoutReadyReward()
hitR = self.gethitReward()
winR = self.getwinReward(remainTime)
loseR = self.getloseReward()
killR = self.getkillReward(remainTime)
rewards = np.array(
[[nonR, shootR, shootWithoutReadyR, hitR, winR, loseR, killR]],
dtype=np.float,
)
return rewards
def getnonReward(self):
return self.nonReward
def getshootReward(self):
return self.shootReward
def getshootWithoutReadyReward(self):
return self.shootWithoutReadyReward
def gethitReward(self):
return self.hitReward
def getwinReward(self, time):
return self.winReward + time
def getloseReward(self):
return self.loseReward
def getkillReward(self, time):
return self.killReward + time