import numpy as np class rewardAI(object): def __init__( self, nonReward, shootReward, shootWithoutReadyReward, hitReward, winReward, loseReward, killReward, ): self.nonReward = nonReward self.shootReward = shootReward self.shootWithoutReadyReward = shootWithoutReadyReward self.hitReward = hitReward self.winReward = winReward self.loseReward = loseReward self.killReward = killReward def getRewards(self, remainTime): nonR = self.getnonReward() shootR = self.getshootReward() shootWithoutReadyR = self.getshootWithoutReadyReward() hitR = self.gethitReward() winR = self.getwinReward(remainTime) loseR = self.getloseReward() killR = self.getkillReward(remainTime) rewards = np.array( [[nonR, shootR, shootWithoutReadyR, hitR, winR, loseR, killR]], dtype=np.float, ) return rewards def getnonReward(self): return self.nonReward def getshootReward(self): return self.shootReward def getshootWithoutReadyReward(self): return self.shootWithoutReadyReward def gethitReward(self): return self.hitReward def getwinReward(self, time): return self.winReward + time def getloseReward(self): return self.loseReward def getkillReward(self, time): return self.killReward + time