|
|
|
|
|
|
bool hasMaskedActions; |
|
|
|
bool hasValueEstimate; |
|
|
|
float[,] inputState; |
|
|
|
int[] inputPrevAction; |
|
|
|
int[,] inputPrevAction; |
|
|
|
List<float[,,,]> observationMatrixList; |
|
|
|
float[,] inputOldMemories; |
|
|
|
float[,] maskedActions; |
|
|
|
|
|
|
// Create the state tensor
|
|
|
|
if (hasPrevAction) |
|
|
|
{ |
|
|
|
inputPrevAction = new int[currentBatchSize]; |
|
|
|
int totalNumberActions = brain.brainParameters.vectorActionSize.Length; |
|
|
|
inputPrevAction = new int[currentBatchSize, totalNumberActions]; |
|
|
|
inputPrevAction[i] = Mathf.FloorToInt(actionList[0]); |
|
|
|
for (var j = 0 ; j < totalNumberActions; j++) |
|
|
|
{ |
|
|
|
inputPrevAction[i,j] = Mathf.FloorToInt(actionList[j]); |
|
|
|
} |
|
|
|
i++; |
|
|
|
} |
|
|
|
} |
|
|
|