Skip to content

Commit a292765

Browse files
committed
[AttentionTraining] Fixed PR Comments
1 parent 5502d04 commit a292765

File tree

5 files changed

+11
-13
lines changed

5 files changed

+11
-13
lines changed

Deeploy/Targets/Generic/Layers.py

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -479,10 +479,6 @@ class SGDLayer(ONNXLayer):
479479
def __init__(self, maps: List[NodeMapper]):
480480
super().__init__(maps)
481481

482-
def computeOps(self):
483-
484-
size = self.mapper.parser.operatorRepresentation['size']
485-
return size * 2
486482

487483

488484
class LinearAttentionLayer(ONNXLayer):

Deeploy/Targets/PULPOpen/Bindings.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -190,8 +190,7 @@
190190
FloatAddTemplate.referenceTemplate, ForkTransformer)
191191
] + [
192192
NodeBinding(
193-
AddChecker([PointerClass(float32_t), PointerClass(float32_t),
194-
PointerClass(float32_t)], [PointerClass(float32_t)]), FloatAddTemplate.referenceTemplate,
193+
AddChecker([PointerClass(float32_t), PointerClass(float32_t)], [PointerClass(float32_t)]), FloatAddTemplate.referenceTemplate,
195194
ForkTransformer)
196195
]
197196

Deeploy/Targets/PULPOpen/Templates/FloatLayernormTemplate.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -33,9 +33,9 @@
3333
int32_t ${nodeName}_elem_end = ${nodeName}_end * ${lastDimLength};
3434
int32_t ${nodeName}_elem_count = ${nodeName}_elem_end - ${nodeName}_elem_start;
3535
36-
const float* ${nodeName}_grad_in_ptr = ${grad_in} + ${nodeName}_elem_start;
37-
const float* ${nodeName}_data_in_ptr = ${data_in} + ${nodeName}_elem_start;
38-
float* ${nodeName}_grad_out_ptr = ${grad_out} + ${nodeName}_elem_start;
36+
const float${grad_in_type.referencedType.typeWidth}_t* ${nodeName}_grad_in_ptr = ${grad_in} + ${nodeName}_elem_start;
37+
const float${data_in_type.referencedType.typeWidth}_t* ${nodeName}_data_in_ptr = ${data_in} + ${nodeName}_elem_start;
38+
float${grad_out_type.referencedType.typeWidth}_t* ${nodeName}_grad_out_ptr = ${grad_out} + ${nodeName}_elem_start;
3939
4040
if (${nodeName}_elem_count > 0) {
4141
LayernormGrad_fp${grad_in_type.referencedType.typeWidth}_fp${grad_out_type.referencedType.typeWidth}(

Deeploy/Targets/PULPOpen/Templates/SGDTemplate.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -9,9 +9,9 @@
99
// (Name: ${nodeName}, Op: ${nodeOp})
1010
int8_t ${nodeName}_core_id = pi_core_id();
1111
int8_t ${nodeName}_log2Core = log2(NUM_CORES);
12-
int16_t ${nodeName}_chunk = (${size} >> ${nodeName}_log2Core) + ((${size} & (NUM_CORES-1))!=0);
13-
int16_t ${nodeName}_chunk_start = MIN(${nodeName}_chunk*${nodeName}_core_id, ${size});
14-
int16_t ${nodeName}_chunk_stop = MIN(${nodeName}_chunk_start + ${nodeName}_chunk, ${size});
12+
int32_t ${nodeName}_chunk = (${size} >> ${nodeName}_log2Core) + ((${size} & (NUM_CORES-1))!=0);
13+
int32_t ${nodeName}_chunk_start = MIN(${nodeName}_chunk*${nodeName}_core_id, ${size});
14+
int32_t ${nodeName}_chunk_stop = MIN(${nodeName}_chunk_start + ${nodeName}_chunk, ${size});
1515
1616
${weight_type.typeName} ref_${weight} = ${weight};
1717
${grad_type.typeName} ref_${grad} = ${grad};

Deeploy/Targets/PULPOpen/TileConstraints/GEMMTileConstraint.py

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -193,10 +193,12 @@ class FloatGEMMTileConstraint(TileConstraint):
193193
@staticmethod
194194
def addGeometricalConstraint(tilerModel: TilerModel, parseDict: Dict, ctxt: NetworkContext) -> TilerModel:
195195

196+
# Get to-be-tiled tensor's buffers
196197
bufferA = ctxt.lookup(name = parseDict['A'])
197198
bufferB = ctxt.lookup(name = parseDict['B'])
198199
outputBuffer = ctxt.lookup(name = parseDict['data_out'])
199200

201+
# Add I/O dimensions to the model as variables
200202
has_bias = 'C' in parseDict and parseDict['C'] is not None
201203
bufferC = None
202204
if has_bias:
@@ -222,9 +224,11 @@ def addGeometricalConstraint(tilerModel: TilerModel, parseDict: Dict, ctxt: Netw
222224
outputFirstDimVar = tilerModel.getTensorDimVar(tensorName = outputBuffer.name, dimIdx = dimOffsetOut)
223225
outputSecondDimVar = tilerModel.getTensorDimVar(tensorName = outputBuffer.name, dimIdx = dimOffsetOut + 1)
224226

227+
# Map output dims to inputs dims
225228
tilerModel.addConstraint(outputFirstDimVar == AFirstDimVar)
226229
tilerModel.addConstraint(outputSecondDimVar == BSecondDimVar)
227230

231+
# Add GEMM Geometrical constraints
228232
tilerModel.addConstraint(ASecondDimVar == BFirstDimVar)
229233

230234
# Add bias constraints only if bias is present
@@ -287,7 +291,6 @@ def serializeTilingSolution(
287291
transB = operatorRepresentation['transB']
288292

289293
varA = operatorRepresentation['A']
290-
varB = operatorRepresentation['B']
291294

292295
if transA == 0:
293296
NSize = ctxt.lookup(varA).shape[-1]

0 commit comments

Comments
 (0)