diff --git a/src/PTQ/PTQ.cpp b/src/PTQ/PTQ.cpp index 4c581feeb48c3ca0a819c47d75edb701f8b5499a..edc624bffa26f7a15ace8332ecbe98eb920aa121 100644 --- a/src/PTQ/PTQ.cpp +++ b/src/PTQ/PTQ.cpp @@ -818,11 +818,9 @@ void normalizeActivations(std::shared_ptr<GraphView> graphView, std::unordered_m // If prevNode is Affine, fix the bias ... - if (isAffine(prevNode)) { - if (nodeHasBias(prevNode)) { - insertScalingBelowProducer(prevNode->getParent(2), 1.0 / prevRatio, graphView); - } - } + if (isAffine(prevNode)) + if (nodeHasBias(prevNode)) + multiplyScalingFactor(prevNode->getParent(2), 1.0 / prevRatio); } // Merging nodes handling : use a maximum arbritration ... @@ -873,7 +871,6 @@ void normalizeActivations(std::shared_ptr<GraphView> graphView, std::unordered_m multiplyScalingFactor(prevScalingNode, prevRatio); } - } }