From ca5eef10339500454c57b0c4a6d1556184116277 Mon Sep 17 00:00:00 2001 From: Duzeyao <330501241@qq.com> Date: Fri, 25 Oct 2019 23:49:27 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E6=94=B9gradient=20accumulation?= =?UTF-8?q?=E4=B8=8Bloss=E8=AE=A1=E7=AE=97=E9=80=BB=E8=BE=91?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- train.py | 2 +- train_single.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/train.py b/train.py index a7cbad4..7cebdd0 100644 --- a/train.py +++ b/train.py @@ -221,7 +221,7 @@ def main(): step + 1, piece_num, epoch + 1, - running_loss * gradient_accumulation / log_step)) + running_loss / log_step)) running_loss = 0 piece_num += 1 diff --git a/train_single.py b/train_single.py index d312ab6..dd06dc3 100644 --- a/train_single.py +++ b/train_single.py @@ -197,7 +197,7 @@ def main(): (step + 1) // gradient_accumulation, piece_num, epoch + 1, - running_loss * gradient_accumulation / log_step)) + running_loss / log_step)) running_loss = 0 piece_num += 1