summary refs log tree commit diff
path: root/models/cycle_gan_model.py
diff options
context:
space:
mode:
Diffstat (limited to 'models/cycle_gan_model.py')
-rw-r--r-- models/cycle_gan_model.py 143
1 files changed, 71 insertions, 72 deletions
diff --git a/models/cycle_gan_model.py b/models/cycle_gan_model.py
index 74771cf..fe06823 100644
--- a/models/cycle_gan_model.py
+++ b/models/cycle_gan_model.py
@@ -44,9 +44,9 @@ class CycleGANModel(BaseModel):
which_epoch = opt.which_epoch
self.load_network(self.netG_A, 'G_A', which_epoch)
self.load_network(self.netG_B, 'G_B', which_epoch)
- #if self.isTrain:
- # self.load_network(self.netD_A, 'D_A', which_epoch)
- # self.load_network(self.netD_B, 'D_B', which_epoch)
+ if self.isTrain:
+ self.load_network(self.netD_A, 'D_A', which_epoch)
+ self.load_network(self.netD_B, 'D_B', which_epoch)
if self.isTrain:
self.old_lr = opt.lr
@@ -77,8 +77,6 @@ class CycleGANModel(BaseModel):
networks.print_network(self.netD_B)
print('-----------------------------------------------')
- self.step_count = 0
-
def set_input(self, input):
AtoB = self.opt.which_direction == 'AtoB'
input_A = input['A' if AtoB else 'B']
@@ -86,20 +84,21 @@ class CycleGANModel(BaseModel):
self.input_A.resize_(input_A.size()).copy_(input_A)
self.input_B.resize_(input_B.size()).copy_(input_B)
self.image_paths = input['A_paths' if AtoB else 'B_paths']
- self.image_paths2 = input['B_paths' if AtoB else 'A_paths']
def forward(self):
self.real_A = Variable(self.input_A)
self.real_B = Variable(self.input_B)
def test(self):
- self.real_A = Variable(self.input_A, volatile=True)
- self.fake_B = self.netG_A.forward(self.real_A)
- self.rec_A = self.netG_B.forward(self.fake_B)
+ real_A = Variable(self.input_A, volatile=True)
+ fake_B = self.netG_A(real_A)
+ self.rec_A = self.netG_B(fake_B).data
+ self.fake_B = fake_B.data
- self.real_B = Variable(self.input_B, volatile=True)
- self.fake_A = self.netG_B.forward(self.real_B)
- self.rec_B = self.netG_A.forward(self.fake_A)
+ real_B = Variable(self.input_B, volatile=True)
+ fake_A = self.netG_B(real_B)
+ self.rec_B = self.netG_A(fake_A).data
+ self.fake_A = fake_A.data
# get image paths
def get_image_paths(self):
@@ -107,10 +106,10 @@ class CycleGANModel(BaseModel):
def backward_D_basic(self, netD, real, fake):
# Real
- pred_real = netD.forward(real)
+ pred_real = netD(real)
loss_D_real = self.criterionGAN(pred_real, True)
# Fake
- pred_fake = netD.forward(fake.detach())
+ pred_fake = netD(fake.detach())
loss_D_fake = self.criterionGAN(pred_fake, False)
# Combined loss
loss_D = (loss_D_real + loss_D_fake) * 0.5
@@ -120,11 +119,13 @@ class CycleGANModel(BaseModel):
def backward_D_A(self):
fake_B = self.fake_B_pool.query(self.fake_B)
- self.loss_D_A = self.backward_D_basic(self.netD_A, self.real_B, fake_B)
+ loss_D_A = self.backward_D_basic(self.netD_A, self.real_B, fake_B)
+ self.loss_D_A = loss_D_A.data[0]
def backward_D_B(self):
fake_A = self.fake_A_pool.query(self.fake_A)
- self.loss_D_B = self.backward_D_basic(self.netD_B, self.real_A, fake_A)
+ loss_D_B = self.backward_D_basic(self.netD_B, self.real_A, fake_A)
+ self.loss_D_B = loss_D_B.data[0]
def backward_G(self):
lambda_idt = self.opt.identity
@@ -133,51 +134,59 @@ class CycleGANModel(BaseModel):
# Identity loss
if lambda_idt > 0:
# G_A should be identity if real_B is fed.
- self.idt_A = self.netG_A.forward(self.real_B)
- self.loss_idt_A = self.criterionIdt(self.idt_A, self.real_B) * lambda_B * lambda_idt
+ idt_A = self.netG_A(self.real_B)
+ loss_idt_A = self.criterionIdt(idt_A, self.real_B) * lambda_B * lambda_idt
# G_B should be identity if real_A is fed.
- self.idt_B = self.netG_B.forward(self.real_A)
- self.loss_idt_B = self.criterionIdt(self.idt_B, self.real_A) * lambda_A * lambda_idt
+ idt_B = self.netG_B(self.real_A)
+ loss_idt_B = self.criterionIdt(idt_B, self.real_A) * lambda_A * lambda_idt
+
+ self.idt_A = idt_A.data
+ self.idt_B = idt_B.data
+ self.loss_idt_A = loss_idt_A.data[0]
+ self.loss_idt_B = loss_idt_B.data[0]
else:
+ loss_idt_A = 0
+ loss_idt_B = 0
self.loss_idt_A = 0
self.loss_idt_B = 0
-
- # GAN loss
- # D_A(G_A(A))
- self.fake_B = self.netG_A.forward(self.real_A)
- pred_fake = self.netD_A.forward(self.fake_B)
- self.loss_G_A = self.criterionGAN(pred_fake, True)
- # D_B(G_B(B))
- self.fake_A = self.netG_B.forward(self.real_B)
- pred_fake = self.netD_B.forward(self.fake_A)
- self.loss_G_B = self.criterionGAN(pred_fake, True)
+
+ # GAN loss D_A(G_A(A))
+ fake_B = self.netG_A(self.real_A)
+ pred_fake = self.netD_A(fake_B)
+ loss_G_A = self.criterionGAN(pred_fake, True)
+
+ # GAN loss D_B(G_B(B))
+ fake_A = self.netG_B(self.real_B)
+ pred_fake = self.netD_B(fake_A)
+ loss_G_B = self.criterionGAN(pred_fake, True)
# Forward cycle loss
- self.rec_A = self.netG_B.forward(self.fake_B)
- self.loss_cycle_A = self.criterionCycle(self.rec_A, self.real_A) * lambda_A
+ rec_A = self.netG_B(fake_B)
+ loss_cycle_A = self.criterionCycle(rec_A, self.real_A) * lambda_A
+
# Backward cycle loss
- self.rec_B = self.netG_A.forward(self.fake_A)
- self.loss_cycle_B = self.criterionCycle(self.rec_B, self.real_B) * lambda_B
+ rec_B = self.netG_A(fake_A)
+ loss_cycle_B = self.criterionCycle(rec_B, self.real_B) * lambda_B
# combined loss
- self.loss_G = self.loss_G_A + self.loss_G_B + self.loss_cycle_A + self.loss_cycle_B + self.loss_idt_A + self.loss_idt_B
- self.loss_G.backward()
+ loss_G = loss_G_A + loss_G_B + loss_cycle_A + loss_cycle_B + loss_idt_A + loss_idt_B
+ loss_G.backward()
+
+ self.fake_B = fake_B.data
+ self.fake_A = fake_A.data
+ self.rec_A = rec_A.data
+ self.rec_B = rec_B.data
+
+ self.loss_G_A = loss_G_A.data[0]
+ self.loss_G_B = loss_G_B.data[0]
+ self.loss_cycle_A = loss_cycle_A.data[0]
+ self.loss_cycle_B = loss_cycle_B.data[0]
def optimize_parameters(self):
- self.step_count += 1
# forward
self.forward()
# G_A and G_B
self.optimizer_G.zero_grad()
self.backward_G()
- if (self.loss_G != self.loss_G).sum().data[0] > 0:
- exit(1)
- #for w in self.netG_A.parameters():
- #print(w.grad.data)
- # if (w.grad.data != w.grad.data).sum() > 0:
- # print(w.grad.data)
- # exit(1)
- #print(self.image_paths, self.image_paths2)
- #return
self.optimizer_G.step()
# D_A
self.optimizer_D_A.zero_grad()
@@ -189,36 +198,26 @@ class CycleGANModel(BaseModel):
self.optimizer_D_B.step()
def get_current_errors(self):
- D_A = self.loss_D_A.data[0]
- G_A = self.loss_G_A.data[0]
- Cyc_A = self.loss_cycle_A.data[0]
- D_B = self.loss_D_B.data[0]
- G_B = self.loss_G_B.data[0]
- Cyc_B = self.loss_cycle_B.data[0]
+ ret_errors = OrderedDict([('D_A', self.loss_D_A), ('G_A', self.loss_G_A), ('Cyc_A', self.loss_cycle_A),
+ ('D_B', self.loss_D_B), ('G_B', self.loss_G_B), ('Cyc_B', self.loss_cycle_B)])
if self.opt.identity > 0.0:
- idt_A = self.loss_idt_A.data[0]
- idt_B = self.loss_idt_B.data[0]
- return OrderedDict([('D_A', D_A), ('G_A', G_A), ('Cyc_A', Cyc_A), ('idt_A', idt_A),
- ('D_B', D_B), ('G_B', G_B), ('Cyc_B', Cyc_B), ('idt_B', idt_B)])
- else:
- return OrderedDict([('D_A', D_A), ('G_A', G_A), ('Cyc_A', Cyc_A),
- ('D_B', D_B), ('G_B', G_B), ('Cyc_B', Cyc_B)])
+ ret_errors['idt_A'] = self.loss_idt_A
+ ret_errors['idt_B'] = self.loss_idt_B
+ return ret_errors
def get_current_visuals(self):
- real_A = util.tensor2im(self.real_A.data)
- fake_B = util.tensor2im(self.fake_B.data)
- rec_A = util.tensor2im(self.rec_A.data)
- real_B = util.tensor2im(self.real_B.data)
- fake_A = util.tensor2im(self.fake_A.data)
- rec_B = util.tensor2im(self.rec_B.data)
+ real_A = util.tensor2im(self.input_A)
+ fake_B = util.tensor2im(self.fake_B)
+ rec_A = util.tensor2im(self.rec_A)
+ real_B = util.tensor2im(self.input_B)
+ fake_A = util.tensor2im(self.fake_A)
+ rec_B = util.tensor2im(self.rec_B)
+ ret_visuals = OrderedDict([('real_A', real_A), ('fake_B', fake_B), ('rec_A', rec_A),
+ ('real_B', real_B), ('fake_A', fake_A), ('rec_B', rec_B)])
if self.opt.isTrain and self.opt.identity > 0.0:
- idt_A = util.tensor2im(self.idt_A.data)
- idt_B = util.tensor2im(self.idt_B.data)
- return OrderedDict([('real_A', real_A), ('fake_B', fake_B), ('rec_A', rec_A), ('idt_B', idt_B),
- ('real_B', real_B), ('fake_A', fake_A), ('rec_B', rec_B), ('idt_A', idt_A)])
- else:
- return OrderedDict([('real_A', real_A), ('fake_B', fake_B), ('rec_A', rec_A),
- ('real_B', real_B), ('fake_A', fake_A), ('rec_B', rec_B)])
+ ret_visuals['idt_A'] = util.tensor2im(self.idt_A)
+ ret_visuals['idt_B'] = util.tensor2im(self.idt_B)
+ return ret_visuals
def save(self, label):
self.save_network(self.netG_A, 'G_A', label, self.gpu_ids)