Skip to content

Commit 31be268

Browse files
author
centos Cloud User
committed
debugging cosypose training
1 parent f5f1faf commit 31be268

File tree

2 files changed

+42
-33
lines changed

2 files changed

+42
-33
lines changed

happypose/pose_estimators/cosypose/cosypose/training/train_pose.py

+38-32
Original file line number | Diff line number | Diff line change
@@ -422,44 +422,50 @@ def train_epoch():
422422
iterator = tqdm(ds_iter_train, ncols=80)
423423
t = time.time()
424424
for n, sample in enumerate(iterator):
425-
if n > 0:
426-
meters_time["data"].add(time.time() - t)
427-
428-
optimizer.zero_grad()
429-
430-
t = time.time()
431-
loss = h(data=sample, meters=meters_train)
432-
meters_time["forward"].add(time.time() - t)
433-
iterator.set_postfix(loss=loss.item())
434-
meters_train["loss_total"].add(loss.item())
435-
436-
t = time.time()
437-
loss.backward()
438-
total_grad_norm = torch.nn.utils.clip_grad_norm_(
439-
model.parameters(),
440-
max_norm=args.clip_grad_norm,
441-
norm_type=2,
442-
)
443-
meters_train["grad_norm"].add(torch.as_tensor(total_grad_norm).item())
444-
445-
optimizer.step()
446-
meters_time["backward"].add(time.time() - t)
447-
meters_time["memory"].add(
448-
torch.cuda.max_memory_allocated() / 1024.0**2,
449-
)
450-
451-
if epoch < args.n_epochs_warmup:
452-
lr_scheduler_warmup.step()
453-
t = time.time()
425+
if n < 5:
426+
if n > 0:
427+
meters_time["data"].add(time.time() - t)
428+
429+
optimizer.zero_grad()
430+
431+
t = time.time()
432+
loss = h(data=sample, meters=meters_train)
433+
meters_time["forward"].add(time.time() - t)
434+
iterator.set_postfix(loss=loss.item())
435+
meters_train["loss_total"].add(loss.item())
436+
437+
t = time.time()
438+
loss.backward()
439+
total_grad_norm = torch.nn.utils.clip_grad_norm_(
440+
model.parameters(),
441+
max_norm=args.clip_grad_norm,
442+
norm_type=2,
443+
)
444+
meters_train["grad_norm"].add(torch.as_tensor(total_grad_norm).item())
445+
446+
optimizer.step()
447+
meters_time["backward"].add(time.time() - t)
448+
meters_time["memory"].add(
449+
torch.cuda.max_memory_allocated() / 1024.0**2,
450+
)
451+
452+
if epoch < args.n_epochs_warmup:
453+
lr_scheduler_warmup.step()
454+
t = time.time()
455+
else:
456+
continue
454457
if epoch >= args.n_epochs_warmup:
455458
lr_scheduler.step()
456459

457460
@torch.no_grad()
458461
def validation():
459462
model.eval()
460-
for sample in tqdm(ds_iter_val, ncols=80):
461-
loss = h(data=sample, meters=meters_val)
462-
meters_val["loss_total"].add(loss.item())
463+
for n, sample in enumerate(tqdm(ds_iter_val, ncols=80)):
464+
if n < 5:
465+
loss = h(data=sample, meters=meters_val)
466+
meters_val["loss_total"].add(loss.item())
467+
else:
468+
continue
463469

464470
@torch.no_grad()
465471
def test():

happypose/toolbox/lib3d/transform.py

+4-1
Original file line number | Diff line number | Diff line change
@@ -74,7 +74,10 @@ def __init__(
7474
else:
7575
rotation_np = rotation
7676
else:
77-
raise ValueError
77+
if isinstance(rotation, list):
78+
rotation_np = np.array(rotation)
79+
else:
80+
raise ValueError
7881

7982
if rotation_np.size == 4:
8083
quaternion_xyzw = rotation_np.flatten().tolist()

0 commit comments

Comments
 (0)