"""
Plotting utilities to visualize training logs.
"""
import torch
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt

from pathlib import Path, PurePath


def plot_logs(logs, fields=('class_error', 'loss_bbox_unscaled', 'mAP'), ewm_col=0, log_name='log.txt'):
    '''
    Function to plot specific fields from training log(s). Plots both training and test results.

    :: Inputs - logs = list containing Path objects, each pointing to an individual dir with a log file
              - fields = which results to plot from each log file - plots both training and test for each field
              - ewm_col = optional, center of mass (com) used for the exponential weighted smoothing of the plots
              - log_name = optional, name of log file if different than default 'log.txt'

    :: Outputs - matplotlib plots of results in fields, color coded for each log file
               - solid lines are training results, dashed lines are test results

    '''
    func_name = "plot_utils.py::plot_logs"

    # Verify that logs is a list of Path objects (list[Path]) or a single Path;
    # convert a single Path to a one-element list to avoid a 'not iterable' error.
    if not isinstance(logs, list):
        if isinstance(logs, PurePath):
            logs = [logs]
            print(f"{func_name} info: logs param expects a list argument, converted to list[Path].")
        else:
            raise ValueError(f"{func_name} - invalid argument for logs parameter.\n"
                             f"Expect list[Path] or single Path obj, received {type(logs)}")

    # Quality checks - verify that every entry is a Path to an existing dir and that log_name exists in it.
    for dir in logs:
        if not isinstance(dir, PurePath):
            raise ValueError(f"{func_name} - non-Path object in logs argument of {type(dir)}: \n{dir}")
        if not dir.exists():
            raise ValueError(f"{func_name} - invalid directory in logs argument:\n{dir}")

        fn = Path(dir / log_name)
        if not fn.exists():
            print(f"-> missing {log_name}. Have you gotten to Epoch 1 in training?")
            print(f"--> full path of missing log file: {fn}")
            return

    # Each log file is newline-delimited JSON: one dict of metrics per epoch.
    dfs = [pd.read_json(Path(p) / log_name, lines=True) for p in logs]

    fig, axs = plt.subplots(ncols=len(fields), figsize=(16, 5))

    for df, color in zip(dfs, sns.color_palette(n_colors=len(logs))):
        for j, field in enumerate(fields):
            if field == 'mAP':
                # test_coco_eval_bbox holds the 12 COCO metrics per epoch; column 1 is AP at IoU=0.50.
                coco_eval = pd.DataFrame(
                    np.stack(df.test_coco_eval_bbox.dropna().values)[:, 1]
                ).ewm(com=ewm_col).mean()
                axs[j].plot(coco_eval, c=color)
            else:
                df.interpolate().ewm(com=ewm_col).mean().plot(
                    y=[f'train_{field}', f'test_{field}'],
                    ax=axs[j],
                    color=[color] * 2,
                    style=['-', '--']
                )

    for ax, field in zip(axs, fields):
        if field == 'mAP':
            ax.legend([Path(p).name for p in logs])
            ax.set_title(field)
        else:
            ax.legend(['train', 'test'])
            ax.set_title(field)

    return fig, axs


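# Example usage of plot_logs (illustrative sketch only; the directory names below are
# hypothetical placeholders, and the import path depends on where this module lives):
#
#     from pathlib import Path
#     from plot_utils import plot_logs
#
#     log_dirs = [Path('outputs/run_a'), Path('outputs/run_b')]  # dirs containing log.txt
#     fig, axs = plot_logs(log_dirs)
#     fig.savefig('training_curves.png')

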
def plot_precision_recall(files, naming_scheme='iter'):
    if naming_scheme == 'exp_id':
        # name becomes exp_id
        names = [f.parts[-3] for f in files]
    elif naming_scheme == 'iter':
        names = [f.stem for f in files]
    else:
        raise ValueError(f'not supported {naming_scheme}')
    fig, axs = plt.subplots(ncols=2, figsize=(16, 5))
    for f, color, name in zip(files, sns.color_palette("Blues", n_colors=len(files)), names):
        data = torch.load(f)
        # precision is indexed as [iou, recall, cls, area range, max dets]
        precision = data['precision']
        recall = data['params'].recThrs
        scores = data['scores']
        # take precision at IoU=0.5 for all areas and 100 detections, averaged over classes
        precision = precision[0, :, :, 0, -1].mean(1)
        scores = scores[0, :, :, 0, -1].mean(1)
        prec = precision.mean()
        rec = data['recall'][0, :, 0, -1].mean()
        print(f'{naming_scheme} {name}: mAP@50={prec * 100: 05.1f}, ' +
              f'score={scores.mean():0.3f}, ' +
              f'f1={2 * prec * rec / (prec + rec + 1e-8):0.3f}'
              )
        axs[0].plot(recall, precision, c=color)
        axs[1].plot(recall, scores, c=color)

    axs[0].set_title('Precision / Recall')
    axs[0].legend(names)
    axs[1].set_title('Scores / Recall')
    axs[1].legend(names)
    return fig, axs
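

if __name__ == "__main__":
    # Minimal demo sketch, not part of the original utilities: the paths below are
    # hypothetical placeholders -- point them at a real training output directory that
    # contains log.txt and (optionally) an eval/ folder of torch-saved COCO eval results.
    demo_dir = Path("outputs/run_a")  # hypothetical output directory

    if (demo_dir / "log.txt").exists():
        plot_logs([demo_dir])

    eval_files = sorted((demo_dir / "eval").glob("*.pth"))  # hypothetical eval dumps
    if eval_files:
        plot_precision_recall(eval_files, naming_scheme="iter")

    plt.show()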