kamangir
validating fashion_mnist train - kamangir/bolt#689
08b815a
raw
history blame
6.17 kB
from . import *
from abcli import file
from abcli import string
import cv2
import numpy as np
import os.path
import abcli.logging
import logging
logger = logging.getLogger(__name__)
def eval(input_path, output_path):
from sklearn.metrics import accuracy_score
report = {"accuracy": None}
success, ground_truth = file.load(f"{input_path}/test_labels.pyndarray")
if success:
logger.info(
"groundtruth: {} - {}".format(
string.pretty_shape_of_matrix(ground_truth),
",".join([str(value) for value in ground_truth[:10]] + ["..."]),
)
)
success, predictions = file.load(f"{input_path}/predictions.pyndarray")
if success:
predictions = np.argmax(predictions, axis=1).astype(np.uint8)
logger.info(
"predictions: {} - {}".format(
string.pretty_shape_of_matrix(predictions),
",".join([str(value) for value in predictions[:10]] + ["..."]),
)
)
report["accuracy"] = accuracy_score(predictions, ground_truth)
logger.info(
"image_classifier.eval({}->{}): {:.2f}%".format(
input_path, output_path, 100 * report["accuracy"]
)
)
return file.save_json(os.path.join(output_path, "evaluation_report.json"), report)
def preprocess(
output_path,
objects="",
infer_annotation=True,
purpose="predict",
test_size=1.0 / 6,
window_size=28,
):
if objects:
logger.info(
"image_classifier.preprocess({}{})->{} - {}x{} - for {}".format(
",".join(objects),
" + annotation" if infer_annotation else "",
output_path,
window_size,
window_size,
purpose,
)
)
annotations = []
list_of_images = []
for index, object in enumerate(objects):
list_of_images_ = [
"{}/Data/{}/camera.jpg".format(object, frame)
for frame in objects.list_of_frames(object)
]
annotations += len(list_of_images_) * [index]
list_of_images += list_of_images_
annotations = np.array(annotations) if infer_annotation else []
else:
logger.info(
"image_classifier.preprocess({}) - {}x{} - for {}".format(
output_path,
window_size,
window_size,
purpose,
)
)
list_of_images = [
"{}/Data/{}/camera.jpg".format(output_path, frame)
for frame in objects.list_of_frames(output_path)
]
annotations = np.array(
file.load_json(
f"{output_path}/annotations.json".format(),
civilized=True,
default=None,
)[1]
).astype(np.uint8)
if len(annotations) and len(list_of_images) != len(annotations):
logger.error(
f"-{name}: preprocess: mismatch between frame and annotation counts: {len(list_of_images):,g} != {len(annotations):,g}"
)
return False
logger.info("{:,} frame(s)".format(len(list_of_images)))
tensor = np.zeros(
(len(list_of_images), window_size, window_size, 3),
dtype=np.uint8,
)
error_count = 0
for index, filename in enumerate(list_of_images):
logger.info("+= {}".format(filename))
success_, image = file.load_image(filename)
if success_:
try:
tensor[index, :, :, :] = cv2.resize(image, (window_size, window_size))
except:
from abcli.logging import crash_report
crash_report("image_classifier.preprocess() failed")
success_ = False
if not success_:
error_count += 1
logger.info(
"tensor: {}{}".format(
string.pretty_shape_of_matrix(tensor),
" {} error(s)".format(error_count) if error_count else "",
)
)
success = False
if purpose == "predict":
if not file.save("{}/test_images.pyndarray".format(output_path), tensor):
return False
if len(annotations):
if not file.save(
"{}/test_labels.pyndarray".format(output_path), annotations
):
return False
success = True
elif purpose == "train":
if not len(annotations):
logger.error(f"-{name}: preprocess: annotations are not provided.")
return False
from sklearn.model_selection import train_test_split
(
tensor_train,
tensor_test,
annotations_train,
annotations_test,
) = train_test_split(tensor, annotations, test_size=test_size)
logger.info(
"test-train split: {:.0f}%-{:.0f}% ".format(
len(annotations_test) / len(annotations) * 100,
len(annotations_train) / len(annotations) * 100,
)
)
logger.info(
"tensor_train: {}".format(string.pretty_shape_of_matrix(tensor_train))
)
logger.info(
"tensor_test: {}".format(string.pretty_shape_of_matrix(tensor_test))
)
logger.info(
"annotations_train: {}".format(
string.pretty_shape_of_matrix(annotations_train)
)
)
logger.info(
"annotations_test: {}".format(
string.pretty_shape_of_matrix(annotations_test)
)
)
success = (
file.save("{}/train_images.pyndarray".format(output_path), tensor_train)
and file.save("{}/test_images.pyndarray".format(output_path), tensor_test)
and file.save(
"{}/train_labels.pyndarray".format(output_path), annotations_train
)
and file.save(
"{}/test_labels.pyndarray".format(output_path), annotations_test
)
)
else:
logger.error(f"-{name}: preprocess: {purpose}: purpose not found.")
return success