# Copyright (c) Open-CD. All rights reserved.
import logging
from collections import OrderedDict
from typing import Any, Dict, List, Optional, Sequence, Tuple

import numpy as np
import torch
from mmengine.dist import (broadcast_object_list, collect_results,
                           is_main_process)
from mmengine.evaluator.metric import _to_cpu
from mmengine.logging import MMLogger, print_log
from prettytable import PrettyTable

from mmseg.evaluation import IoUMetric

from opencd.registry import METRICS


@METRICS.register_module()
class SCDMetric(IoUMetric):
"""Change Detection evaluation metric.
Args:
prefix (str, optional): The prefix that will be added in the metric
names to disambiguate homonymous metrics of different evaluators.
If prefix is not provided in the argument, self.default_prefix
will be used instead. Defaults to 'binary'.
semantic_prefix (str, optional): The prefix that will be added in the
metric names to disambiguate homonymous metrics of different
evaluators. Defaults to 'semantic'.
        cal_sek (bool): Whether to calculate the separated kappa (SeK)
            coefficient. Defaults to False.
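
    Examples:
        >>> # A minimal construction sketch; ``iou_metrics`` is the keyword
        >>> # inherited from mmseg's ``IoUMetric``.
        >>> metric = SCDMetric(iou_metrics=['mFscore', 'mIoU'], cal_sek=True)
        >>> metric.cal_sek
        True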
"""

    def __init__(self,
prefix: Optional[str] = 'binary',
semantic_prefix: Optional[str] = 'semantic',
cal_sek: bool = False,
**kwargs) -> None:
super().__init__(prefix=prefix, **kwargs)
self.semantic_results: List[Any] = []
self.semantic_prefix = semantic_prefix
self.cal_sek = cal_sek

    def process(self, data_batch: dict, data_samples: Sequence[dict]) -> None:
        """Process one batch of data and data_samples.

        The processed results should be stored in ``self.results``, which will
        be used to compute the metrics when all batches have been processed.

        Args:
            data_batch (dict): A batch of data from the dataloader.
            data_samples (Sequence[dict]): A batch of outputs from the model.
        """
num_classes = len(self.dataset_meta['classes'])
num_semantic_classes = len(self.dataset_meta['semantic_classes'])
for data_sample in data_samples:
pred_label = data_sample['pred_sem_seg']['data'].squeeze()
label = data_sample['gt_sem_seg']['data'].squeeze().to(pred_label)
pred_label_from = data_sample['pred_sem_seg_from']['data'].squeeze()
label_from = data_sample['gt_sem_seg_from']['data'].squeeze().to(pred_label_from)
pred_label_to = data_sample['pred_sem_seg_to']['data'].squeeze()
label_to = data_sample['gt_sem_seg_to']['data'].squeeze().to(pred_label_to)
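            # ``intersect_and_union`` (inherited from ``IoUMetric``) returns a
            # 4-tuple of 1-D per-class tensors:
            # (area_intersect, area_union, area_pred_label, area_label).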
self.results.append(
self.intersect_and_union(pred_label, label, num_classes,
self.ignore_index))
# for semantic pred
self.semantic_results.append(
self.intersect_and_union(pred_label_from, label_from, num_semantic_classes,
self.ignore_index))
self.semantic_results.append(
self.intersect_and_union(pred_label_to, label_to, num_semantic_classes,
self.ignore_index))

    def get_sek(self, results: list) -> np.ndarray:
        """Calculate the SeK (separated kappa) value.

        Args:
            results (list[tuple[torch.Tensor]]): Per-image evaluation results
                for computing the evaluation metric.

        Returns:
            np.ndarray: The SeK value.
        """
assert len(results) == 4
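        # ``hist_00`` is the number of pixels correctly predicted as the
        # "no-change" class (index 0); it is removed from the totals below so
        # that kappa is computed over changed regions only.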
hist_00 = sum(results[0])[0]
hist_00_list = torch.zeros(len(results[0][0]))
hist_00_list[0] = hist_00
total_area_intersect = sum(results[0]) - hist_00_list
total_area_pred_label = sum(results[2]) - hist_00_list
total_area_label = sum(results[3]) - hist_00_list
# foreground
fg_intersect_sum = total_area_label[1:].sum(
) - total_area_pred_label[0]
fg_area_union_sum = total_area_label.sum()
po = total_area_intersect.sum() / total_area_label.sum()
pe = (total_area_label * total_area_pred_label).sum() / \
total_area_pred_label.sum() ** 2
kappa0 = (po - pe) / (1 - pe)
        # `iou_fg` is equal to the binary `changed` IoU.
iou_fg = fg_intersect_sum / fg_area_union_sum
sek = (kappa0 * torch.exp(iou_fg)) / torch.e
return sek.numpy() # consistent with other metrics.
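
    # For reference, the computation above amounts to
    #
    #     kappa0 = (po - pe) / (1 - pe)
    #     SeK = kappa0 * exp(iou_fg) / e = kappa0 * exp(iou_fg - 1)
    #
    # i.e. a kappa coefficient with the (no-change, no-change) bin excluded,
    # scaled by the exponential of the binary "changed" IoU.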

    def compute_metrics(self, binary_results: list, semantic_results: list
                        ) -> Tuple[Dict[str, float], Dict[str, float]]:
        """Compute the metrics from processed results.

        Args:
            binary_results (list): The processed binary (change) results of
                each batch.
            semantic_results (list): The processed semantic results of each
                batch.

        Returns:
            Tuple[Dict[str, float], Dict[str, float]]: The computed binary and
                semantic metrics. The keys are the metric names and the values
                are the corresponding results, mainly including aAcc, mIoU,
                mAcc, mDice, mFscore, mPrecision and mRecall (plus Sek and
                SCD_Score for the semantic metrics when ``cal_sek=True``).
        """
logger: MMLogger = MMLogger.get_current_instance()
# convert list of tuples to tuple of lists, e.g.
# [(A_1, B_1, C_1, D_1), ..., (A_n, B_n, C_n, D_n)] to
# ([A_1, ..., A_n], ..., [D_1, ..., D_n])
binary_results = tuple(zip(*binary_results))
semantic_results = tuple(zip(*semantic_results))
assert len(binary_results) == 4 and len(semantic_results) == 4
# for binary results
binary_total_area_intersect = sum(binary_results[0])
binary_total_area_union = sum(binary_results[1])
binary_total_area_pred_label = sum(binary_results[2])
binary_total_area_label = sum(binary_results[3])
binary_ret_metrics = self.total_area_to_metrics(
binary_total_area_intersect, binary_total_area_union, binary_total_area_pred_label,
binary_total_area_label, self.metrics, self.nan_to_num, self.beta)
binary_class_names = self.dataset_meta['classes']
# summary table
binary_ret_metrics_summary = OrderedDict({
ret_metric: np.round(np.nanmean(ret_metric_value) * 100, 2)
for ret_metric, ret_metric_value in binary_ret_metrics.items()
})
binary_metrics = dict()
for key, val in binary_ret_metrics_summary.items():
if key == 'aAcc':
binary_metrics[key] = val
else:
binary_metrics['m' + key] = val
# each class table
binary_ret_metrics.pop('aAcc', None)
binary_ret_metrics_class = OrderedDict({
ret_metric: np.round(ret_metric_value * 100, 2)
for ret_metric, ret_metric_value in binary_ret_metrics.items()
})
binary_ret_metrics_class.update({'Class': binary_class_names})
binary_ret_metrics_class.move_to_end('Class', last=False)
binary_class_table_data = PrettyTable()
for key, val in binary_ret_metrics_class.items():
binary_class_table_data.add_column(key, val)
print_log('per binary class results:', logger)
print_log('\n' + binary_class_table_data.get_string(), logger=logger)
# for semantic results
semantic_total_area_intersect = sum(semantic_results[0])
semantic_total_area_union = sum(semantic_results[1])
semantic_total_area_pred_label = sum(semantic_results[2])
semantic_total_area_label = sum(semantic_results[3])
semantic_ret_metrics = self.total_area_to_metrics(
semantic_total_area_intersect, semantic_total_area_union, semantic_total_area_pred_label,
semantic_total_area_label, self.metrics, self.nan_to_num, self.beta)
semantic_class_names = self.dataset_meta['semantic_classes']
# summary table
semantic_ret_metrics_summary = OrderedDict({
ret_metric: np.round(np.nanmean(ret_metric_value) * 100, 2)
for ret_metric, ret_metric_value in semantic_ret_metrics.items()
})
# for semantic change detection
if self.cal_sek:
sek = self.get_sek(semantic_results)
semantic_ret_metrics_summary.update({'Sek': np.round(sek * 100, 2)})
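            # SCD_Score combines the binary mIoU and SeK as
            # 0.3 * mIoU + 0.7 * SeK (both on a 0-100 scale here).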
semantic_ret_metrics_summary.update({'SCD_Score': \
np.round(0.3 * binary_ret_metrics_summary['IoU'] + 0.7 * sek * 100, 2)})
semantic_metrics = dict()
for key, val in semantic_ret_metrics_summary.items():
if key in ['aAcc', 'Sek', 'SCD_Score']:
semantic_metrics[key] = val
else:
semantic_metrics['m' + key] = val
# each class table
semantic_ret_metrics.pop('aAcc', None)
semantic_ret_metrics_class = OrderedDict({
ret_metric: np.round(ret_metric_value * 100, 2)
for ret_metric, ret_metric_value in semantic_ret_metrics.items()
})
semantic_ret_metrics_class.update({'Class': semantic_class_names})
semantic_ret_metrics_class.move_to_end('Class', last=False)
semantic_class_table_data = PrettyTable()
for key, val in semantic_ret_metrics_class.items():
semantic_class_table_data.add_column(key, val)
print_log('per semantic class results:', logger)
print_log('\n' + semantic_class_table_data.get_string(), logger=logger)
return binary_metrics, semantic_metrics

    def evaluate(self, size: int) -> dict:
        """Evaluate the model performance of the whole dataset after
        processing all batches.

        Args:
            size (int): Length of the entire validation dataset. When batch
                size > 1, the dataloader may pad some data samples to make
                sure all ranks have the same length of dataset slice. The
                ``collect_results`` function will drop the padded data based
                on this size.

        Returns:
            dict: Evaluation metrics dict on the val dataset. The keys are the
                names of the metrics, and the values are corresponding
                results.
        """
if len(self.results) == 0:
print_log(
f'{self.__class__.__name__} got empty `self.results`. Please '
'ensure that the processed results are properly added into '
'`self.results` in `process` method.',
logger='current',
level=logging.WARNING)
if len(self.semantic_results) == 0:
print_log(
f'{self.__class__.__name__} got empty `self.semantic_results`. '
'Please ensure that the processed results are properly added '
'into `self.semantic_results` in `process` method.',
logger='current',
level=logging.WARNING)
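        # ``process`` appends two semantic entries per image (the "from" and
        # "to" maps), so the semantic results are collected with ``size * 2``.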
        binary_results = collect_results(self.results, size,
                                         self.collect_device)
        semantic_results = collect_results(self.semantic_results, size * 2,
                                           self.collect_device)
if is_main_process():
# cast all tensors in results list to cpu
binary_results = _to_cpu(binary_results)
semantic_results = _to_cpu(semantic_results)
_binary_metrics, _semantic_metrics = \
self.compute_metrics(binary_results, semantic_results) # type: ignore
# Add prefix to metric names
if self.prefix:
_binary_metrics = {
'/'.join((self.prefix, k)): v
for k, v in _binary_metrics.items()
}
_semantic_metrics = {
'/'.join((self.semantic_prefix, k)): v
for k, v in _semantic_metrics.items()
}
_metrics = {**_binary_metrics, **_semantic_metrics}
metrics = [_metrics]
else:
metrics = [None] # type: ignore
broadcast_object_list(metrics)
# reset the results list
self.results.clear()
self.semantic_results.clear()
return metrics[0]
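
# A hypothetical config snippet (not part of this module) showing how the
# metric is typically wired into an mmengine-style evaluator:
#
#     val_evaluator = dict(
#         type='SCDMetric',
#         iou_metrics=['mFscore', 'mIoU'],
#         cal_sek=True)
#
# With the default prefixes, the reported keys then look like
# ``binary/mIoU``, ``semantic/mIoU`` and ``semantic/Sek``.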