Skip to content

Commit

Permalink
Merge pull request #406 from CosmiQ/dev
Browse files Browse the repository at this point in the history
Version 0.4.0
  • Loading branch information
dphogan committed Aug 21, 2020
2 parents a6e8d48 + 07a22d4 commit e596041
Show file tree
Hide file tree
Showing 8 changed files with 443 additions and 14 deletions.
13 changes: 13 additions & 0 deletions CHANGELOG.md
Expand Up @@ -25,6 +25,19 @@ When a new version of `solaris` is released, all of the changes in the Unrelease

---

## Version 0.4.0

### Added
- 20200803, jshermeyer: Added mAP metric
- 20200701, dphogan: Added SpaceNet Change and Object Tracking (SCOT) metric
### Removed
### Changed
### Fixed
### Deprecated
### Security

---

## Version 0.3.0

### Added
Expand Down
4 changes: 2 additions & 2 deletions docs/conf.py
Expand Up @@ -25,8 +25,8 @@
copyright = u'2018-{}, CosmiQ Works: an IQT Lab'.format(time.strftime("%Y"))

# The full version, including alpha/beta/rc tags
release = '0.3.0'
version = '0.3.0'
release = '0.4.0'
version = '0.4.0'

# -- General configuration ---------------------------------------------------

Expand Down
2 changes: 1 addition & 1 deletion solaris/__init__.py
@@ -1,3 +1,3 @@
from . import bin, data, eval, nets, preproc, raster, tile, utils, vector

__version__ = "0.3.0"
__version__ = "0.4.0"
2 changes: 1 addition & 1 deletion solaris/eval/__init__.py
@@ -1 +1 @@
from . import base, iou, challenges, pixel, vector
from . import base, iou, scot, challenges, pixel, vector
49 changes: 48 additions & 1 deletion solaris/eval/challenges.py
@@ -1,5 +1,7 @@
import pandas as pd
import geopandas as gpd
from .base import Evaluator
from .scot import scot_multi_aoi
import re


Expand Down Expand Up @@ -112,7 +114,7 @@ def off_nadir_buildings(prop_csv, truth_csv, image_columns={}, miniou=0.5,
Minimum area of ground truth regions to include in scoring calculation.
Defaults to ``20``.
Returnss
Returns
-------
results_DF, results_DF_Full
Expand Down Expand Up @@ -206,6 +208,51 @@ def off_nadir_buildings(prop_csv, truth_csv, image_columns={}, miniou=0.5,
return results_DF, results_DF_Full


def multi_temporal_buildings(prop_csv, truth_csv, miniou=0.25, min_area=4.,
beta=2., stats=False, verbose=False):
"""
Evaluate submissions to SpaceNet 7: Multi-Temporal Urban Development
Input CSV files should have "filename", "id", and "geometry" columns.
"""

# Load dataframes
grnd_df = gpd.read_file(truth_csv, GEOM_POSSIBLE_NAMES="geometry", KEEP_GEOM_COLUMNS="NO")
prop_df = gpd.read_file(prop_csv, GEOM_POSSIBLE_NAMES="geometry", KEEP_GEOM_COLUMNS="NO")
if verbose:
print("init len grnd_df:", len(grnd_df))
print("init len prop_df:", len(prop_df))

# Filter out small buildings from ground truth
if min_area is not None:
grnd_df['area'] = grnd_df.area
grnd_df = grnd_df[grnd_df['area'] >= min_area]
grnd_df = grnd_df.drop(columns=['area'])
if verbose:
print("filtered len grnd_df:", len(grnd_df))

# Extract place (aoi) and time (timestep) from the "filename" column
grnd_df['aoi'] = grnd_df['filename'].str.slice(30, 58)
prop_df['aoi'] = prop_df['filename'].str.slice(30, 58)
grnd_df['timestep'] = grnd_df['filename'].str.slice(15, 22)
prop_df['timestep'] = prop_df['filename'].str.slice(15, 22)
aois = sorted(list(grnd_df.aoi.drop_duplicates()))
if verbose:
print("Number of AOIS:", len(aois))

# Compute the score for this proposal
score, all_stats = scot_multi_aoi(grnd_df, prop_df,
threshold=miniou, base_reward=100.,
beta=beta,
stats=True, verbose=verbose)
if verbose:
print('The submission "%s" receives a score of %f'
% (prop_csv, score))
if stats:
return (score, all_stats)
else:
return score


def get_chip_id(chip_name, challenge="spacenet_2"):
"""Get the unique identifier for a chip location from SpaceNet images.
Expand Down
232 changes: 232 additions & 0 deletions solaris/eval/scot.py
@@ -0,0 +1,232 @@
import geopandas as gpd
import scipy.optimize
import scipy.sparse

def match_footprints(grnd_df, prop_df,
threshold=0.25, base_reward=100.):
"""
Optimal matching of ground truth footprints with proposal footprints
(for a single timestep).
Input dataframes should have "id" & "geometry" columns.
"""

# Supplement IDs with indices (which run from zero
# to one less than the number of unique IDs)
grnd_id_set = set(grnd_df['id'])
prop_id_set = set(prop_df['id'])
grnd_id_to_index = {id: index for index, id in
enumerate(sorted(list(grnd_id_set)))}
prop_id_to_index = {id: index for index, id in
enumerate(sorted(list(prop_id_set)))}
grnd_index_to_id = {index: id for id, index in grnd_id_to_index.items()}
prop_index_to_id = {index: id for id, index in prop_id_to_index.items()}
grnd_df['index'] = grnd_df.id.apply(lambda id: grnd_id_to_index[id])
prop_df['index'] = prop_df.id.apply(lambda id: prop_id_to_index[id])

# Calculate IOU for all intersections, and the corresponding reward
grnd_df['grnd_area'] = grnd_df.area
prop_df['prop_area'] = prop_df.area
if not (grnd_df.empty or prop_df.empty):
intersect = gpd.overlay(grnd_df, prop_df)
else:
intersect = None
if intersect is None or len(intersect) == 0:
return [], [], len(grnd_df), len(prop_df), 0, len(prop_df), len(grnd_df), 0., grnd_id_set, prop_id_set
intersect['inter_area'] = intersect.area
intersect['iou'] = intersect['inter_area'] / (intersect['grnd_area']
+ intersect['prop_area'] - intersect['inter_area'])
intersect['reward'] = intersect.apply(lambda row: (row.iou > threshold)
* (base_reward + row.iou), axis=1)

# Convert IOUs and rewards to 2D arrays (by way of sparse matrices)
iou_matrix = scipy.sparse.coo_matrix((intersect.iou, (intersect.index_1, intersect.index_2)),
shape=(len(grnd_df), len(prop_df)))
iou_arr = iou_matrix.toarray()
reward_matrix = scipy.sparse.coo_matrix((intersect.reward, (intersect.index_1, intersect.index_2)),
shape=(len(grnd_df), len(prop_df)))
reward_arr = reward_matrix.toarray()

# Solve unbalanced linear assignment problem
grnd_match, prop_match = scipy.optimize.linear_sum_assignment(reward_arr, maximize=True)
iou_match = iou_arr[grnd_match, prop_match]

# Remove matches that don't actually contribute to the total score
grnd_match_pruned = grnd_match[iou_match>threshold]
prop_match_pruned = prop_match[iou_match>threshold]
iou_match_pruned = iou_match[iou_match>threshold]

# Look up IDs for each match, and calculate descriptive statistics
grnd_match_ids = [grnd_index_to_id[index] for index in grnd_match_pruned]
prop_match_ids = [prop_index_to_id[index] for index in prop_match_pruned]
num_grnd = len(grnd_df)
num_prop = len(prop_df)
tp = len(iou_match_pruned)
fp = num_prop - tp
fn = num_grnd - tp
if 2*tp + fp + fn > 0:
f1 = (2*tp) / (2*tp + fp + fn)
else:
f1 = 0

return grnd_match_ids, prop_match_ids, num_grnd, num_prop, tp, fp, fn, f1, grnd_id_set, prop_id_set


def scot_one_aoi(grnd_df, prop_df, threshold=0.25, base_reward=100., beta=2.,
stats=False, verbose=False):
"""
SpaceNet Change and Object Tracking (SCOT) metric, for one AOI.
Input dataframes should have "timestep", "id", & "geometry" columns.
"""

# Get list of timesteps from ground truth and proposal dataframes
grnd_timestep_set = set(grnd_df.timestep.drop_duplicates())
prop_timestep_set = set(grnd_df.timestep.drop_duplicates())
timesteps = sorted(list(grnd_timestep_set.union(prop_timestep_set)))

# Loop through timesteps
if verbose:
print('Matching footprints')
tp_net = 0
fp_net = 0
fn_net = 0
num_grnd_net = 0
num_prop_net = 0
all_grnd_ids = []
all_prop_ids = []
change_tp_net = 0
change_fp_net = 0
change_fn_net = 0
change_grnd_ids = set()
change_prop_ids = set()
for i, timestep in enumerate(timesteps):

# Get just the data for this timestep
grnd_df_one_timestep = grnd_df.loc[grnd_df.timestep == timestep].copy()
prop_df_one_timestep = prop_df.loc[prop_df.timestep == timestep].copy()

# Find footprint matches for this timestep
grnd_ids, prop_ids, num_grnd, num_prop, tp, fp, fn, f1, grnd_id_set, prop_id_set = match_footprints(
grnd_df_one_timestep, prop_df_one_timestep,
threshold=threshold, base_reward=base_reward)

# Collect aggregate statistics for tracking, and retain all match IDs
tp_net += tp
fp_net += fp
fn_net += fn
num_grnd_net += num_grnd
num_prop_net += num_prop
all_grnd_ids = grnd_ids + all_grnd_ids # newest first
all_prop_ids = prop_ids + all_prop_ids # newest first
if verbose:
print(' %2i: F1 = %.4f' % (i + 1, f1))

# Collect aggregate statistics for change detection
if i > 0:
# Find change detection TPs, FPs, and FNs among matched footprints
new_grnd = [grnd_id not in change_grnd_ids for grnd_id in grnd_ids]
new_prop = [prop_id not in change_prop_ids for prop_id in prop_ids]
change_tp_list = [g and p for g, p in zip(new_grnd, new_prop)]
change_fp_list = [p and not g for g, p in zip(new_grnd, new_prop)]
change_fn_list = [g and not p for g, p in zip(new_grnd, new_prop)]
change_tp_net += sum(change_tp_list)
change_fp_net += sum(change_fp_list)
change_fn_net += sum(change_fn_list)
# Find change detection FPs and FNs among unmatched footprints
unmatched_fp = prop_id_set.difference(prop_ids).difference(change_prop_ids)
unmatched_fn = grnd_id_set.difference(grnd_ids).difference(change_grnd_ids)
change_fp_net += len(unmatched_fp)
change_fn_net += len(unmatched_fn)
change_grnd_ids = change_grnd_ids.union(grnd_id_set)
change_prop_ids = change_prop_ids.union(prop_id_set)

# Identify which matches are mismatches
# (i.e., inconsistent with previous timesteps)
if verbose:
print('Identifying mismatches')
mm_net = 0
for i in range(len(all_grnd_ids)):
grnd_id = all_grnd_ids[i]
prop_id = all_prop_ids[i]
previous_grnd_ids = all_grnd_ids[i+1:]
previous_prop_ids = all_prop_ids[i+1:]
grnd_mismatch = grnd_id in previous_grnd_ids and previous_prop_ids[previous_grnd_ids.index(grnd_id)] != prop_id
prop_mismatch = prop_id in previous_prop_ids and previous_grnd_ids[previous_prop_ids.index(prop_id)] != grnd_id
mismatch = grnd_mismatch or prop_mismatch
if mismatch:
mm_net += 1

# Compute and return score according to the metric
track_tp_net = tp_net - mm_net
track_fp_net = fp_net + mm_net
track_fn_net = fn_net + mm_net
if track_tp_net + (track_fp_net + track_fn_net)/2. > 0:
track_score = (track_tp_net) / (track_tp_net
+ (track_fp_net + track_fn_net)/2.)
else:
track_score = 0
if change_tp_net + (change_fp_net + change_fn_net)/2. > 0:
change_score = (change_tp_net) / (change_tp_net
+ (change_fp_net + change_fn_net)/2.)
else:
change_score = 0
if beta * beta * change_score + track_score > 0:
combo_score = (1 + beta * beta) * (change_score * track_score) / (beta * beta * change_score + track_score)
else:
combo_score = 0
if verbose:
print('Tracking:')
print(' Mismatches: %i' % mm_net)
print(' True Pos: %i' % track_tp_net)
print(' False Pos: %i' % track_fp_net)
print(' False Neg: %i' % track_fn_net)
print(' Track Score: %.4f' % track_score)
print('Change Detection:')
print(' True Pos: %i' % change_tp_net)
print(' False Pos: %i' % change_fp_net)
print(' False Neg: %i' % change_fn_net)
print(' Change Score: %.4f' % change_score)
print('Combined Score: %.4f' % combo_score)
if stats:
return combo_score, [mm_net, track_tp_net, track_fp_net, track_fn_net,
track_score, change_tp_net, change_fp_net,
change_fn_net, change_score, combo_score]
else:
return combo_score


def scot_multi_aoi(grnd_df, prop_df, threshold=0.25, base_reward=100., beta=2.,
stats=True, verbose=False):
"""
SpaceNet Change and Object Tracking (SCOT) metric,
for a SpaceNet 7 submission with multiple AOIs.
Input dataframes should have "aoi", "timestep", "id", & "geometry" columns.
"""

# Get list of AOIs from ground truth dataframe
aois = sorted(list(grnd_df.aoi.drop_duplicates()))

# Evaluate SCOT metric for each AOI
cumulative_score = 0.
all_stats = {}
for i, aoi in enumerate(aois):
if verbose:
print()
print('%i / %i: AOI %s' % (i + 1, len(aois), aoi))
grnd_df_one_aoi = grnd_df.loc[grnd_df.aoi == aoi].copy()
prop_df_one_aoi = prop_df.loc[prop_df.aoi == aoi].copy()
score_one_aoi, stats_one_aoi = scot_one_aoi(
grnd_df_one_aoi, prop_df_one_aoi,
threshold=threshold,
base_reward=base_reward,
beta=beta, stats=True, verbose=verbose)
cumulative_score += score_one_aoi
all_stats[aoi] = stats_one_aoi

# Return combined SCOT metric score
score = cumulative_score / len(aois)
if verbose:
print('Overall score: %f' % score)
if stats:
return score, all_stats
else:
return score

0 comments on commit e596041

Please sign in to comment.