|
import numpy as np |
|
|
|
|
|
def remove_outlier_points(
    points_tuples, k_nearest=2, threshold=2.0, *, return_mask=False
):
    """Remove points that lie unusually far from their nearest neighbors.

    Each point is scored by the mean Euclidean distance to its ``k_nearest``
    closest *other* points. A point is kept when its score is at most
    ``threshold`` times the median score over all points. Only requires numpy.

    Args:
        points_tuples: sequence of (x, y) tuples (any fixed dimensionality
            works; each entry is treated as one coordinate vector).
        k_nearest: number of neighbors to consider (must be >= 1). It is
            capped at ``len(points_tuples) - 1``.
        threshold: multiplier applied to the median score; larger values
            keep more points.
        return_mask: when True, also return the per-point keep flags.

    Returns:
        list: the entries of ``points_tuples`` that were kept, in their
        original order and as the original objects.

        If ``return_mask`` is True, a ``(filtered, mask)`` tuple instead,
        where ``mask`` is a list of booleans aligned with the input
        (True = kept).

    Raises:
        ValueError: if ``k_nearest`` is smaller than 1.
    """
    if k_nearest < 1:
        raise ValueError("k_nearest must be at least 1")

    points_tuples = list(points_tuples)
    n_points = len(points_tuples)

    if n_points < 2:
        # With zero or one point there is no neighbor to compare against,
        # so nothing can be classified as an outlier.
        keep_mask = np.ones(n_points, dtype=bool)
    else:
        # One row per point; float dtype avoids integer overflow when the
        # coordinate differences are squared.
        points = np.asarray(points_tuples, dtype=float).reshape(n_points, -1)

        # All pairwise Euclidean distances in one broadcasted expression.
        deltas = points[:, np.newaxis, :] - points[np.newaxis, :, :]
        dist_matrix = np.sqrt(np.sum(deltas ** 2, axis=-1))

        # A point is not its own neighbor: mask the zero self-distance so it
        # can never be selected among the k smallest entries of a row.
        np.fill_diagonal(dist_matrix, np.inf)

        k = min(k_nearest, n_points - 1)
        # After partitioning at index k - 1, the first k columns of each row
        # hold that row's k smallest distances (in arbitrary order).
        neighbor_distances = np.partition(dist_matrix, k - 1, axis=1)[:, :k]
        avg_neighbor_dist = neighbor_distances.mean(axis=1)

        median_dist = np.median(avg_neighbor_dist)
        keep_mask = avg_neighbor_dist <= threshold * median_dist

    filtered_tuples = [
        point for point, keep in zip(points_tuples, keep_mask) if keep
    ]

    if return_mask:
        return filtered_tuples, keep_mask.tolist()
    return filtered_tuples
|
|