| import numpy as np |
|
|
|
|
| def remove_outlier_points(points_tuples, k_nearest=2, threshold=2.0): |
| """ |
| Robust outlier detection for list of (x,y) tuples. |
| Only requires numpy. |
| |
| Args: |
| points_tuples: list of (x,y) tuples |
| k_nearest: number of neighbors to consider |
| threshold: multiplier for median distance |
| |
| Returns: |
| list: filtered list of (x,y) tuples with outliers removed |
| list: list of booleans indicating which points were kept (True = kept) |
| """ |
| points = np.array(points_tuples) |
| n_points = len(points) |
|
|
| |
| dist_matrix = np.zeros((n_points, n_points)) |
| for i in range(n_points): |
| for j in range(i + 1, n_points): |
| |
| dist = np.sqrt(np.sum((points[i] - points[j]) ** 2)) |
| dist_matrix[i, j] = dist |
| dist_matrix[j, i] = dist |
|
|
| |
| k = min(k_nearest, n_points - 1) |
| neighbor_distances = np.partition(dist_matrix, k, axis=1)[:, :k] |
| avg_neighbor_dist = np.mean(neighbor_distances, axis=1) |
|
|
| |
| median_dist = np.median(avg_neighbor_dist) |
| mask = avg_neighbor_dist <= threshold * median_dist |
|
|
| |
| filtered_tuples = [t for t, m in zip(points_tuples, mask) if m] |
| return filtered_tuples |
|
|