| | import numpy as np
|
| |
|
| |
|
| | def remove_outlier_points(points_tuples, k_nearest=2, threshold=2.0):
|
| | """
|
| | Robust outlier detection for list of (x,y) tuples.
|
| | Only requires numpy.
|
| |
|
| | Args:
|
| | points_tuples: list of (x,y) tuples
|
| | k_nearest: number of neighbors to consider
|
| | threshold: multiplier for median distance
|
| |
|
| | Returns:
|
| | list: filtered list of (x,y) tuples with outliers removed
|
| | list: list of booleans indicating which points were kept (True = kept)
|
| | """
|
| | points = np.array(points_tuples)
|
| | n_points = len(points)
|
| |
|
| |
|
| | dist_matrix = np.zeros((n_points, n_points))
|
| | for i in range(n_points):
|
| | for j in range(i + 1, n_points):
|
| |
|
| | dist = np.sqrt(np.sum((points[i] - points[j]) ** 2))
|
| | dist_matrix[i, j] = dist
|
| | dist_matrix[j, i] = dist
|
| |
|
| |
|
| | k = min(k_nearest, n_points - 1)
|
| | neighbor_distances = np.partition(dist_matrix, k, axis=1)[:, :k]
|
| | avg_neighbor_dist = np.mean(neighbor_distances, axis=1)
|
| |
|
| |
|
| | median_dist = np.median(avg_neighbor_dist)
|
| | mask = avg_neighbor_dist <= threshold * median_dist
|
| |
|
| |
|
| | filtered_tuples = [t for t, m in zip(points_tuples, mask) if m]
|
| | return filtered_tuples
|
| |
|