In this very short post I want to point you to some code for calculating the centroid and distance to that centroid for a set of points in numpy. As bonus I also included some profiling. Note that I already blogged about the centroid function in a previous post.
from math import atan2, sqrt, degrees import numpy as np from math import radians, sin, cos RADIUS = 6371.009 def get_centroid(points): xy = np.asarray(points) xy = np.radians(xy) lon, lat = xy[:, 0], xy[:, 1] avg_x = np.sum(np.cos(lat) * np.cos(lon)) / xy.shape[0] avg_y = np.sum(np.cos(lat) * np.sin(lon)) / xy.shape[0] avg_z = np.sum(np.sin(lat)) / xy.shape[0] center_lon = atan2(avg_y, avg_x) hyp = sqrt(avg_x * avg_x + avg_y * avg_y) center_lat = atan2(avg_z, hyp) return degrees(center_lon), degrees(center_lat) def gc_distance_points(a, points): b = np.asarray(points) lat1, lng1 = radians(a[1]), radians(a[0]) lat2, lng2 = np.radians(b[:, 1]), np.radians(b[:, 0]) sin_lat1, cos_lat1 = sin(lat1), cos(lat1) sin_lat2, cos_lat2 = np.sin(lat2), np.cos(lat2) delta_lng = np.subtract(lng2, lng1) cos_delta_lng, sin_delta_lng = np.cos(delta_lng), np.sin(delta_lng) d = np.arctan2(np.sqrt((cos_lat2 * sin_delta_lng) ** 2 + (cos_lat1 * sin_lat2 - sin_lat1 * cos_lat2 * cos_delta_lng) ** 2), sin_lat1 * sin_lat2 + cos_lat1 * cos_lat2 * cos_delta_lng) return RADIUS * d def gc_dist(a, b): from math import radians, sin, cos, sqrt, atan2 lat1, lng1 = radians(a[1]), radians(a[0]) lat2, lng2 = radians(b[1]), radians(b[0]) sin_lat1, cos_lat1 = sin(lat1), cos(lat1) sin_lat2, cos_lat2 = sin(lat2), cos(lat2) delta_lng = lng2 - lng1 cos_delta_lng, sin_delta_lng = cos(delta_lng), sin(delta_lng) d = atan2(sqrt((cos_lat2 * sin_delta_lng) ** 2 + (cos_lat1 * sin_lat2 - sin_lat1 * cos_lat2 * cos_delta_lng) ** 2), sin_lat1 * sin_lat2 + cos_lat1 * cos_lat2 * cos_delta_lng) return RADIUS * d if __name__ == '__main__': import random random.seed(42) pts = [(random.uniform(-180, 180), random.uniform(-90, 90)) for _ in range(1000000)] centr = get_centroid(pts) import cProfile cProfile.runctx('gc_distance_points(centr, pts)', globals(), locals()) cProfile.runctx('dists = [gc_dist(centr, b) for b in pts]', globals(), locals())
All code is also available at Github. Feel free to post a comment or email in case you have any questions.