Python NumPy计算欧氏距离（Euclidean Distance）

article/2025/9/18 7:13:27

欧氏距离定义：欧氏距离（ Euclidean distance）是一个通常采用的距离定义，它是在m维空间中两个点之间的真实距离。

在二维和三维空间中，欧氏距离就是两点之间的直线距离。二维的公式是：
\begin{equation} d = \sqrt{(X_1 - Y_1)^2 + (X_2 - Y_2)^2} \end{equation}
三维的公式是：
\begin{equation} d = \sqrt{(X_1 - Y_1)^2 + (X_2 - Y_2)^2 + (X_3 - Y_3)^2} \end{equation}
推广到n维空间，欧氏距离的公式是：
\begin{equation} d = \sqrt{(X_1 - Y_1)^2 + (X_2 - Y_2)^2 + (X_3 - Y_3)^2 + \cdots + (X_n - Y_n)^2} = \sqrt{\sum_{i=1}^{n} (X_i - Y_i)^2} \end{equation}

求3维两点距离：

import numpy as np

from matplotlib import pyplot as plt

from mpl_toolkits.mplot3d import Axes3D

from mpl_toolkits.mplot3d import proj3d

# Two sample points in 3D space.
coords1 = [1, 2, 3]
coords2 = [4, 5, 6]

# Compute the distance instead of hard-coding it, so the label always
# matches the plotted points.
distance = np.linalg.norm(np.array(coords1) - np.array(coords2))

fig = plt.figure(figsize=(7, 7))
ax = fig.add_subplot(111, projection='3d')

# Pair up the coordinates per axis: xs = (x1, x2), ys = (y1, y2), zs = (z1, z2).
xs, ys, zs = zip(coords1, coords2)

# Draw both points as black markers and join them with a red segment.
ax.scatter(xs, ys, zs, color="k", s=150)
ax.plot(xs, ys, zs, color="r")

ax.set_xlabel('X')
ax.set_ylabel('Y')
ax.set_zlabel('Z')

# Anchor the label at the midpoint of the segment, shifted 0.5 down the
# Z axis so the text does not sit directly on the line.
mid_x, mid_y, mid_z = (sum(axis) / 2.0 for axis in (xs, ys, zs))
ax.text(x=mid_x, y=mid_y, z=mid_z - 0.5, s='d = {:.2f}'.format(distance))

plt.title('Euclidean distance between 2 3D-coordinates')
plt.show()

Screen Shot 2015-11-30 at 3.53.09 PM

经典Python实现（vs） NumPy实现

# Sample data: the same two points as plain lists and as NumPy arrays
coords1, coords2 = [1, 2, 3], [4, 5, 6]
np_c1, np_c2 = (np.array(point) for point in (coords1, coords2))

# Classic for-loop
def eucldist_forloop(coords1, coords2):
    """Return the Euclidean distance between two coordinate sequences.

    The sequences are walked in lockstep with ``zip``, so when their lengths
    differ the extra trailing coordinates of the longer one are ignored.
    """
    squared_total = 0
    for a, b in zip(coords1, coords2):
        delta = a - b
        squared_total += delta**2
    # Raising to the power 0.5 takes the square root of the summed squares.
    return squared_total**0.5

# Generator expression
def eucldist_generator(coords1, coords2):
    """Return the Euclidean distance between two coordinate sequences.

    The squared differences are produced lazily by a generator expression
    and consumed by ``sum``; ``zip`` stops at the shorter sequence.
    """
    squared_diffs = ((a - b)**2 for a, b in zip(coords1, coords2))
    return sum(squared_diffs)**0.5

# NumPy version
def eucldist_vectorized(coords1, coords2):
    """Return the Euclidean distance between two coordinate vectors.

    Args:
        coords1: First point, as a NumPy array or any array-like
            (list, tuple) of numbers.
        coords2: Second point, in the same form as ``coords1``.

    Returns:
        The square root of the sum of the squared element-wise differences.
    """
    # np.asarray leaves existing arrays untouched but converts plain
    # lists/tuples, for which ``coords1 - coords2`` would raise TypeError.
    difference = np.asarray(coords1) - np.asarray(coords2)
    return np.sqrt(np.sum(difference**2))

# NumPy built-in: the norm of the difference vector
np.linalg.norm(np_c1 - np_c2)

# Print the result of every implementation, one per line, for comparison
for distance in (
    eucldist_forloop(coords1, coords2),
    eucldist_generator(coords1, coords2),
    eucldist_vectorized(np_c1, np_c2),
    np.linalg.norm(np_c1 - np_c2),
):
    print(distance)

Screen Shot 2015-11-30 at 4.04.47 PM
timeit比较执行效率：

import numpy as np

from matplotlib import pyplot as plt

from mpl_toolkits.mplot3d import Axes3D

from mpl_toolkits.mplot3d import proj3d

# Sample data: the same two points as plain lists and as NumPy arrays
coords1, coords2 = [1, 2, 3], [4, 5, 6]
np_c1, np_c2 = (np.array(point) for point in (coords1, coords2))

def eucldist_forloop(coords1, coords2):
    """Return the Euclidean distance between two coordinate sequences.

    The sequences are walked in lockstep with ``zip``, so when their lengths
    differ the extra trailing coordinates of the longer one are ignored.
    """
    squared_total = 0
    for a, b in zip(coords1, coords2):
        delta = a - b
        squared_total += delta**2
    # Raising to the power 0.5 takes the square root of the summed squares.
    return squared_total**0.5

def eucldist_generator(coords1, coords2):
    """Return the Euclidean distance between two coordinate sequences.

    The squared differences are produced lazily by a generator expression
    and consumed by ``sum``; ``zip`` stops at the shorter sequence.
    """
    squared_diffs = ((a - b)**2 for a, b in zip(coords1, coords2))
    return sum(squared_diffs)**0.5

def eucldist_vectorized(coords1, coords2):
    """Return the Euclidean distance between two coordinate vectors.

    Args:
        coords1: First point, as a NumPy array or any array-like
            (list, tuple) of numbers.
        coords2: Second point, in the same form as ``coords1``.

    Returns:
        The square root of the sum of the squared element-wise differences.
    """
    # np.asarray leaves existing arrays untouched but converts plain
    # lists/tuples, for which ``coords1 - coords2`` would raise TypeError.
    difference = np.asarray(coords1) - np.asarray(coords2)
    return np.sqrt(np.sum(difference**2))

import timeit

import random

# Seed the stdlib RNG with a fixed value so the random benchmark inputs
# generated below are the same on every run.
random.seed(123)

from numpy.linalg import norm as np_linalg_norm

# Names of the implementations under test; also the keys of ``times``.
funcs = ('eucldist_forloop', 'eucldist_generator', 'eucldist_vectorized', 'np_linalg_norm')

# times[name][i] holds the best measured runtime (in seconds) of
# implementation ``name`` for the sample size orders_n[i].
times = {f: [] for f in funcs}

# Sample sizes to benchmark: 10, 100, ..., 10**7.
orders_n = [10**i for i in range(1, 8)]

# (implementation name, timed statement, setup statement) per benchmark.
# The setup pulls the current inputs from ``__main__``, so this code has to
# run as the main script (or in an interactive session).
benchmarks = (
    ('eucldist_forloop',
     'eucldist_forloop(c1, c2)',
     'from __main__ import c1, c2, eucldist_forloop'),
    ('eucldist_generator',
     'eucldist_generator(c1, c2)',
     'from __main__ import c1, c2, eucldist_generator'),
    ('eucldist_vectorized',
     'eucldist_vectorized(np_c1, np_c2)',
     'from __main__ import np_c1, np_c2, eucldist_vectorized'),
    ('np_linalg_norm',
     'np_linalg_norm(np_c1 - np_c2)',
     'from __main__ import np_c1, np_c2, np_linalg_norm'),
)

for n in orders_n:
    # Fresh random integer coordinates, as lists and as NumPy arrays.
    c1 = [random.randint(0, 100) for _ in range(n)]
    c2 = [random.randint(0, 100) for _ in range(n)]
    np_c1 = np.array(c1)
    np_c2 = np.array(c2)

    # Sanity check that all implementations agree. The results are floats
    # computed along different routes (``**0.5``, ``np.sqrt``, ``norm``), so
    # compare with a tolerance instead of exact equality, which could fail
    # on a last-bit rounding difference.
    reference = eucldist_forloop(c1, c2)
    others = [
        eucldist_generator(c1, c2),
        eucldist_vectorized(np_c1, np_c2),
        np_linalg_norm(np_c1 - np_c2),
    ]
    assert np.allclose(others, reference, rtol=1e-9, atol=0.0)

    # Record the fastest of 50 single-call runs for each implementation.
    for name, stmt, setup in benchmarks:
        timer = timeit.Timer(stmt, setup)
        times[name].append(min(timer.repeat(repeat=50, number=1)))

# Legend text for each benchmarked implementation, keyed by function name.
labels = {
    'eucldist_forloop': 'for-loop',
    'eucldist_generator': 'generator expression (comprehension equiv.)',
    'eucldist_vectorized': 'NumPy vectorization',
    'np_linalg_norm': 'numpy.linalg.norm',
}

def plot(times, orders_n, labels):
    """Draw the benchmark timings as one log-log curve per implementation.

    Args:
        times: Mapping from implementation name to its list of timings,
            one entry per value in ``orders_n``.
        orders_n: Sample sizes, used as the x coordinates.
        labels: Mapping from implementation name to its legend text. Keys
            are paired with the four predefined colors/linestyles, so at
            most four entries are drawn.
    """
    palette = ('cyan', '#7DE786', 'black', 'blue')
    dash_styles = ('-', '-', '--', '--')

    plt.figure(figsize=(11, 10))

    for name, line_color, dash in zip(labels, palette, dash_styles):
        plt.plot(
            orders_n,
            times[name],
            alpha=1,
            label=labels[name],
            lw=3,
            color=line_color,
            linestyle=dash,
        )

    plt.xlabel('sample size n (items in the list)', fontsize=14)
    plt.ylabel('time per computation in seconds', fontsize=14)

    # Leave one decade of margin on either side of the sampled range.
    lower_bound = min(orders_n) / 10
    upper_bound = max(orders_n) * 10
    plt.xlim([lower_bound, upper_bound])

    plt.legend(loc=2, fontsize=14)
    plt.grid()
    plt.xticks(fontsize=16)
    plt.yticks(fontsize=16)
    plt.xscale('log')
    plt.yscale('log')
    plt.title('Python for-loop/generator expr. vs. NumPy vectorized code', fontsize=18)
    plt.show()

# Render the comparison chart from the collected timings.
plot(times, orders_n, labels)

Screen Shot 2015-11-30 at 4.23.19 PM

文章转载自： http://blog.topspeedsnail.com/archives/954

Python NumPy计算欧氏距离（Euclidean Distance）

相关文章

Euclidean division

PRN（20201012）：Improved updating of Euclidean distance maps and Voronoi diagrams

java余弦距离_使用TensorFlow实现余弦距离/欧氏距离（Euclideandistance）以及Attention矩阵的计算...

点云检测--欧式聚类Euclidean Cluster

Voxblox: Incremental 3D Euclidean Signed Distance Fields for On-Board MAV Planning

3D点云处理：点云聚类--FEC: Fast Euclidean Clustering for Point Cloud Segmentation

euclidean loss

Euclidean, Manhattan, hop-count distance 区别

扩展Euclidean算法求乘法逆原理详解与算法实现

NEO4J-相似度算法04-欧几里得距离算法（euclidean）应用场景简介

欧几里德算法、拓展欧几里德、中国剩余定理

logit回归模型_一文读懂条件Logistic回归

目标检测-定位蒸馏：logit蒸馏与feature蒸馏之争

biogeme-nest_logit-cnblog

必看 logit回归分析步骤汇总

PyTorch logit函数

logit回归模型_详解 Logit/Probit 模型中的 completely determined 问题

Logit Adjust

logit

Logit 是怎么算的？