# -*- coding: utf-8 -*- import math def get_average(records): """ 平均值 """ return sum(records) / len(records) def get_variance(records): """ 方差 反映一个数据集的离散程度 """ average = get_average(records) return sum([(x - average) ** 2 for x in records]) / len(records) def get_standard_deviation(records): """ 标准差 == 均方差 反映一个数据集的离散程度 """ variance = get_variance(records) return math.sqrt(variance) def get_rms(records): """ 均方根值 反映的是有效值而不是平均值 """ return math.sqrt(sum([x ** 2 for x in records]) / len(records)) def get_mse(records_real, records_predict): """ 均方误差 估计值与真值 偏差 """ if len(records_real) == len(records_predict): return sum([(x - y) ** 2 for x, y in zip(records_real, records_predict)]) / len(records_real) else: return None def get_rmse(records_real, records_predict): """ 均方根误差:是均方误差的算术平方根 """ mse = get_mse(records_real, records_predict) if mse: return math.sqrt(mse) else: return None def get_mae(records_real, records_predict): """ 平均绝对误差 """ if len(records_real) == len(records_predict): return sum([abs(x - y) for x, y in zip(records_real, records_predict)]) / len(records_real) else: return None if __name__ == '__main__': records1 = [3, 4, 5] records2 = [2, 4, 6] # 平均值 average1 = get_average(records1) # 4.0 average2 = get_average(records2) # 4.0 # 方差 variance1 = get_variance(records1) # 0.66 variance2 = get_variance(records2) # 2.66 # 标准差 std_deviation1 = get_standard_deviation(records1) # 0.81 std_deviation2 = get_standard_deviation(records2) # 1.63 # 均方根 rms1 = get_rms(records1) # 4.08 rms2 = get_rms(records2) # 4.32 # 均方误差 mse = get_mse(records1, records2) # 0.66 # 均方根误差 rmse = get_rmse(records1, records2) # 0.81 # 平均绝对误差 mae = get_mae(records1, records2) # 0.66