将itertools组合列表传递给函数映射？

import numpy as np
import matplotlib.pyplot as plt
import itertools
import statistics
from scipy import stats


def new_list(x, y, n, replacex, replacey):
    '''Return copies of x and y with item n replaced by replacex and replacey.

    x, y      -- 1D sequences of numbers (left unmodified)
    n         -- index of the item to replace in both sequences
    replacex  -- value written to position n of the x copy
    replacey  -- value written to position n of the y copy

    Returns a tuple (newx, newy) of float numpy arrays.
    '''
    # Copy as float so a fractional replacement (e.g. a median of 8.5) is
    # not truncated when the source list only holds integers.
    newx = np.array(x, dtype=float)
    newy = np.array(y, dtype=float)
    # Use the values passed in, not the module-level replacement globals.
    newx[n] = replacex
    newy[n] = replacey
    return (newx, newy)


# Results of the correlation re-run after each single-item replacement.
p2values = []  # p values for the new correlations
r2values = []  # r values for the new correlations

# x,y values for one of Anscombe's Quartet as an example
x = [8, 8, 8, 8, 8, 8, 8, 19, 8, 8, 8]
y = [6.58, 5.76, 7.71, 8.84, 8.47, 7.04, 5.25, 12.50, 5.56, 7.91, 6.89]

# Single x and y values placed into the data to run the new correlation.
# Currently using the median.
replacementx = statistics.median(x)
replacementy = statistics.median(y)

# The baseline correlation does not depend on n, so compute it once.
r, p = stats.pearsonr(x, y)

# Replace each item in turn with the medians and re-run the correlation.
for n in range(len(x)):
    newx, newy = new_list(x, y, n, replacementx, replacementy)
    r2, p2 = stats.pearsonr(newx, newy)
    p2values.append(p2)
    r2values.append(r2)

# Constant series so the original r and p can be drawn as reference lines
# next to the per-replacement values.
rvalues = [r] * len(r2values)
pvalues = [p] * len(p2values)

fig, ax1 = plt.subplots()

color = 'tab:red'
ax1.set_xlabel('Item number')
ax1.set_ylabel('Pearson r', color=color)
ax1.set_ylim(0, 1)
ax1.plot(range(len(r2values)), r2values, range(len(rvalues)), rvalues, color=color)
ax1.tick_params(axis='y', labelcolor=color)

ax2 = ax1.twinx()  # instantiate a second axes that shares the same x-axis

color = 'tab:blue'
ax2.set_ylabel('p value', color=color)  # we already handled the x-label with ax1
ax2.plot(range(len(p2values)), p2values, range(len(pvalues)), pvalues, color=color)
ax2.tick_params(axis='y', labelcolor=color)

plt.show()

import itertools

# x,y values for one of Anscombe's Quartet as an example
x = [8, 8, 8, 8, 8, 8, 8, 19, 8, 8, 8]
y = [6.58, 5.76, 7.71, 8.84, 8.47, 7.04, 5.25, 12.50, 5.56, 7.91, 6.89]

# Pair each x with its y so a point is always handled as one unit.
data = list(zip(x, y))

# Every unordered pair of points: the candidates for replacement.
replacement_candidates = list(itertools.combinations(data, 2))
print(replacement_candidates)

1条回答

网友

1楼 · 发布于 2024-10-01 11:29:34

好的，我已经弄明白了，所以把代码发布在这里，以防对其他人有帮助。我之前完全走错了方向。这里的示例使用的是Anscombe四重奏的第四组数据（即x中只有一个值为19的那一组），x、y值以及n=3（即枚举所有3个值的组合）都是硬编码的，但您显然可以将其替换为任何想要的值。n=1的情况表明，当第8项被替换时，这组数据很脆弱（r、p的计算结果为nan）。［图片：sample output plot with n=1］我打算把它重写成一个接收x、y和n的函数，但由于组合的数量可能很快失控，我想采取一些措施来防止内存不足错误，并加上进度条之类的东西（这超出了我目前的能力，因为这基本上是我在Python中的“Hello World”）。结果与原始r和p的虚线参考线一起绘制，这对我很有帮助。

import numpy as np 
import matplotlib.pyplot as plt
import itertools
import statistics
from scipy import stats
# Inputs for the experiment:
#   x, y -- paired observations the correlation is computed on
#   n    -- how many points are swapped out at a time; every n-sized
#           combination of points is enumerated further down
x = [8, 8, 8, 8, 8, 8, 8, 19, 8, 8, 8]
y = [6.58, 5.76, 7.71, 8.84, 8.47, 7.04, 5.25, 12.50, 5.56, 7.91, 6.89]
n = 3

# Accumulators, filled with one entry per candidate combination.
r2values = []  # Pearson r of each modified data set
p2values = []  # p-value of each modified data set

# Baseline correlation of the untouched data.
r, p = stats.pearsonr(x, y)

# The point substituted for every removed observation: (median x, median y).
appendtuple = (statistics.median(x), statistics.median(y))

# Keep each x with its y, then list every way of choosing n of the points.
data = list(zip(x, y))
replacement_candidates = list(itertools.combinations(data, n))

def Diff(li1, li2):
    """Return the items of li1 left after removing the items of li2.

    Each item in li2 cancels exactly one equal item in li1, so repeated
    values (e.g. two identical (x, y) observations) are not collapsed the
    way a set difference would collapse them.  The surviving items keep
    their original order.  Items must be hashable.
    """
    # Count how many copies of each value still have to be removed.
    pending = {}
    for item in li2:
        pending[item] = pending.get(item, 0) + 1

    kept = []
    for item in li1:
        if pending.get(item, 0):
            pending[item] -= 1  # this copy is one of the removed ones
        else:
            kept.append(item)
    return kept

# Re-run the correlation once per candidate combination: drop the chosen
# points from the data and put n copies of the median point in their place,
# so the sample size stays the same.
for candidate in replacement_candidates:
    a = Diff(data, candidate)
    a.extend([appendtuple] * n)
    res_listx = [point[0] for point in a]
    res_listy = [point[1] for point in a]
    # NOTE: r2 and p2 can come back as nan (reported for n=1 when the x=19
    # point is replaced, which leaves every x equal).
    r2, p2 = stats.pearsonr(res_listx, res_listy)
    p2values.append(p2)
    r2values.append(r2)

fig, ax1 = plt.subplots()

# Left axis: Pearson r of every modified data set.
color = 'tab:red'
ax1.set_xlabel('Item number')
ax1.set_ylabel('Pearson r', color=color)
ax1.set_ylim(0, 1)  # NOTE(review): negative r values fall outside this range
ax1.plot(range(len(r2values)), r2values, color=color)
ax1.tick_params(axis='y', labelcolor=color)
# Dotted reference line at the r of the original, unmodified data.
ax1.hlines(r, 0, len(r2values), linestyles='dotted', label='r', color=color)

ax2 = ax1.twinx()  # instantiate a second axes that shares the same x-axis

# Right axis: p-value of every modified data set.
color = 'tab:blue'
ax2.set_ylabel('p value', color=color)  # we already handled the x-label with ax1
ax2.plot(range(len(p2values)), p2values, color=color)
ax2.tick_params(axis='y', labelcolor=color)
# Dotted reference line at the p-value of the original, unmodified data.
ax2.hlines(p, 0, len(p2values), linestyles='dotted', label='p', color=color)

plt.show()

相关问题更多 >

编程相关推荐

热门问题

热门文章