python 一元回归拟合

《python 一元回归拟合（含幂函数，对数，S函数，指数函数，一次、二次、三次，逆函数，生长、复合函数）》这篇文章里的代码，用我自己的数据报错如下：numpy.core._exceptions.UFuncTypeError: ufunc 'add' did not contain a loop with signature matching types (dtype('float64'), dtype('<U92')) -> None，应该怎么处理


def analysis_of_regression(data_df,x_自变量,y_因变量,fw,io_1):     
    import matplotlib.pyplot as plt
    
    import pandas as pd
    from sklearn.metrics import r2_score
    plt.rcParams['font.sans-serif']=['SimHei'] #用来正常显示中文标签
    plt.rcParams['axes.unicode_minus']=False #用来正常显示负号
    
    #%%需要外部加载的变量
    
    
    # df_a = pd.DataFrame( columns=['标签','类型', 'r2', '航司','公式']) 
    df_a = pd.DataFrame() 
    df_d = pd.DataFrame(columns=('标签','类型','r2','系数'))
    
    
  
    data_array = np.array(data_df[['标签']])
    b=data_array.tolist()
    a=[x for tup in b for x in tup]
 
    a = list(set(a))
    
    
    #开始进行函数拟合
    for i in a:    
    # for i in [1]:
        jj=data_df[(data_df['标签']==i)]
        # jj=data_df
        ##线性
        x_cz_2=jj[['自变量']].values.tolist()
        y_cz_2=jj[['因变量']].values.tolist()
        x_cz_2=sum(x_cz_2,[])
        y_cz_2=sum(y_cz_2,[])
        L=np.polyfit(x_cz_2, y_cz_2, 1)
        print(L)
        Z=np.polyval(L,x_cz_2,)
        score = r2_score(y_cz_2, Z, multioutput='raw_values')
        print('线性：'+str(score))
        new=pd.DataFrame({'标签':i,
                          '类型':'线性',
                          'r2':score,
                          '系数':[L]})
        
        df_d=df_d.append(new,ignore_index=(True))
        
        
        ##指数
        x_cz_2=jj[['自变量']].values.tolist()
        y_cz_2=jj[['因变量']].values.tolist()
        x_cz_2=sum(x_cz_2,[])
        y_cz_2=sum(y_cz_2,[])
        L=np.polyfit(x_cz_2, np.log(y_cz_2), 1)
        Z=np.polyval(L,x_cz_2)
        true=np.exp(Z)
        score = r2_score(y_cz_2,true, multioutput='raw_values')
        print('指数：'+str(score))
        new=pd.DataFrame({'标签':i,
                          '类型':'指数',
                          'r2':score,
                          '系数':[L]})
        
        df_d=df_d.append(new,ignore_index=(True))
        
        
        
        
        # ##二次
        # x_cz_2=jj[['自变量']].values.tolist()
        # y_cz_2=jj[['因变量']].values.tolist()
        # x_cz_2=sum(x_cz_2,[])
        # y_cz_2=sum(y_cz_2,[])
        # L=np.polyfit(x_cz_2, y_cz_2, 2)
        # print(L)
        # Z=np.polyval(L,x_cz_2,)
        # score = r2_score(y_cz_2, Z, multioutput='raw_values')
        # print('二次：'+str(score))
        
        # new=pd.DataFrame({'标签':i,
        #                   '类型':'二次',
        #                   'r2':score,
        #                   '系数':[L]})
        
        # df_d=df_d.append(new,ignore_index=(True))
        
        
        ##幂函数
        x_cz_2=jj[['自变量']].values.tolist()
        y_cz_2=jj[['因变量']].values.tolist()
        x_cz_2=sum(x_cz_2,[])
        y_cz_2=sum(y_cz_2,[])
        L=np.polyfit(np.log(x_cz_2), np.log(y_cz_2), 1)
        Z=np.polyval(L,np.log(x_cz_2))
        true=np.exp(Z)
        score = r2_score(y_cz_2,true, multioutput='raw_values')
        print('幂函数：'+str(score))
        
        new=pd.DataFrame({'标签':i,
                          '类型':'幂函数',
                          'r2':score,
                          '系数':[L]})
        
        df_d=df_d.append(new,ignore_index=(True))
    
        ##对数
        x_cz_2=jj[['自变量']].values.tolist()
        y_cz_2=jj[['因变量']].values.tolist()
        x_cz_2=sum(x_cz_2,[])
        y_cz_2=sum(y_cz_2,[])
        L=np.polyfit(np.log(x_cz_2), y_cz_2, 1)
        Z=np.polyval(L,np.log(x_cz_2))
        score = r2_score(y_cz_2,Z, multioutput='raw_values')
        print('对数：'+str(score))
        
        new=pd.DataFrame({'标签':i,
                          '类型':'对数',
                          'r2':score,
                          '系数':[L]})
        
        df_d=df_d.append(new,ignore_index=(True))
    
    
        ##复合函数
        x_cz_2=jj[['自变量']].values.tolist()
        y_cz_2=jj[['因变量']].values.tolist()
        x_cz_2=sum(x_cz_2,[])
        y_cz_2=sum(y_cz_2,[])
        L=np.polyfit(x_cz_2,np.log(y_cz_2), 1)
        Z=np.polyval(L,x_cz_2)
        true=np.exp(Z)
        score = r2_score(y_cz_2,true, multioutput='raw_values')
        print('复合函数：'+str(score))
        
        new=pd.DataFrame({'标签':i,
                          '类型':'复合函数',
                          'r2':score,
                          '系数':[L]})
        
        df_d=df_d.append(new,ignore_index=(True))
        
        ##生长
        x_cz_2=jj[['自变量']].values.tolist()
        y_cz_2=jj[['因变量']].values.tolist()
        x_cz_2=sum(x_cz_2,[])
        y_cz_2=sum(y_cz_2,[])
        L=np.polyfit(x_cz_2, np.log(y_cz_2), 1)
        Z=np.polyval(L,x_cz_2)
        true=np.exp(Z)
        score = r2_score(y_cz_2,true, multioutput='raw_values')
        print('生长：'+str(score))
        
        new=pd.DataFrame({'标签':i,
                          '类型':'生长',
                          'r2':score,
                          '系数':[L]})
        
        df_d=df_d.append(new,ignore_index=(True))
        
        # ##三次
        # x_cz_2=jj[['自变量']].values.tolist()
        # y_cz_2=jj[['因变量']].values.tolist()
        # x_cz_2=sum(x_cz_2,[])
        # y_cz_2=sum(y_cz_2,[])
        # L=np.polyfit(x_cz_2, y_cz_2, deg=3)
        # Z=np.polyval(L,x_cz_2)
        # score = r2_score(y_cz_2,Z,multioutput='raw_values')
        # print('三次：'+str(score))
        
        # new=pd.DataFrame({'标签':i,
        #                   '类型':'三次',
        #                   'r2':score,
        #                   '系数':[L]})
        
        # df_d=df_d.append(new,ignore_index=(True))
        
        # ##S函数
        # x_cz_2=jj[['自变量']].values.tolist()
        # y_cz_2=jj[['因变量']].values.tolist()
        # x_cz_2=sum(x_cz_2,[])
        # x_cz_3 = [1/x for x in x_cz_2]
        # y_cz_2=sum(y_cz_2,[])
        # L=np.polyfit(x_cz_3, np.log(y_cz_2), 1)
        # Z=np.polyval(L,x_cz_3)
        # true=np.exp(Z)
        # score = r2_score(y_cz_2,true,multioutput='raw_values')
        # print('S函数：'+str(score))
        
        # new=pd.DataFrame({'标签':i,
        #                   '类型':'S函数',
        #                   'r2':score,
        #                   '系数':[L]})
        
        # df_d=df_d.append(new,ignore_index=(True))
        
        ##逆函数
        x_cz_2=jj[['自变量']].values.tolist()
        y_cz_2=jj[['因变量']].values.tolist()
        x_cz_2=sum(x_cz_2,[])
        x_cz_3 = [1/x for x in x_cz_2]
        y_cz_2=sum(y_cz_2,[])
        L=np.polyfit(x_cz_3, y_cz_2, 1)
        Z=np.polyval(L,x_cz_3)
        score = r2_score(y_cz_2,true,multioutput='raw_values')
        print('逆函数：'+str(score))
        
        new=pd.DataFrame({'标签':i,
                          '类型':'逆函数',
                          'r2':score,
                          '系数':[L]})
        
        df_d=df_d.append(new,ignore_index=(True))
    
    df_zh=df_d.sort_values('r2', ascending=False).groupby('标签', as_index=False).first()
    
 
    
    ff=df_zh
    # second=df_e[(df_e['类型']=='二次')]
    j=0
    while  j < len(a):
        gg=ff.iloc[[j]].values.tolist()
        gg =sum(gg,[]) 
        
   
        if gg[1] == '二次':
            x=fw
            y_sh=gg[3][0]*x**2+gg[3][1]*x+gg[3][2]
            formu_s='y='+str(gg[3][0])+str('x^2+')+str(gg[3][1])+str('x')+str('+(')+str(gg[3][2])+str(')')
        elif gg[1] == '线性':
            x=fw
            y_sh=gg[3][0]*x+gg[3][1]
            formu_s='y_zh='+str(gg[3][0])+str('x')+str('+(')+str(gg[3][1])+str(')')
        elif gg[1] == '指数':
            x=fw
            y_sh=np.exp(gg[3][0]*x+gg[3][1])
            formu_s='y='+str(np.exp(gg[3][1]))+str('e')+'^'+str(gg[3][0]) +'x'
        elif gg[1] == '幂函数':
            x=fw
            y_sh=np.exp(gg[3][1]+(np.log(x)*gg[3][0]))   
            formu_s='y='+str(np.exp(gg[3][1]))+str('x')+'^'+str(gg[3][0])
        elif gg[1] == '对数':
            x=fw
            y_sh=gg[3][1]+(np.log(x)*gg[3][0])  
            formu_s='y='+str(gg[3][1])+'+'+str(gg[3][0])+'In(x)'      
        elif gg[1] == '生长':
            x=fw
            y_sh=np.exp(gg[3][0]*x+gg[3][1])   
            formu_s='y='+'e^('+str(gg[3][0])+str('x')+str('+(')+str(gg[3][1])+str('))')     
        elif gg[1] == '三次':
            x=fw
            y_sh=gg[3][0]*x**3+gg[3][1]*x**2+gg[3][2]*x+gg[3][3]
            formu_s='y='+str(gg[3][0])+str('x^3+')+str(gg[3][1])+str('x^2+')+str(gg[3][2])+str('x')+str('+(')+str(gg[3][3])+str(')')
        elif gg[1] == 'S函数':
            x=fw
            y_sh=np.exp(gg[3][0]*(x)**(-1)+gg[3][1])   
            formu_s='y='+'e^('+str(gg[3][0])+str('(1/x)')+str('+(')+str(gg[3][1])+str('))')          
        elif gg[1] == '逆函数':
            x=fw
            y_sh=gg[3][0]*(x)**(-1)+gg[3][1]   
            formu_s='y='+str(gg[3][0])+str('(1/x)')+str('+(')+str(gg[3][1])+str(')')
        elif gg[1] == '复合函数':
            x=fw
            y_sh=np.exp(gg[3][1]+(gg[3][0]*x))   
            formu_s='y='+str(np.exp(gg[3][1])) +'*'+str(np.exp(gg[3][0])) +'^x'       
        gg.append(formu_s)
        del gg[3]
        gg=[gg]
        
        df_a=df_a.append(gg,ignore_index=(True))
        
        
        
     
        # if gg[1] == '二次':
        #     x=np.arange(0.15,0.4,0.002)
        #     y_nh=gg[3][0]*x**2+gg[3][1]*x+gg[3][2]-x
        #     formu_n='y_cz='+str(gg[3][0])+str('x^2+')+str(gg[3][1])+str('x')+str('+(')+str(gg[3][2])+str(')')+'-x'
        # elif gg[1] == '线性':
        #     x=np.arange(0.15,0.4,0.002)
        #     y_nh=gg[3][0]*x+gg[3][1]-x
        #     formu_n='y_cz='+str(gg[3][0])+str('x')+str('+(')+str(gg[3][1])+str(')')+'-x'
        # elif gg[1] == '指数':
        #     x=np.arange(0.15,0.4,0.002)
        #     y_nh=np.exp(gg[3][0]*x+np.log(gg[3][1]))-x
        #     # formu=str(gg[3][0])+str('x')+str('+(')+str(gg[3][1])+str(')')    
        # else :
        #     x=np.arange(0.15,0.4,0.002)
        #     y_nh=np.exp(gg[3][0]*x+np.log(gg[3][1])) -x
        
        # if gg[5] == '二次':
        #     x=np.arange(0.15,0.4,0.002)
        #     y_sh=gg[7][0]*x**2+gg[7][1]*x+gg[7][2] -x
        #     formu_s='y_zh='+str(gg[7][0])+str('x^2+')+str(gg[7][1])+str('x')+str('+(')+str(gg[7][2])+str(')')+'-x'
        # elif gg[5] == '线性':
        #     x=np.arange(0.15,0.4,0.002)
        #     y_sh=gg[7][0]*x+gg[7][1] -x
        #     formu_s='y_zh='+str(gg[7][0])+str('x')+str('+(')+str(gg[7][1])+str(')')+'-x'
        # elif gg[5] == '指数':
        #     x=np.arange(0.15,0.4,0.002)
        #     y_sh=np.exp(gg[7][0]*x+np.log(gg[7][1])) -x 
        # else :
        #     x=np.arange(0.15,0.4,0.002)
        #     y_sh=np.exp(ff[7][0]*x+np.log(ff[7][1])) -x
        
        
        
        
        
        
        
        
        
        # fig11=plt.figure(num=11,figsize=(20,17))
        # ax11=fig11.add_subplot(111)
        #调整保存图片的大小
        plt.figure(figsize=(20, 15))
        
        plt.plot(x,y_sh,'r-.o',label=y_因变量+formu_s+'  r2='+str(gg[0][2]),linewidth=0.05)
        
        
        plt.tick_params(labelsize=23)
        
        plt.xlabel(x_自变量,fontsize=40)
        
        plt.ylabel(y_因变量,fontsize=40)
        
        
        
        
        plt.title(str(gg[0][0])+'--'+x_自变量+'&'+y_因变量,fontsize=40) #要用plt调动title
        
        plt.legend(fontsize=30)
    
    
    
    
        x2=data_df[(data_df['标签']==gg[0][0])][['自变量']]
        y2=data_df[(data_df['标签']==gg[0][0])][['因变量']]
        
       
        colors2 = '#DC143C'
        area = np.pi * 6**2.7  # 点面积 
        # 画散点图
        plt.scatter(x2, y2, s=area, c=colors2, alpha=0.5)
        plt.savefig('')
        
        
        plt.savefig(io_1+'/%s.jpg'%(gg[0][0]), bbox_inches='tight')
        plt.show()
        # plt.close()
        j=j+1
        if j > len(a)-1:    
            break
    df_a.columns= ['标签','类型', 'r2','公式'] 
    return df_a

data_df = pd.read_csv(r"E:\回归.csv")
data_df = data_df[data_df.WaterSpeed >= 15]
df_d = pd.DataFrame(columns=('标签','类型', 'r2', '系数'))
x_自变量 = data_df['自变量']
y_因变量 = data_df['因变量']
io_1 = r'C:\Users\**\Desktop\图'
fw = np.arange(1, 100, 1)
answer = analysis_of_regression(data_df, x_自变量, y_因变量, fw, io_1)

写回答
好问题 0 提建议
追加酬金
关注问题
分享
邀请回答
编辑收藏删除
收藏举报

报告相同问题？

关注问题

Python编程语言 list python 有问必答
2021-12-29 11:00

回答 2 已采纳 import random n=int(input()) list=[] for i in range(n): list.append(random.randint(1,200)) print
python编程线性回归 python
2021-06-28 10:33

回答 1 已采纳 import numpy as np import csv import pandas as pd import matplotlib.pyplot as plt from sklearn.line
python一元二次方程求解 python
2022-10-10 18:35

回答 4 已采纳主要是求根那里的表达式有错误，测试例子使用的是第二个链接的第19题，修改如下：参考链接：一元二次方程根的判别式_初三网一元二次方程ax2
python一元线性回归
2022-05-02 21:35

在Python编程环境中，一元线性回归是一种基本的统计学方法，用于研究两个变量之间的关系。这个主题主要涉及数据预处理、模型构建、训练以及预测。在这个案例中，我们将使用`price_diff.csv`数据集来建立一个一元线性...
Python 求一元二次方程问题 python
2021-10-12 12:10

回答 2 已采纳 import math str_in = input('请输出方程系数(a b c):') num = [int(n) for n in str_in.split()] a= num[0]#a b
python编程解决问题 python 有问必答
2021-06-09 20:56

回答 2 已采纳 import random a=[] sum=0 max=0 min=1000 for i in range(20): a.append(random.randint(1,999))
如何matlab或者python实现多元函数的非线性拟合。 python r语言
2021-02-06 22:30

回答 2 已采纳 matlab x1 = [1 2 3 4 5 6]'; x2 = [.2 .4 .8 .9 1.1 2.1]'; X = [x1 x2]; f = [ 3.3079 6.6358 10.31
Python实现一元回归多元回归及参数检验
2022-07-25 21:34

宁然也的博客 Python实现一元回归多元回归及参数检验
阿尔法编程智能实训平台Python python 有问必答
2021-05-31 08:58

回答 7 已采纳 with open('data.txt', 'r') as f: for i in f.readlines(): if i[0]!='#': prin
Python编程填空 python
2021-06-16 10:45

回答 1 已采纳 1、mstr
python求一元二次方程的根 python
2022-11-18 22:13

回答 1 已采纳 print(x1,x2)
python实现一元线性回归方程
2023-10-21 11:36

勿笑葱的博客利用最小二乘法，计算出一元线性回归方程，可以直接调用函数。这里采用的是t检验，数据来源于1990-2012年国内生产总值与成品刚才需求量的统计数据。代码主体用python来实现的，图片是用matlab实现的(个人感觉matlab...
Python用lmfit的lm方法拟合 python
2023-03-04 22:01

回答 1 已采纳 “Devil组”引证GPT后的撰写：用lmfit的lm方法拟合多参数方程时，可以通过调整Parameters对象的参数属性来设置参数权重和步长。其中，每个参数都有一个vary属性，如果vary为Tru
Python一元和多元线性回归模型的原理及评估【附代码】
2024-03-09 19:15

DING0614的博客线性回归模型是利用线性拟合的方式来探寻数据背后的规律，如下图所示，就是通过搭建线性回归模型来寻找这些散点（也称样本点）背后的趋势线（也称回归曲线），而通过这个回归曲线我们就能进行一些简单的预测分析或...
一元线性回归python代码
2021-11-19 21:24

gyh小桂子的博客 4.python代码: 4.1梯度下降法： t1和t2是两组数据，代表着直径数据和价格数据，假设函数(def h(x))是首先进行一个初始赋值，通过梯度下降的方法不断对k和b进行更新，最后拟合出一元线性回归方程。 # 通过分析披萨的...
没有解决我的问题, 去提问

问题事件

关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
系统已结题 11月11日
关注

码龄粉丝数原力等级 --

被采纳

被点赞

采纳率
创建了问题 11月3日

悬赏问题

¥50 python批量提取发票的信息
¥15 mysql安装，初始化数据库失败
¥15 虚幻五引擎内容如何上传至网盘？
¥15 使用mmpose库时出现了问题
¥15 IRI2016模型matlab运行报错
¥50 bat怎么设置电脑后台自动点击网页指定词运行脚本，输入指定网页链接，指定点击词，指定间隔时间，指定网页出现的词，指定网页出现词出现后后点击锁定，放在后台运行不影响前台鼠标工作
¥20 20CrMnMo的高温变形抗力
¥15 RTX3.6 5565驱动中断报错
¥50 带防重放token（Antireplay-Token）的网站怎么用Python发送请求
¥15 visa版本没问题，串口调试助手调试串口正常使用，但是labview刷新不出来

python 一元回归拟合

0条回答 默认 最新

问题事件

悬赏问题

0条回答默认最新