zhuge
# -*- coding: utf-8 -*-
"""
Created on Fri Dec 1 18:08:06 2017
@author: Administrator
"""
def popo(dmi, columns):
    """Summarise the rows of ``dmi`` that share the most common ``columns`` value.

    Args:
        dmi: Table-like object that supports ``dmi[key]`` and boolean-mask
            selection (presumably a pandas DataFrame -- TODO confirm).
        columns: Key of the single column whose most common value selects
            the rows to summarise.

    Returns:
        ``None`` when the column is empty or its most common value occurs
        fewer than twice. Otherwise a list ``[ww1, ww2, n]`` where ``ww1`` is
        ``round(k_means(lower_dimention(subset)), 2)``, ``ww2`` is
        ``round(k_means(subset[columns]), 2)`` and ``n`` is ``10`` when the
        relative spread ``(max - min) / mean`` of the reduced values is below
        0.1 and there is more than one value, else the number of values.

    ``lower_dimention`` and ``k_means`` are helpers defined outside this
    block; their exact semantics are not visible here.
    """
    most_area = Counter(dmi[columns]).most_common(1)
    # most_common(1) is an empty list for an empty column; treat that the
    # same as "no value repeats" instead of failing on most_area[0].
    if not most_area or most_area[0][1] < 2:
        return None

    dmi2 = dmi[dmi[columns] == most_area[0][0]]
    print('dmi=', dmi)
    dmiy = lower_dimention(dmi2)
    ratio2 = (dmiy.max() - dmiy.min()) / dmiy.mean()
    ww1 = round(k_means(dmiy), 2)
    ww2 = round(k_means(dmi2[columns]), 2)
    print('dmi2=', dmi2)

    # The original had a print after the first return; it could never run and
    # referenced a name (dd) that is not local to this function, so it is gone.
    if ratio2 < 0.1 and len(dmiy) > 1:
        return [ww1, ww2, 10]
    return [ww1, ww2, len(dmiy)]
# 3x3 object array pre-filled with None; row 0 receives whatever popo()
# returns for the 'room' column of the module-level dmi2.
dd = numpy.full((3, 3), None, dtype=object)
dd[0] = popo(dmi2, 'room')
def _summary_row(reduced, areas):
    """Build one result row for ``filter_data`` from a subset's values.

    Args:
        reduced: Output of ``lower_dimention`` for the current subset.
        areas: The ``'area'`` column of the same subset.

    Returns:
        ``(row, is_tight)``. ``row`` is
        ``[round(k_means(reduced), 2), round(k_means(areas), 2), marker]``
        and ``is_tight`` is true when the relative spread
        ``(max - min) / mean`` of ``reduced`` is below 0.1 and ``reduced``
        holds more than one value.
    """
    spread = (reduced.max() - reduced.min()) / reduced.mean()
    reduced_center = round(k_means(reduced), 2)
    area_center = round(k_means(areas), 2)
    is_tight = spread < 0.1 and len(reduced) > 1
    # A tight spread is reported with the fixed marker 10; otherwise the third
    # slot carries the number of values that went into the row.
    marker = 10 if is_tight else len(reduced)
    return [reduced_center, area_center, marker], is_tight


def filter_data(dmi):
    """Summarise ``dmi`` at up to three progressively narrower levels.

    Row 0 of the result covers all of ``dmi``; row 1 covers the rows sharing
    the most common ``'area'`` value; row 2 covers, within those, the rows
    sharing the most common ``'floor'`` value. Each row is
    ``[round(k_means(lower_dimention(subset)), 2),
    round(k_means(subset['area']), 2), marker]`` with ``marker`` equal to 10
    for a tight subset (relative spread below 0.1, more than one value) and
    to the number of values otherwise.

    Narrowing stops as soon as a level is tight, or when the most common
    value of the next column occurs fewer than twice; rows that were not
    computed stay ``None``.

    NOTE(review): the source this was recovered from had lost its
    indentation. The nesting used here (each narrower level runs only when
    the previous level was not tight) is a reconstruction -- confirm against
    the intended behaviour.

    Args:
        dmi: Table-like object with ``'area'`` and ``'floor'`` columns that
            supports boolean-mask selection (presumably a pandas DataFrame
            -- TODO confirm).

    Returns:
        A ``(3, 3)`` numpy object array as described above.
    """
    dd = numpy.full((3, 3), None, dtype=object)

    # Level 0: every row of dmi.
    dmix = lower_dimention(dmi)
    row, is_tight = _summary_row(dmix, dmi['area'])
    print('x' * 100)
    print(dmi)
    dd[0] = row
    if is_tight:
        print('room_filter', dd)
        return dd

    # Level 1: rows whose 'area' equals the most common area.
    most_area = Counter(dmi['area']).most_common(1)
    # most_common(1) is empty for an empty column; nothing to narrow by then.
    if not most_area or most_area[0][1] < 2:
        return dd
    dmi2 = dmi[dmi['area'] == most_area[0][0]]
    print('dmi=', dmi)
    dmiy = lower_dimention(dmi2)
    row, is_tight = _summary_row(dmiy, dmi2['area'])
    print('dmi2=', dmi2)
    dd[1] = row
    if is_tight:
        print('area_filter', dd)
        return dd

    # Level 2: within the level-1 rows, those on the most common floor.
    print('****************************************' * 10)
    most_floor = Counter(dmi2['floor']).most_common(1)
    if not most_floor or most_floor[0][1] < 2:
        return dd
    dmi3 = dmi2[dmi2['floor'] == most_floor[0][0]]
    print('dmi3=', dmi3)
    dmiz = lower_dimention(dmi3)
    row, is_tight = _summary_row(dmiz, dmi3['area'])
    dd[2] = row
    if is_tight:
        print(dd)
    return dd
# Run filter_data on dmi2 and keep the returned array in ddr.
# NOTE(review): dmi2 is not assigned at module level anywhere in the visible
# part of this file -- presumably it is defined elsewhere; confirm.
ddr=filter_data(dmi2)
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· DeepSeek 开源周回顾「GitHub 热点速览」
· 物流快递公司核心技术能力-地址解析分单基础技术分享
· .NET 10首个预览版发布:重大改进与新特性概览!
· AI与.NET技术实操系列(二):开始使用ML.NET
· .NET10 - 预览版1新功能体验(一)