美文网首页
Python 数据处理

Python 数据处理

作者: 正在充电Loading | 来源:发表于2017-08-24 22:10 被阅读0次

    from sklearn.preprocessing import MinMaxScaler# -*- coding: utf-8 -*-

    import pandas

    data = pandas.read_csv('D:\\PDM\\6.1\\data1.csv')

    #Min-Max标准化

    scaler = MinMaxScaler()

    data['标准化累计票房'] = scaler.fit_transform(data['累计票房'])

    data['标准化豆瓣评分'] = scaler.fit_transform(data['豆瓣评分'])

    #Z-Score标准化

    from sklearn.preprocessing import scale

    data['标准化累计票房'] = scale(data['累计票房'])

    data['标准化豆瓣评分'] = scale(data['豆瓣评分'])

    #Normalizer归一化

    from sklearn.preprocessing import Normalizer

    scaler = Normalizer()

    data['归一化累计票房'] = scaler.fit_transform(

    data['累计票房']

    )[0]

    data['归一化豆瓣评分'] = scaler.fit_transform(

    data['豆瓣评分']

    )[0]

    # -*- coding: utf-8 -*-

    import pandas

    data = pandas.read_csv('D:\\PDM\\6.1\\data2.csv')

    data['症状'] = data['症状'].astype('category')

    dummiesData = pandas.get_dummies(

    data,

    columns=['症状'],

    prefix=['症状'],

    prefix_sep="_"

    )

    import pandas

    data = pandas.read_csv('D:\\PDM\\6.1\\data3.csv')

    from sklearn.preprocessing import Imputer;

    #'mean', 'median', 'most_frequent'

    imputer = Imputer(strategy='mean')

    imputer.fit_transform(data[['累计票房']])

    相关文章

      网友评论

          本文标题:Python 数据处理

          本文链接:https://www.haomeiwen.com/subject/yckydxtx.html