# 代码转载自,链接为:
# https://blog.csdn.net/qq_36847641/article/details/78279309
# -*- coding: utf-8 -*-
import sys
# Python 2-only workaround: reload(sys) makes sys.setdefaultencoding()
# callable again so the process-wide default encoding can be set to UTF-8.
# Python 3 has no builtin reload() and already defaults to UTF-8, so the
# hack is skipped there instead of failing with NameError.
if sys.version_info[0] < 3:
    reload(sys)  # noqa: F821 - builtin on Python 2 only
    sys.setdefaultencoding('utf-8')
# @Author: Chi Yu
# @Date: 2018-07-02 16:23:44
# @Last Modified by: appleyuchi
# @Last Modified time: 2018-07-02 16:45:36
from sklearn.feature_extraction import DictVectorizer
# Toy dataset: every sample is a dict with one string-valued feature
# ('city') and one numeric feature ('temperature').
measurements = [
    {'city': 'Dubai', 'temperature': 33.},
    {'city': 'London', 'temperature': 12.},
    {'city': 'San Fransisco', 'temperature': 18.},
]

# Each sample is a plain dict holding two key-value pairs.
# Single-argument print(...) is used throughout because it produces the
# same output under Python 2 (parenthesised expression) and Python 3.
print("类型是 %s" % type(measurements[0]))
print(measurements[0]['city'])
print(measurements[0]['temperature'])

# Fit the vectorizer on the samples and show the resulting dense matrix.
vec = DictVectorizer()
print(vec.fit_transform(measurements).toarray())
# Output:
# array([[ 1., 0., 0., 33.],
#        [ 0., 1., 0., 12.],
#        [ 0., 0., 1., 18.]])

# get_feature_names() was removed in scikit-learn 1.2. Prefer
# get_feature_names_out() when it exists (converted to a plain list so the
# printed form matches the old API) and fall back on older releases.
if hasattr(vec, 'get_feature_names_out'):
    feature_names = vec.get_feature_names_out().tolist()
else:
    feature_names = vec.get_feature_names()
print(feature_names)
# Output:
# ['city=Dubai', 'city=London', 'city=San Fransisco', 'temperature']
# 原表形式
# 转换后形式