datafest competition 2019
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
|
import pandas as pd
|
|
|
|
# read in CSV
|
|
df = pd.read_csv('cleaned/dirty_wellness.csv')
|
|
|
|
|
|
def vectorize_mult(column, dictionary, file=None):
|
|
"""
|
|
Handles vectorizing
|
|
:param column:
|
|
:param dictionary:
|
|
:param file:
|
|
:return:
|
|
"""
|
|
newCol = column + "Num"
|
|
df[newCol] = df[column].map(dictionary)
|
|
if file is not None:
|
|
df.to_csv('cleaned/{}.csv'.format(file))
|
|
|
|
|
|
|
|
vectorize_mult("USGMeasurement", {"No": 0, "Yes": 1}, "wellness")
|