datafest competition 2019
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
 
 

22 lines
462 B

import pandas as pd
# Load the wellness CSV into the module-level DataFrame `df`, which
# vectorize_mult() reads and modifies in place. The path is relative, so it
# is resolved against the current working directory.
df = pd.read_csv('cleaned/dirty_wellness.csv')
def vectorize_mult(column, dictionary, file=None):
    """
    Encode one column of the module-level ``df`` through a lookup table.

    The translated values are stored in a new column whose name is the
    source column name with ``"Num"`` appended. ``df`` is modified in place.

    :param column: name of the existing column in ``df`` to encode
    :param dictionary: lookup handed to ``.map`` to translate each value
    :param file: optional base name; when it is not ``None`` the whole frame
        is written to ``cleaned/<file>.csv`` after the new column is added
    :return: None
    """
    encoded_name = column + "Num"
    encoded_values = df[column].map(dictionary)
    df[encoded_name] = encoded_values

    # No output name supplied: keep the result in memory only.
    if file is None:
        return

    destination = 'cleaned/{}.csv'.format(file)
    df.to_csv(destination)
# Encode USGMeasurement ("No" -> 0, "Yes" -> 1) into a new USGMeasurementNum
# column, then write the updated frame to cleaned/wellness.csv.
vectorize_mult("USGMeasurement", {"No": 0, "Yes": 1}, "wellness")