import pandas as pd


def read_data_dict(filename, type_cast_dict=None):
    """Read a comma-separated text file into a list of row dictionaries.

    The first line of the file supplies the column names. Every following
    non-blank line becomes one dictionary mapping column name to value.
    Values are kept as strings unless the column name is a key of
    ``type_cast_dict``, in which case the mapped callable converts the value.

    Args:
        filename: Path of the file to read.
        type_cast_dict: Optional mapping of column name to a one-argument
            callable (for example ``int`` or ``float``) that is applied to
            the raw string value of that column. ``None`` (the default)
            means no column is converted.

    Returns:
        A list with one dict per data row, in file order. A row with fewer
        fields than the header only contains the leading columns.

    Raises:
        IndexError: If a data row has more fields than the header line.
        Exception: Whatever a cast callable raises for a value it cannot
            convert (e.g. ``ValueError`` from ``int("abc")``).

    Note:
        Lines are split on every comma, so quoted fields that contain
        commas are not supported. Blank or whitespace-only lines are
        skipped instead of producing a row.
    """
    # A None default avoids sharing one dict object between calls.
    casts = {} if type_cast_dict is None else type_cast_dict
    data = []

    # The context manager guarantees the file is closed, even when a cast
    # function raises part-way through the file.
    with open(filename, "r") as file:
        headers = file.readline().strip().split(",")

        # The header is line 1, so data rows start at line 2.
        for line_number, line in enumerate(file, start=2):
            stripped = line.strip()
            if not stripped:
                # Skip blank lines rather than emitting {first_header: ''}.
                continue

            pieces = stripped.split(",")
            if len(pieces) > len(headers):
                raise IndexError(
                    f"line {line_number} of {filename!r} has {len(pieces)} "
                    f"fields but the header defines only {len(headers)}"
                )

            row_dict = {}
            # zip pairs each value with its column name; short rows simply
            # stop early and leave the trailing columns out.
            for header, piece in zip(headers, pieces):
                if header in casts:
                    row_dict[header] = casts[header](piece)
                else:
                    row_dict[header] = piece

            data.append(row_dict)

    return data


# Parse the CSV into a list of per-row dicts. No type_cast_dict is passed,
# so every value stays a string.
data = read_data_dict(filename='heart_failure_clinical_records_dataset.csv')
# Notebook-style preview of the first five rows.
data[:5]

[{'age': '75',
  'anaemia': '0',
  'creatinine_phosphokinase': '582',
  'diabetes': '0',
  'ejection_fraction': '20',
  'high_blood_pressure': '1',
  'platelets': '265000',
  'serum_creatinine': '1.9',
  'serum_sodium': '130',
  'sex': '1',
  'smoking': '0',
  'time': '4',
  'DEATH_EVENT': '1'},
 {'age': '55',
  'anaemia': '0',
  'creatinine_phosphokinase': '7861',
  'diabetes': '0',
  'ejection_fraction': '38',
  'high_blood_pressure': '0',
  'platelets': '263358.03',
  'serum_creatinine': '1.1',
  'serum_sodium': '136',
  'sex': '1',
  'smoking': '0',
  'time': '6',
  'DEATH_EVENT': '1'},
 {'age': '65',
  'anaemia': '0',
  'creatinine_phosphokinase': '146',
  'diabetes': '0',
  'ejection_fraction': '20',
  'high_blood_pressure': '0',
  'platelets': '162000',
  'serum_creatinine': '1.3',
  'serum_sodium': '129',
  'sex': '1',
  'smoking': '1',
  'time': '7',
  'DEATH_EVENT': '1'},
 {'age': '50',
  'anaemia': '1',
  'creatinine_phosphokinase': '111',
  'diabetes': '0',
  'ejection_fraction': '20',
  'high_blood_pressure': '0',
  'platelets': '210000',
  'serum_creatinine': '1.9',
  'serum_sodium': '137',
  'sex': '1',
  'smoking': '0',
  'time': '7',
  'DEATH_EVENT': '1'},
 {'age': '65',
  'anaemia': '1',
  'creatinine_phosphokinase': '160',
  'diabetes': '1',
  'ejection_fraction': '20',
  'high_blood_pressure': '0',
  'platelets': '327000',
  'serum_creatinine': '2.7',
  'serum_sodium': '116',
  'sex': '0',
  'smoking': '0',
  'time': '8',
  'DEATH_EVENT': '1'}]

# Heart failure

# Data Features

# Data Usage