# to sort these into tables: sids = [] marr_val = [[] for i in df['marriage_related'][0][0].keys()] # for other variables # work_val = [[] for i in df['work_related'][0][0].keys()] # ... for i, el in enumerate(df['survey_id']): sids.extend([el for i in marriage_related[i]]) for j, lst in enumerate(marr_val): lst.extend(np.array(marriage_related[i])[:,j]) # casting to np array so that indexing can be easier # the others can be listed below (work_val, ..., age_val) # ^ which means this loop will be 5x the amount of code as above :) marriage_related_df = {'survey_id': sids} for i, el in enumerate(df['marriage_related'][0][0].keys()): marriage_related_df[el] = marr_val[i] pd.DataFrame(marriage_related_df)
survey_idobject
ID1994DHS1.5%
ID1997DHS1.5%
197 others97.1%
DM_nvr_marr_pfloat64
2.7 - 76.96
2.710.12617.55224.97799999999999832.40399999999999639.8347.25654.68199999999999562.10869.53399999999999Missing

0

AM2000DHS

26.03

1

AM2000DHS

25.53

2

AM2000DHS

24.85

3

AM2000DHS

24.34

4

AM2000DHS

24.45

5

AM2000DHS

31.69

6

AM2000DHS

28.25

7

AM2000DHS

27.33

8

AM2000DHS

24.89

9

AM2000DHS

23.79

Hosted onDeepnote