geoHeil
05/26/2022, 12:46 PMgeoHeil
05/26/2022, 12:47 PMgeoHeil
05/26/2022, 12:53 PMsean
05/26/2022, 12:53 PMgeoHeil
05/26/2022, 12:53 PMgeoHeil
05/26/2022, 12:53 PMsean
05/26/2022, 12:53 PMsean
05/26/2022, 12:54 PMgeoHeil
05/26/2022, 12:54 PMgeoHeil
05/26/2022, 12:54 PMgeoHeil
05/26/2022, 12:54 PMsean
05/26/2022, 12:57 PMgeoHeil
05/26/2022, 12:57 PMgeoHeil
05/26/2022, 12:58 PMsean
05/26/2022, 12:58 PMJSON.parse(JSON.stringify({ [""]: "" }))
geoHeil
05/26/2022, 12:59 PMgeoHeil
05/26/2022, 1:02 PMimport pandas as pd
# Minimal reproduction: derive per-column metadata from a DataFrame and nest it
# inside a plain dict.
df = pd.DataFrame({'foo':[1,2,3], 'bar':[4,5,6]})
# One row per column of df (indexed by column name), holding that column's
# dtype rendered as a string in a single 'dtype' column.
m_derived = df.dtypes.astype('str').rename('dtype').to_frame()
d_c = 'description'
# First write to the 'description' column: only the 'foo' row gets a value, so
# every other row is left as NaN in that column.
m_derived.loc['foo', d_c] = 'Foo description'
# notice bar is missing accidentally
# The label '' is not a column of df, so this assignment adds a new row keyed by
# the empty string; that row has no dtype value (NaN).
m_derived.loc['', d_c] = ''
# NOTE(review): `display` is not defined in this snippet; presumably the
# IPython/Jupyter rich-display helper -- confirm the execution environment.
display(m_derived)
# Move the index into a regular column named 'column_name' and convert the
# frame to a list of dicts, one dict per row.
column_details = m_derived.reset_index().rename(columns={'index':'column_name'}).to_dict(orient='records')
# Bare expression: has no effect in a script; presumably echoed as cell output
# in a notebook.
column_details
# Nested dict carrying the per-column records; NaN cells from m_derived are
# passed through unchanged.
m_res = {
'source_upstream':{
'name':'my_dummy_name',
'column_details': column_details,
},
}
# Bare expression, as above.
m_res
{'source_upstream': {'name': 'my_dummy_name',
'column_details': [{'column_name': 'foo',
'dtype': 'int64',
'description': 'Foo description'},
{'column_name': 'bar', 'dtype': 'int64', 'description': nan},
{'column_name': '', 'dtype': nan, 'description': ''}]}}
geoHeil
05/26/2022, 1:02 PMsean
05/26/2022, 1:02 PMgeoHeil
05/26/2022, 1:02 PMm_res
sean
05/26/2022, 1:04 PMgeoHeil
05/26/2022, 1:04 PMsean
05/26/2022, 1:06 PMsean
05/26/2022, 1:07 PMDagster Bot
05/26/2022, 1:07 PM