@@ -15,7 +15,7 @@ def create_upload_dict(df:pandas.core.frame.DataFrame, lb_client:Client, base_cl
15
15
row_data_col : Required (str) - Column containing asset URL or file path
16
16
global_key_col : Optional (str) - Column name containing the data row global key - defaults to row data
17
17
external_id_col : Optional (str) - Column name containing the data row external ID - defaults to global key
18
- metadata_index : Optional (dict) - Dictionary where {key=column_name : value=metadata_type} - metadata_type = "enum", "string", "datetime" or "number"
18
+ metadata_index : Optional (dict) - Dictionary where {key=column_name : value=metadata_type}
19
19
local_files : Optional (bool) - If True, will create urls for local files; if False, uploads `row_data_col` as urls
20
20
divider : Optional (str) - String delimiter for all name keys generated
21
21
verbose : Optional (bool) - If True, prints information about code execution
@@ -30,14 +30,17 @@ def create_upload_dict(df:pandas.core.frame.DataFrame, lb_client:Client, base_cl
30
30
external_id_col = external_id_col if external_id_col else global_key_col
31
31
metadata_schema_to_name_key = base_client .get_metadata_schema_to_name_key (lb_mdo = False , divider = divider , invert = False )
32
32
metadata_name_key_to_schema = base_client .get_metadata_schema_to_name_key (lb_mdo = False , divider = divider , invert = True )
33
- global_key_to_upload_dict = {}
34
33
with ThreadPoolExecutor (max_workers = 8 ) as exc :
34
+ global_key_to_upload_dict = {}
35
35
errors = []
36
36
futures = []
37
37
if verbose :
38
38
print (f'Submitting data rows...' )
39
39
for index , row in df .iterrows ():
40
- futures .append (exc .submit (create_data_rows , lb_client , base_client , row , metadata_name_key_to_schema , metadata_schema_to_name_key , row_data_col , global_key_col , external_id_col , metadata_index , local_files , divider ))
40
+ futures .append (exc .submit (
41
+ create_data_rows , lb_client , base_client , row , metadata_name_key_to_schema , metadata_schema_to_name_key ,
42
+ row_data_col , global_key_col , external_id_col , metadata_index , local_files , divider
43
+ ))
41
44
if verbose :
42
45
print (f'Processing data rows...' )
43
46
for f in tqdm (as_completed (futures )):
@@ -68,9 +71,9 @@ def create_data_rows(lb_client:Client, base_client:baseClient, row:pandas.core.s
68
71
metadata_name_key_to_schema : Required (dict) - Dictionary where {key=metadata_field_name_key : value=metadata_schema_id}
69
72
metadata_schema_to_name_key : Required (dict) - Inverse of metadata_name_key_to_schema
70
73
row_data_col : Required (str) - Column containing asset URL or file path
71
- global_key_col : Optional (str) - Column name containing the data row global key - defaults to row data
72
- external_id_col : Optional (str) - Column name containing the data row external ID - defaults to global key
73
- metadata_index : Optional (dict) - Dictionary where {key=column_name : value=metadata_type} - metadata_type = "enum", "string", "datetime" or "number"
74
+ global_key_col : Optional (str) - Column name containing the data row global key
75
+ external_id_col : Optional (str) - Column name containing the data row external ID
76
+ metadata_index : Optional (dict) - Dictionary where {key=column_name : value=metadata_type}
74
77
local_files : Optional (bool) - If True, will create urls for local files; if False, uploads `row_data_col` as urls
75
78
divider : Optional (str) - String delimiter for all name keys generated
76
79
Returns:
0 commit comments