@@ -71,6 +71,8 @@ def __init__(self, chat_data: pd.DataFrame,
71
71
self .convo_aggregation = convo_aggregation
72
72
self .convo_methods = convo_methods
73
73
self .user_aggregation = user_aggregation
74
+ self .user_methods = user_methods
75
+ self .user_columns = user_columns
74
76
# Denotes the columns that can be summarized from the chat level, onto the conversation level.
75
77
self .input_columns = list (input_columns )
76
78
if 'conversation_num' not in self .input_columns :
@@ -177,7 +179,7 @@ def get_conversation_level_aggregates(self) -> None:
177
179
if 'mean' in self .convo_methods :
178
180
self .conv_data = pd .merge (
179
181
left = self .conv_data ,
180
- right = get_average (self .chat_data .copy (), column , 'average_ ' + column , self .conversation_id_col ),
182
+ right = get_mean (self .chat_data .copy (), column , 'mean_ ' + column , self .conversation_id_col ),
181
183
on = [self .conversation_id_col ],
182
184
how = "inner"
183
185
)
@@ -247,7 +249,7 @@ def get_user_level_aggregates(self) -> None:
247
249
# Average/Mean of User-Level Feature
248
250
self .conv_data = pd .merge (
249
251
left = self .conv_data ,
250
- right = get_average (self .user_data .copy (), user_method + "_" + user_column , 'average_user_' + user_method + "_" + user_column , self .conversation_id_col ),
252
+ right = get_mean (self .user_data .copy (), user_method + "_" + user_column , "mean_user_" + user_method + "_" + user_column , self .conversation_id_col ),
251
253
on = [self .conversation_id_col ],
252
254
how = "inner"
253
255
)
@@ -269,7 +271,7 @@ def get_user_level_aggregates(self) -> None:
269
271
# Minima of User-Level Feature
270
272
self .conv_data = pd .merge (
271
273
left = self .conv_data ,
272
- right = get_min (self .user_data .copy (), user_method + "_" + user_column , 'min_user_sum_ ' + user_method + "_" + user_column , self .conversation_id_col ),
274
+ right = get_min (self .user_data .copy (), user_method + "_" + user_column , 'min_user_ ' + user_method + "_" + user_column , self .conversation_id_col ),
273
275
on = [self .conversation_id_col ],
274
276
how = "inner"
275
277
)
@@ -280,7 +282,7 @@ def get_user_level_aggregates(self) -> None:
280
282
# Maxima of User-Level Feature
281
283
self .conv_data = pd .merge (
282
284
left = self .conv_data ,
283
- right = get_max (self .user_data .copy (), user_method + "_" + user_column , 'max_user_sum_ ' + user_method + "_" + user_column , self .conversation_id_col ),
285
+ right = get_max (self .user_data .copy (), user_method + "_" + user_column , 'max_user_ ' + user_method + "_" + user_column , self .conversation_id_col ),
284
286
on = [self .conversation_id_col ],
285
287
how = "inner"
286
288
)
@@ -335,14 +337,14 @@ def get_user_level_aggregates(self) -> None:
335
337
# how="inner"
336
338
# )
337
339
338
- # Average Columns were created using self.get_user_level_averaged_features ()
340
+ # Mean columns (the "mean_"-prefixed user-level features) were created using self.get_user_level_mean_features()
339
341
for column in self .columns_to_summarize :
340
342
341
343
if 'mean' in self .convo_methods :
342
344
# Average/Mean of User-Level Feature
343
345
self .conv_data = pd .merge (
344
346
left = self .conv_data ,
345
- right = get_average (self .user_data .copy (), "average_ " + column , 'average_user_avg_ ' + column , self .conversation_id_col ),
347
+ right = get_mean (self .user_data .copy (), "mean_ " + column , 'mean_user_avg_ ' + column , self .conversation_id_col ),
346
348
on = [self .conversation_id_col ],
347
349
how = "inner"
348
350
)
@@ -351,7 +353,7 @@ def get_user_level_aggregates(self) -> None:
351
353
# Standard Deviation of User-Level Feature
352
354
self .conv_data = pd .merge (
353
355
left = self .conv_data ,
354
- right = get_stdev (self .user_data .copy (), "average_ " + column , 'stdev_user_avg_' + column , self .conversation_id_col ),
356
+ right = get_stdev (self .user_data .copy (), "mean_ " + column , 'stdev_user_avg_' + column , self .conversation_id_col ),
355
357
on = [self .conversation_id_col ],
356
358
how = "inner"
357
359
)
@@ -360,7 +362,7 @@ def get_user_level_aggregates(self) -> None:
360
362
# Minima of User-Level Feature
361
363
self .conv_data = pd .merge (
362
364
left = self .conv_data ,
363
- right = get_min (self .user_data .copy (), "average_ " + column , 'min_user_avg_' + column , self .conversation_id_col ),
365
+ right = get_min (self .user_data .copy (), "mean_ " + column , 'min_user_avg_' + column , self .conversation_id_col ),
364
366
on = [self .conversation_id_col ],
365
367
how = "inner"
366
368
)
@@ -369,7 +371,7 @@ def get_user_level_aggregates(self) -> None:
369
371
# Maxima of User-Level Feature
370
372
self .conv_data = pd .merge (
371
373
left = self .conv_data ,
372
- right = get_max (self .user_data .copy (), "average_ " + column , 'max_user_avg_' + column , self .conversation_id_col ),
374
+ right = get_max (self .user_data .copy (), "mean_ " + column , 'max_user_avg_' + column , self .conversation_id_col ),
373
375
on = [self .conversation_id_col ],
374
376
how = "inner"
375
377
)
0 commit comments