# Provenance: reconstructed from git patch c5c3e323d5f6d051d3c4844a65f09b7e0a3281c9
# ("Done Pandas10", Ravikanth Karra, Mon, 9 Sep 2024 15:24:39 -0400).
# The patch added three separate files, whose contents are gathered here:
#   1050Actors&Directors.py        -> actors_and_directors
#   1484GroupSoldProductsByDate.py -> categorize_products
#   1693DailyLeadsPartners.py      -> daily_leads_and_partners

import pandas as pd


def actors_and_directors(
    actor_director: pd.DataFrame, min_count: int = 3
) -> pd.DataFrame:
    """Return the (actor_id, director_id) pairs that appear often enough.

    Rows of *actor_director* are counted per ``(actor_id, director_id)``
    pair, and only pairs occurring in at least *min_count* rows are kept.

    Args:
        actor_director: Frame with ``actor_id`` and ``director_id`` columns.
        min_count: Minimum number of rows a pair needs to be returned.
            The default of 3 matches the original ``cnt > 2`` filter.

    Returns:
        A frame with the columns ``actor_id`` and ``director_id`` only.
        Row labels come from the intermediate per-pair count table and
        are not renumbered after filtering.
    """
    pair_counts = (
        actor_director.groupby(["actor_id", "director_id"])
        .size()
        .reset_index(name="cnt")
    )
    frequent = pair_counts[pair_counts["cnt"] >= min_count]
    return frequent[["actor_id", "director_id"]]


def _join_distinct_products(products: pd.Series) -> str:
    """Return the distinct non-missing values of *products*, sorted and comma-joined."""
    # Missing values are dropped so this column agrees with ``nunique``
    # (which ignores them) and so ``sorted``/``join`` never see a
    # non-string placeholder such as None/NaN.
    return ",".join(sorted(products.dropna().unique()))


def categorize_products(activities: pd.DataFrame) -> pd.DataFrame:
    """Summarise the distinct products per ``sell_date``.

    Args:
        activities: Frame with ``sell_date`` and ``product`` columns.

    Returns:
        One row per ``sell_date`` (in groupby's default sorted key order)
        with the columns ``sell_date``, ``num_sold`` (number of distinct
        non-missing products) and ``products`` (those product names in
        sorted order, joined with commas).
    """
    return (
        activities.groupby("sell_date")
        .agg(
            num_sold=("product", "nunique"),
            products=("product", _join_distinct_products),
        )
        .reset_index()
    )


def daily_leads_and_partners(daily_sales: pd.DataFrame) -> pd.DataFrame:
    """Count distinct leads and partners per ``(date_id, make_name)``.

    Args:
        daily_sales: Frame with ``date_id``, ``make_name``, ``lead_id``
            and ``partner_id`` columns.

    Returns:
        One row per ``(date_id, make_name)`` pair with the columns
        ``date_id``, ``make_name``, ``unique_leads`` and
        ``unique_partners``.
    """
    per_day_and_make = daily_sales.groupby(["date_id", "make_name"])
    return per_day_and_make.agg(
        unique_leads=("lead_id", "nunique"),
        unique_partners=("partner_id", "nunique"),
    ).reset_index()