Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
23 changes: 23 additions & 0 deletions 01-DepartmentHighestSalary.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
# Problem 1: Department Highest Salary (https://leetcode.com/problems/department-highest-salary/)

import pandas as pd

# solution 1 using groupby and merge
def department_highest_salary(employee: pd.DataFrame, department: pd.DataFrame) -> pd.DataFrame:
max_salary = employee.groupby('departmentId')['salary'].max().reset_index()
result = pd.merge(max_salary, employee)
output = pd.merge(result, department, left_on=['departmentId'], right_on=['id'])
return output[['name_y', 'name_x', 'salary']].rename(columns={'name_y':'Department', 'name_x':'Employee', 'salary':'Salary'})

# solution 2 using transform and merge
def department_highest_salary(employee: pd.DataFrame, department: pd.DataFrame) -> pd.DataFrame:
df = pd.merge(employee, department, left_on='departmentId', right_on='id')
max_salary = df.groupby('departmentId')['salary'].transform('max')
df = df[df['salary']==max_salary]
return df[['name_y', 'name_x', 'salary']].rename(columns={'name_y':'Department', 'name_x':'Employee', 'salary':'Salary'})

"""
Note:
- transform returns a series (it is like partition by in SQL), so it returns the same number of rows as the original DataFrame.
- the default merge is an inner join, so it is fine to omit how='inner', it will only return the rows that have matching values in both DataFrames.
"""
8 changes: 8 additions & 0 deletions 02-RankScores.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# Problem 2: Rank Scores (https://leetcode.com/problems/rank-scores/)

import pandas as pd

# solution 1 using rank
def order_scores(scores: pd.DataFrame) -> pd.DataFrame:
scores['rank'] = scores['score'].rank(method='dense', ascending=False)
return scores[['score', 'rank']].sort_values(by='score', ascending=False)