import pandas as pd


# --- problem1.py ---
def article_views(views: pd.DataFrame) -> pd.DataFrame:
    """Return the ids of authors who viewed at least one of their own articles.

    A row counts as a self-view when its ``author_id`` equals its
    ``viewer_id``. Each such author is reported once, in a single column
    named ``id``, ordered by ascending id. The original row labels of the
    first matching row per author are kept as the index.
    """
    is_self_view = views["author_id"] == views["viewer_id"]
    self_viewers = views.loc[is_self_view, ["author_id"]]
    # Only one column remains, so a plain drop_duplicates keeps the first
    # row per author.
    distinct_authors = self_viewers.drop_duplicates()
    renamed = distinct_authors.rename(columns={"author_id": "id"})
    return renamed.sort_values(by="id")


# --- problem2.py ---
def invalid_tweets(tweets: pd.DataFrame) -> pd.DataFrame:
    """Return the ``tweet_id`` of every tweet whose content is too long.

    A tweet is selected when the length of its ``content`` is strictly
    greater than 15 characters. The result is a one-column frame that keeps
    the original row labels.
    """
    content_length = tweets["content"].str.len()
    too_long = content_length > 15
    return tweets.loc[too_long, ["tweet_id"]]