Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
37 changes: 37 additions & 0 deletions main.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
import numpy as np
import pandas as pd


def calculate_mismatches_between_profession_and_qualification(data):
    """Count the rows whose job title and qualification do not match.

    A row is a mismatch when ``check_substring`` reports no match in either
    direction (job title against qualification, and qualification against
    job title).

    Args:
        data: Object indexable by ``"jobTitle"`` and ``"qualification"``,
            each yielding an iterable of strings. The two iterables are
            walked in lockstep.

    Returns:
        The number of mismatching rows as an ``int``.
    """
    pairs = zip(data["jobTitle"], data['qualification'])
    return sum(
        1
        for title, degree in pairs
        # A single hit in either direction is enough to treat the row as matching.
        if not (check_substring(title, degree) or check_substring(degree, title))
    )


def check_substring(substring, string) -> bool:
    """Tell whether any word of ``substring`` occurs inside ``string``.

    ``substring`` is split into whitespace-separated words, and each word is
    looked up in ``string`` with a plain substring test (so the word
    "engineer" is found inside "engineering").

    Args:
        substring: Text whose individual words are searched for.
        string: Text that is searched.

    Returns:
        ``True`` if at least one word of ``substring`` is contained in
        ``string``; ``False`` otherwise, including when ``substring`` is
        empty or consists only of whitespace.
    """
    # split() without an argument discards empty tokens. split(' ') would
    # produce '' for empty input and for leading, trailing or repeated
    # spaces, and '' is contained in every string, which forced a match.
    return any(word in string for word in substring.split())


def get_profession_top_by_parameter(data, profession, first_parameter, second_parameter, top_n=5):
    """Return the most frequent ``second_parameter`` values for a profession.

    Rows are selected when their ``first_parameter`` value contains
    ``profession`` as a literal substring; the ``second_parameter`` values of
    those rows are then counted.

    Args:
        data: pandas DataFrame holding both columns.
        profession: Text to look for; matched literally, not as a regex.
        first_parameter: Name of the string column that is searched.
        second_parameter: Name of the column whose values are counted.
        top_n: How many of the most frequent values to return (default 5).

    Returns:
        A pandas Series mapping each value to its count, ordered from the
        most to the least frequent and limited to ``top_n`` entries.
    """
    # regex=False keeps names such as "c++" or "1.5" from being interpreted
    # as patterns; na=False turns missing cells into "no match" so the mask
    # stays purely boolean and can be used for row selection.
    matches = data[first_parameter].str.contains(profession, regex=False, na=False)
    workers = data[matches]
    return workers[second_parameter].value_counts().head(top_n)


# Load the dataset and discard every row that has at least one missing value.
works = pd.read_csv('works.csv').dropna()

# Lower-cased, all-string copy of the data so text comparisons ignore case.
# DataFrame.apply hands the lambda one column at a time.
works_lower = works.apply(lambda column: column.astype(str).str.lower())

# Mismatch count, followed by the total number of rows kept after dropna().
count_mismatches = calculate_mismatches_between_profession_and_qualification(
    works_lower
)
print(count_mismatches)
print(len(works))

# Most common qualifications among rows whose job title mentions "менеджер".
managers_top = get_profession_top_by_parameter(
    works_lower, "менеджер", "jobTitle", "qualification"
)
print(managers_top)

# Most common job titles among rows whose qualification mentions "инженер".
engineers_top = get_profession_top_by_parameter(
    works_lower, "инженер", "qualification", "jobTitle"
)
print(engineers_top)
24 changes: 24 additions & 0 deletions report.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
# Анализ данных

### 1. Количество несовпадений профессий и квалификаций.
Всего 1068 человек, у 794 из которых обнаружено несовпадение.

### 2. Топ-5 образований для менеджеров.

|Образование|Количество|
|---|---|
|бакалавр|11|
|менеджер|10|
|специалист|6|
|экономист|6|
|экономист-менеджер|4|

### 3. Топ-5 работ для инженеров.

|Работа|Количество|
|---|---|
|заместитель директора|3|
|главный инженер|3|
|ведущий инженер-конструктор|2|
|инженер лесопользования|2|
|директор|2|