A comparative evaluation of Random Forest (RF) and Isolation Forest (IF) on CICIDS2017 flows.
- data/ # cleaned CSV
- src/
  - preprocess.py # combines & scales raw CSVs
  - train_models.py # trains & evaluates RF and IF
# Clone the repository and enter its root directory.
# The remaining steps use paths relative to this directory
# (.venv, archive, data, src/).
git clone https://github.com/Jakebhudson/SIT326-Task-1-HD.git
cd SIT326-Task-1-HD
# 1. Set up a virtualenv in .venv and activate it in the current shell
python3 -m venv .venv
source .venv/bin/activate
# 2. Install dependencies
# Upgrade the packaging tools first, then install the project's packages.
pip install --upgrade pip setuptools wheel
pip install pandas scikit-learn python-dotenv kaggle
# 3. Prepare data
# NOTE(review): `archive` is presumably the extracted dataset download, placed
# in the repository root beforehand — confirm where it comes from.
# NOTE(review): if a data/ directory already exists here, mv moves archive
# inside it (data/archive) instead of renaming it — confirm which layout
# src/preprocess.py expects.
mv archive data
# Combine and scale the raw CSVs.
python src/preprocess.py
# 4. Train & evaluate the Random Forest and Isolation Forest models
python src/train_models.py