Installation

$ python3 -m pip install -r requirements.txt
$ python3 -m ipykernel install --name spark-excercises --user

Prepare Data

# Generating the datasets takes a long time
$ python3 generator.py