# Command steps for the agi-hackathon repository.
#
# Each step originally began with its own `cd agi-hackathon`, i.e. each one
# expects to start from the directory that CONTAINS the checkout. Every step
# therefore runs in its own subshell: the directory change stays local to that
# step and the next step starts from the same parent directory again.
#
# NOTE(review): the original text had the next step's `cd agi-hackathon` fused
# onto the end of the preceding command (e.g. `--track thlpcd agi-hackathon`).
# The track names `thlp` and `all` below are reconstructed from that fused
# text -- confirm against the options scripts/test_single.py and
# scripts/evaluate.py actually accept.

# Step 1: run the single-track test for the `thlp` track.
(
  cd agi-hackathon || exit 1
  python3 scripts/test_single.py --track thlp
)

# Step 2: install dependencies, then evaluate across all tracks.
(
  cd agi-hackathon || exit 1
  # Install dependencies
  pip install -r requirements.txt
  # Run evaluation
  python3 scripts/evaluate.py --model claude --track all
)

# Step 3: run the data download script.
(
  cd agi-hackathon || exit 1
  bash scripts/download_data.sh
)

# Step 4: repair the Kaggle datasets.
(
  cd agi-hackathon || exit 1
  # Fix multiline choices in TTM and TSCP
  python3 scripts/fix_kaggle_datasets.py
)
# Then manually update About descriptions on Kaggle
# Visit: https://www.kaggle.com/datasets/playra/trinity-cognitive-probes-<track>/edit
#
# Status:
#   ✅ Repository structure created
#   ✅ Test scripts implemented
#   ✅ Kaggle fix scripts created
#   ✅ Evaluation prompts documented
# See README.md for details on Kaggle dataset issues.