-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathquickstart.sh
More file actions
executable file
·78 lines (66 loc) · 1.96 KB
/
quickstart.sh
File metadata and controls
executable file
·78 lines (66 loc) · 1.96 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
#!/bin/bash
# VANTA Research Reasoning Evaluation (VRRE) - Quick Start Script
#
# Print the two-line quick-start banner (title followed by a rule).
printf '%s\n' \
  "VANTA Research Reasoning Evaluation (VRRE) Quick Start" \
  "========================================================="
# Verify the Python toolchain and install the project's requirements.
# Every failure aborts with exit status 1; diagnostics go to stderr so they
# remain visible when stdout is redirected.

# Check if Python 3 is available
if ! command -v python3 >/dev/null 2>&1; then
  echo "❌ Python 3 is required but not found. Please install Python 3." >&2
  exit 1
fi

# Check if pip is available
if ! command -v pip3 >/dev/null 2>&1; then
  echo "❌ pip3 is required but not found. Please install pip." >&2
  exit 1
fi

# requirements.txt is looked up relative to the current working directory,
# so fail with a clear message instead of letting pip report a bare path error.
if [[ ! -f requirements.txt ]]; then
  echo "❌ requirements.txt not found in $(pwd). Run this script from the directory that contains it." >&2
  exit 1
fi

# Install requirements
echo "📦 Installing requirements..."
# Stop when installation fails: continuing would only defer the failure to
# the evaluation step, where it shows up as a less obvious error.
if ! pip3 install -r requirements.txt; then
  echo "❌ Failed to install requirements. See the pip output above." >&2
  exit 1
fi
# Check if Ollama is running by probing its local HTTP API.
# Exits with status 1 (diagnostics on stderr) when the probe cannot succeed.

# Without curl the probe below would fail and be misreported as
# "Ollama is not running", so report the missing tool explicitly.
if ! command -v curl >/dev/null 2>&1; then
  echo "❌ curl is required to check Ollama but was not found. Please install curl." >&2
  exit 1
fi

# -s: no progress output; -f: HTTP error responses count as failure;
# the timeouts keep the script from hanging on an unresponsive port.
if ! curl -sf --connect-timeout 5 --max-time 10 \
  http://localhost:11434/api/tags >/dev/null 2>&1; then
  echo "❌ Ollama is not running. Please start Ollama first:" >&2
  echo " ollama serve" >&2
  exit 1
fi
echo "✅ Ollama is running"
# Print a blank line and a heading, then at most the first ten lines of
# the `ollama list` output.
printf '\n%s\n' "📋 Available Ollama models:"
ollama list | head -n 10
# Interactive menu: ask which evaluation to run, dispatch to the matching
# Python command, then report the outcome.
#
# Exit status: 0 when the dispatched command succeeds; otherwise the
# command's own exit status, or 1 when a required model name was not entered.
echo ""
echo "🔬 Choose an evaluation to run:"
echo "1. Basic evaluation (single model)"
echo "2. Comparative evaluation (multiple models)"
echo "3. Custom tasks example"
echo "4. Run examples"
echo "5. Command line interface"

# -r keeps backslashes in the typed input literal.
read -r -p "Enter choice (1-5): " choice

status=0         # exit status of the dispatched Python command
ran_evaluation=1 # cleared for choices that only print usage information

case "$choice" in
  1)
    read -r -p "Enter model name: " model_name
    if [[ -z "$model_name" ]]; then
      echo "❌ No model name entered." >&2
      exit 1
    fi
    python3 vrre_eval.py --models "$model_name" || status=$?
    ;;
  2)
    # Read into an array so each model becomes exactly one argument and
    # characters such as '*' are never expanded as globs.
    read -r -p "Enter model names (space separated): " -a models
    if (( ${#models[@]} == 0 )); then
      echo "❌ No model names entered." >&2
      exit 1
    fi
    python3 vrre_eval.py --models "${models[@]}" --compare || status=$?
    ;;
  3 | 4)
    # NOTE(review): "Custom tasks example" and "Run examples" both launch
    # examples.py, exactly as before — confirm that this is intended.
    python3 examples.py || status=$?
    ;;
  5)
    echo "Command line usage:"
    python3 vrre_eval.py --help || status=$?
    ran_evaluation=0
    ;;
  *)
    echo "Invalid choice. Running basic example..."
    python3 vrre_eval.py || status=$?
    ;;
esac

# Do not claim success when the Python command failed; hand its status on
# to whoever invoked this script.
if (( status != 0 )); then
  echo "" >&2
  echo "❌ Command failed with exit status ${status}." >&2
  exit "$status"
fi

echo ""
if (( ran_evaluation )); then
  echo "✅ Evaluation complete!"
  echo ""
  echo "📄 Check the generated JSON files for detailed results"
fi
echo "🔬 Modify vrre_eval.py to add custom tasks"
echo "📊 Use examples.py as a template for your own evaluations"