| model,avg_score,rank | |
| gpt4o,8.9,1 | |
| claude,8.7,2 | |
| gemma3,8.7,2 | |
| llama3,8.6,4 | |
| al_luna,8.5,5 | |
| llamasupport,8.4,6 | |
| mistral,8.3,7 | |
| phi4,7.3,8 | |
| mental_llama2,6.5,9 | |
| model,avg_score,rank | |
| gpt4o,8.9,1 | |
| claude,8.7,2 | |
| gemma3,8.7,2 | |
| llama3,8.6,4 | |
| al_luna,8.5,5 | |
| llamasupport,8.4,6 | |
| mistral,8.3,7 | |
| phi4,7.3,8 | |
| mental_llama2,6.5,9 | |