CodeReviewBench / leaderboard_data.json
kenkaneki's picture
zalupa5
bf8f34b
raw
history blame contribute delete
978 Bytes
{
"entries": [
{
"model_name": "GPT-4-CodeReview",
"model_type": "LLM",
"mode": "Strict",
"review_model_type": "gpt-4",
"programming_language": "Python",
"comment_language": "en",
"topic": "Code Reliability",
"submission_date": "2024-10-06T12:00:00Z",
"version": "v0",
"readability": 8.5,
"relevance": 9.0,
"explanation_clarity": 7.8,
"problem_identification": 8.2,
"actionability": 8.7,
"completeness": 8.0,
"specificity": 7.5,
"contextual_adequacy": 8.3,
"consistency": 8.8,
"brevity": 7.2,
"pass_at_1": 0.75,
"pass_at_5": 0.88,
"pass_at_10": 0.92,
"bleu_at_10": 0.65,
"total_evaluations": 100
}
],
"last_updated": "2024-10-06T12:00:00Z",
"version": "v0"
}