CodeReviewBench

Sleeping

CodeReviewBench / leaderboard_data.json

zalupa5

bf8f34b 6 months ago

978 Bytes

	{
	"entries": [
	{
	"model_name": "GPT-4-CodeReview",
	"model_type": "LLM",
	"mode": "Strict",
	"review_model_type": "gpt-4",
	"programming_language": "Python",
	"comment_language": "en",
	"topic": "Code Reliability",
	"submission_date": "2024-10-06T12:00:00Z",
	"version": "v0",
	"readability": 8.5,
	"relevance": 9.0,
	"explanation_clarity": 7.8,
	"problem_identification": 8.2,
	"actionability": 8.7,
	"completeness": 8.0,
	"specificity": 7.5,
	"contextual_adequacy": 8.3,
	"consistency": 8.8,
	"brevity": 7.2,
	"pass_at_1": 0.75,
	"pass_at_5": 0.88,
	"pass_at_10": 0.92,
	"bleu_at_10": 0.65,
	"total_evaluations": 100
	}
	],
	"last_updated": "2024-10-06T12:00:00Z",
	"version": "v0"
	}