Official Survey Paper on the Evaluation of Large Language Models
LLM-eval-survey is the official GitHub page for a survey paper on the evaluation of large language models. The project provides a detailed overview of existing evaluation methods and metrics, offering researchers and developers a comprehensive reference framework.
The following is the machine-readable structured data (schema.org JSON-LD) for this agent. AI systems and search engines use it to understand the agent's capabilities.
[
{
"@context": "https://schema.org",
"@type": "SoftwareApplication",
"@id": "https://agentsignals.ai/agents/llm-eval-survey",
"name": "LLM-eval-survey",
"description": "LLM-eval-survey is the official GitHub page for a survey paper on the evaluation of large language models. The project provides a detailed overview of existing evaluation methods and metrics, offering researchers and developers a comprehensive reference framework.",
"url": "https://agentsignals.ai/agents/llm-eval-survey",
"applicationCategory": "Research",
"operatingSystem": "GitHub",
"sameAs": "https://github.com/MLGroupJLU/LLM-eval-survey",
"installUrl": "https://github.com/MLGroupJLU/LLM-eval-survey",
"offers": {
"@type": "Offer",
"price": "0",
"priceCurrency": "USD",
"description": "Free",
"availability": "https://schema.org/InStock"
},
"featureList": [
"Summarize existing evaluation methods",
"Provide a reference framework",
"Promote research progress"
],
"datePublished": "2025-12-05T17:15:45.893894+00:00",
"dateModified": "2025-12-19T05:05:46.090602+00:00",
"publisher": {
"@type": "Organization",
"name": "Agent Signals",
"url": "https://agentsignals.ai"
}
},
{
"@context": "https://schema.org",
"@type": "BreadcrumbList",
"itemListElement": [
{
"@type": "ListItem",
"position": 1,
"name": "Home",
"item": "https://agentsignals.ai"
},
{
"@type": "ListItem",
"position": 2,
"name": "Agents",
"item": "https://agentsignals.ai/agents"
},
{
"@type": "ListItem",
"position": 3,
"name": "LLM-eval-survey",
"item": "https://agentsignals.ai/agents/llm-eval-survey"
}
]
},
{
"@context": "https://schema.org",
"@type": "FAQPage",
"mainEntity": [
{
"@type": "Question",
"name": "What is LLM-eval-survey?",
"acceptedAnswer": {
"@type": "Answer",
"text": "Official Survey Paper on the Evaluation of Large Language Models"
}
},
{
"@type": "Question",
"name": "What features does LLM-eval-survey offer?",
"acceptedAnswer": {
"@type": "Answer",
"text": "Summarize existing evaluation methods, Provide a reference framework, Promote research progress"
}
},
{
"@type": "Question",
"name": "What are the use cases for LLM-eval-survey?",
"acceptedAnswer": {
"@type": "Answer",
"text": "Academic Research, Model Development, Evaluation Tool Development"
}
},
{
"@type": "Question",
"name": "What are the advantages of LLM-eval-survey?",
"acceptedAnswer": {
"@type": "Answer",
"text": "Highly authoritative, Rich resources, Active community"
}
},
{
"@type": "Question",
"name": "What are the limitations of LLM-eval-survey?",
"acceptedAnswer": {
"@type": "Answer",
"text": "Fairly technical content, Unknown update frequency"
}
}
]
}
]