restructure library, deprecate challenges (#336)
Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> Co-authored-by: Merwane Hamadi <merwanehamadi@gmail.com>pull/5155/head
parent
b263cab511
commit
b6ad300eda
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngUrlShortener",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Create a URL shortener app using HTML, CSS, JavaScript, and a backend language like Python or Node.js. Allow users to input a long URL and generate a shortened version that redirects to the original URL. Store the shortened URLs in a database.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "",
|
|
||||||
"should_contain": [],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngCurrencyConverter",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Build a currency converter app using an API for exchange rates. Use HTML, CSS, and JavaScript for the frontend and Node.js for the backend. Allow users to convert between different currencies.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "Tries converting three different currencies which should match the API set up in test.py",
|
|
||||||
"should_contain": ["True", "True", "True"],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "Converts currency by calling an API and returning the result.",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,25 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngFileExplorer",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Create a file organizer CLI tool in Python that sorts files in a directory based on their file types (e.g., images, documents, audio) and moves them into corresponding folders.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "Given a directory with audio files, images, and txt files, it should sort them into folders.",
|
|
||||||
"should_contain": [
|
|
||||||
"Audio sorted correctly",
|
|
||||||
"Images sorted correctly",
|
|
||||||
".txt files sorted correctly"
|
|
||||||
],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "Testing the creation of a file organizer CLI tool",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngFileOrganizer",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Build a currency converter app using an API for exchange rates. Use HTML, CSS, and JavaScript for the frontend and Node.js for the backend. Allow users to convert between different currencies.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "Tries converting three different currencies which should match the API set up in test.py",
|
|
||||||
"should_contain": ["True", "True", "True"],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "Converts currency by calling an API and returning the result.",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngImageResizer",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Create a CLI tool in Python that allows users to resize images by specifying the desired width and height. Use the Pillow library for image manipulation.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "Takes two image files img1.jpg and img2.png and checks if they have been resized correctly",
|
|
||||||
"should_contain": ["1280*1280", "640*640"],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "Asks to build CLI tool that resizes images to a specified width and height.",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngMarkdownEditor",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Build a simple markdown editor using HTML, CSS, and JavaScript. Allow users to input markdown text and display the formatted output in real-time.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "",
|
|
||||||
"should_contain": [],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,23 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngPassGen",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Create a password generator CLI tool in Python that generates strong, random passwords based on user-specified criteria, such as length and character types (letters, numbers, symbols).",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "Does the following password fulfill the requirements of the user?",
|
|
||||||
"should_contain": [],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "llm",
|
|
||||||
"scoring": "binary",
|
|
||||||
"template": "question"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "Test.py will get content in the format of 1) Length: 10 2) Character types: letters, numbers, symbols 3) Password: 1a2b3c4d5e which the llm will score.",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngPomodoro",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Develop a Pomodoro timer app using HTML, CSS, and JavaScript. Allow users to set work and break intervals and receive notifications when it's time to switch.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "",
|
|
||||||
"should_contain": [],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngTimerApp",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Create a simple timer app using HTML, CSS, and JavaScript that allows users to set a countdown timer and receive an alert when the time is up.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "",
|
|
||||||
"should_contain": [],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
|
@ -1,21 +0,0 @@
|
||||||
{
|
|
||||||
"name": "TestEngTodoList",
|
|
||||||
"category": ["code"],
|
|
||||||
"task": "Create a simple to-do list app using HTML, CSS, and JavaScript. Store tasks in local storage and allow users to add, edit, and delete tasks.",
|
|
||||||
"dependencies": ["TestReturnCode_Simple"],
|
|
||||||
"cutoff": 90,
|
|
||||||
"ground": {
|
|
||||||
"answer": "",
|
|
||||||
"should_contain": [],
|
|
||||||
"should_not_contain": [],
|
|
||||||
"files": ["test.py"],
|
|
||||||
"eval": {
|
|
||||||
"type": "python"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"info": {
|
|
||||||
"difficulty": "advanced",
|
|
||||||
"description": "",
|
|
||||||
"side_effects": []
|
|
||||||
}
|
|
||||||
}
|
|
Some files were not shown because too many files have changed in this diff Show More
Loading…
Reference in New Issue