{"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-aime_evaluation", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "All answers are integers ranging from 000 to 999, inclusive. Please format your answer as a string with three digits.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "All answers are integers ranging from 000 to 999, inclusive. Please format your answer as a string with three digits.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-aime_evaluation", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.includes(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-aime_evaluation", "type": "vis", "data": {"input": "eval-aime_evaluation"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-aime_evaluation", "type": "inspect", "data": {"input": "prompt-aime_evaluation"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-aime_evaluation", "type": "table", "data": {"rows": [{"prompt": "Find the sum of all positive two-digit integers that are divisible by each of their digits.", "ideal": "630"}, {"prompt": "A fair die is rolled 
four times. The probability that each of the final three rolls is at least as large as the roll preceding it may be expressed in the form m/n, where m and n are relatively prime positive integers. Find m + n.", "ideal": "079"}, {"prompt": "A sphere is inscribed in the tetrahedron whose vertices are A = (6, 0, 0), B = (0, 4, 0), C = (0, 0, 2), and D = (0, 0, 0). The radius of the sphere is m / n, where m and n are relatively prime positive integers. Find m + n.", "ideal": "005"}, {"prompt": "A mail carrier delivers mail to the nineteen houses on the east side of Elm Street. The carrier notices that no two adjacent houses ever get mail on the same day, but that there are never more than two houses in a row that get no mail on the same day. How many different patterns of mail delivery are possible?", "ideal": "351"}, {"prompt": "The numbers 1, 2, 3, 4, 5, 6, 7, and 8 are randomly written on the faces of a regular octahedron so that each face contains a different number. The probability that no two consecutive numbers, where 8 and 1 are considered to be consecutive, are written on faces that share an edge is m/n, where m and n are relatively prime positive integers. Find m + n.", "ideal": "085"}, {"prompt": "Let N be the largest positive integer with the following property: reading from left to right, each pair of consecutive digits of N forms a perfect square. What are the leftmost three digits of N?", "ideal": "816"}, {"prompt": "Each of the 2001 students at a high school studies either Spanish or French, and some study both. The number who study Spanish is between 80 percent and 85 percent of the school population, and the number who study French is between 30 percent and 40 percent. Let m be the smallest number of students who could study both languages, and let M be the largest number of students who could study both languages. 
Find M-m.", "ideal": "298"}, {"prompt": "A set of positive numbers has the 'triangle-property' if it has three distinct elements that are the lengths of the sides of a triangle whose area is positive. Consider sets {4, 5, 6, ..., n} of consecutive positive integers, all of whose ten-element subsets have the triangle property. What is the largest possible value of n?", "ideal": "253"}, {"prompt": "Each unit square of a 3-by-3 unit-square grid is to be colored either blue or red. For each square, either color is equally likely to be used. The probability of obtaining a grid that does not have a 2-by-2 red square is m/n, where m and n are relatively prime positive integers. Find m + n.", "ideal": "929"}, {"prompt": "Given that x and y are both integers between 100 and 999, inclusive; y is the number formed by reversing the digits of x; and z=|x-y|. How many distinct values of z are possible?", "ideal": "009"}, {"prompt": "A straight river that is 264 meters wide flows from west to east at a rate of 14 meters per minute. Melanie and Sherry sit on the south bank of the river with Melanie a distance of D meters downstream from Sherry. Relative to the water, Melanie swims at 80 meters per minute, and Sherry swims at 60 meters per minute. At the same time, Melanie and Sherry begin swimming in straight lines to a point on the north bank of the river that is equidistant from their starting positions. The two women arrive at this point simultaneously. Find D.", "ideal": "550"}, {"prompt": "Adults made up 5/12 of the crowd of people at a concert. After a bus carrying 50 more people arrived, adults made up 11/25 of the people at the concert. Find the minimum number of adults who could have been at the concert after the bus arrived.", "ideal": "154"}, {"prompt": "A right square pyramid with volume 54 has a base with side length 6. The five vertices of the pyramid all lie on a sphere with radius m/n, where m and n are relatively prime positive integers. 
Find m+n.", "ideal": "021"}, {"prompt": "Twenty distinct points are marked on a circle and labeled 1 through 20 in clockwise order. A line segment is drawn between every pair of points whose labels differ by a prime number. Find the number of triangles formed whose vertices are among the original 20 points.", "ideal": "072"}, {"prompt": "A circle with radius 6 is externally tangent to a circle with radius 24. Find the area of the triangular region bounded by the three common tangent lines of these two circles.", "ideal": "192"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-aime_evaluation", "sourceHandle": "prompt", "target": "eval-aime_evaluation", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-aime_evaluation", "sourceHandle": "prompt", "target": "inspect-aime_evaluation", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-aime_evaluation", "sourceHandle": "output", "target": "vis-aime_evaluation", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-aime_evaluation", "sourceHandle": "Prompt", "target": "prompt-aime_evaluation", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": 
{"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}