{"flow": {"nodes": [{"width": 312, "height": 311, "id": "prompt-track_objects", "type": "prompt", "data": {"prompt": "{prompt}", "n": 1, "llms": [{"key": "aa3c0f03-22bd-416e-af4d-4bf5c4278c99", "settings": {"system_msg": "Follow the instructions and then answer the question with only one lowercase word.", "temperature": 1, "functions": [], "function_call": "", "top_p": 1, "stop": [], "presence_penalty": 0, "frequency_penalty": 0}, "name": "GPT3.5", "emoji": "\ud83d\ude42", "model": "gpt-3.5-turbo", "base_model": "gpt-3.5-turbo", "temp": 1, "formData": {"shortname": "GPT3.5", "model": "gpt-3.5-turbo", "system_msg": "Follow the instructions and then answer the question with only one lowercase word.", "temperature": 1, "functions": "", "function_call": "", "top_p": 1, "stop": "", "presence_penalty": 0, "frequency_penalty": 0}}]}, "position": {"x": 448, "y": 224}, "selected": false, "positionAbsolute": {"x": 448, "y": 224}, "dragging": false}, {"width": 333, "height": 182, "id": "eval-track_objects", "type": "evaluator", "data": {"code": "function evaluate(response) {\n\tlet ideal = response.meta['Ideal'];\n\treturn response.text.startsWith(ideal);\n}", "language": "javascript"}, "position": {"x": 820, "y": 150}, "positionAbsolute": {"x": 820, "y": 150}}, {"width": 228, "height": 196, "id": "vis-track_objects", "type": "vis", "data": {"input": "eval-track_objects"}, "position": {"x": 1200, "y": 250}, "positionAbsolute": {"x": 1200, "y": 250}}, {"width": 302, "height": 260, "id": "inspect-track_objects", "type": "inspect", "data": {"input": "prompt-track_objects"}, "position": {"x": 820, "y": 400}, "positionAbsolute": {"x": 820, "y": 400}}, {"width": 423, "height": 417, "id": "table-track_objects", "type": "table", "data": {"rows": [{"prompt": "Keep track of the rabbit. A rabbit is on the shelf. Move all objects on the shelf to the ground. Where is the rabbit?", "ideal": "ground"}, {"prompt": "Keep track of the rabbit. A rabbit is on the shelf. A bag is on the ground. Move all objects on the ground to the shelf. Move all objects on the shelf to the ground. Where is the rabbit?", "ideal": "ground"}, {"prompt": "Keep track of the rabbit. A rabbit is on the shelf. A bag is on the ground. Nothing is on the table. Move all objects on the ground to the table. Move all objects on the shelf to the ground. Where is the rabbit?", "ideal": "ground"}, {"prompt": "Keep track of the rabbit. A rabbit is on the shelf. A bag is on the ground. Nothing is on the table. Move all objects on the ground to the table. Move all objects on the shelf to the ground. Move all objects from the ground to the shelf. Where is the rabbit?", "ideal": "shelf"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. A bag is on the ground. A book is on the shelf. Move all objects on the table to the ground. Move all objects on the ground to the table. Where is the rabbit?", "ideal": "table"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. A bag is on the ground. A book is on the shelf. Move all objects on the table to the ground. Move all objects on the ground to the table. Move all items on the shelf to the ground. Where is the rabbit?", "ideal": "table"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. A bag is on the ground. Nothing is on the shelf. Move all items on the ground to the shelf. Move all items on the ground to the table. Move all items on the ground to the shelf. Where is the rabbit?", "ideal": "table"}, {"prompt": "Keep track of the rabbit. Nothing is on the shelf. A rabbit is on the table. A bag is on the ground. Move all items on the ground to the shelf. Move all items on the ground to the table. Move all items on the ground to the shelf. Where is the rabbit?", "ideal": "table"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. Nothing is on the ground. Nothing is on the shelf. Move all items on the table to the shelf. Move all items on the ground to the table. Move all items from the table to the ground. Where is the rabbit?", "ideal": "shelf"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. A bag is on the ground. A book is on the shelf. Move all objects on the table to the ground. Move all items on the ground to the shelf. Move all items from the table to the ground. Move all items from the ground to the table. Where is the rabbit?", "ideal": "shelf"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. A bag is on the ground. A book is on the shelf. Move all objects on the table to the ground. Move all items on the table to the shelf. Move all items on the shelf to the table. Where is the rabbit?", "ideal": "ground"}, {"prompt": "Keep track of the rabbit. A bag is on the ground. A book is on the shelf. A rabbit is on the table. Move all objects on the table to the ground. Move all items on the table to the shelf. Move all items on the shelf to the table. Where is the rabbit?", "ideal": "ground"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. A bag is on the ground. Nothing is on the shelf. Move all items on the table to the shelf. Move all items on the ground to the table. Move all items from the table to the ground. Where is the rabbit?", "ideal": "shelf"}, {"prompt": "Keep track of the rabbit. A bag is on the ground. Nothing is on the shelf. A rabbit is on the table. Move all items on the table to the shelf. Move all items on the ground to the table. Move all items from the table to the ground. Where is the rabbit?", "ideal": "shelf"}, {"prompt": "Keep track of the rabbit. A rabbit is on the table. A bag is on the ground. A book is on the shelf. Move all items on the table to the shelf. Move all items on the ground to the table. Move all items from the table to the ground. Where is the rabbit?", "ideal": "shelf"}], "columns": [{"key": "prompt", "header": "Prompt"}, {"key": "ideal", "header": "Ideal"}]}, "position": {"x": -16, "y": 160}, "selected": false, "positionAbsolute": {"x": -16, "y": 160}, "dragging": false}], "edges": [{"source": "prompt-track_objects", "sourceHandle": "prompt", "target": "eval-track_objects", "targetHandle": "responseBatch", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-eval-1686756357355responseBatch"}, {"source": "prompt-track_objects", "sourceHandle": "prompt", "target": "inspect-track_objects", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-prompt-1686756357355prompt-inspect-1686756357355input"}, {"source": "eval-track_objects", "sourceHandle": "output", "target": "vis-track_objects", "targetHandle": "input", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-eval-1686756357355output-vis-1686756357355input"}, {"source": "table-track_objects", "sourceHandle": "Prompt", "target": "prompt-track_objects", "targetHandle": "prompt", "interactionWidth": 100, "markerEnd": {"type": "arrow", "width": "22px", "height": "22px"}, "id": "reactflow__edge-table-1686756385002Prompt-prompt-1686756357355prompt"}], "viewport": {"x": 144, "y": 37, "zoom": 1}}, "cache": {"eval-1686756357355.json": {}, "inspect-1686756357355.json": {}, "prompt-1686756357355.json": {}, "table-1686756385002.json": {}, "vis-1686756357355.json": {}}}