|
39 | 39 | "name": "stderr", |
40 | 40 | "output_type": "stream", |
41 | 41 | "text": [ |
42 | | - "\u001b[32m2025-11-03 22:12:09.413\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.dataset_manager\u001b[0m:\u001b[36mvalidate_dataset\u001b[0m:\u001b[36m212\u001b[0m - \u001b[34m\u001b[1mDataset validation passed: /Users/aadam/workspace/JaxARC/data/MiniARC\u001b[0m\n", |
43 | | - "\u001b[32m2025-11-03 22:12:09.414\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.dataset_manager\u001b[0m:\u001b[36mensure_dataset_available\u001b[0m:\u001b[36m81\u001b[0m - \u001b[34m\u001b[1mDataset 'MiniARC' found at /Users/aadam/workspace/JaxARC/data/MiniARC\u001b[0m\n", |
44 | | - "\u001b[32m2025-11-03 22:12:09.417\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_validate_grid_constraints\u001b[0m:\u001b[36m104\u001b[0m - \u001b[1mMiniARC parser configured with optimal 5x5 grid constraints\u001b[0m\n", |
45 | | - "\u001b[32m2025-11-03 22:12:09.419\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_scan_available_tasks\u001b[0m:\u001b[36m131\u001b[0m - \u001b[1mFound 149 tasks in MiniARC dataset (lazy loading - tasks loaded on-demand, optimized for 5x5 grids)\u001b[0m\n", |
46 | | - "\u001b[32m2025-11-03 22:12:09.420\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_load_task_from_disk\u001b[0m:\u001b[36m171\u001b[0m - \u001b[34m\u001b[1mLoaded MiniARC task 'Most_Common_color_l6ab0lf3xztbyxsu3p' from disk\u001b[0m\n", |
47 | | - "\u001b[32m2025-11-03 22:12:09.816\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.parsers.base_parser\u001b[0m:\u001b[36m_log_parsing_stats\u001b[0m:\u001b[36m479\u001b[0m - \u001b[34m\u001b[1mTask Most_Common_color_l6ab0lf3xztbyxsu3p: 3 train pairs, 1 test pairs, max grid size: 5x5\u001b[0m\n", |
48 | | - "\u001b[32m2025-11-03 22:12:09.817\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.task_manager\u001b[0m:\u001b[36mget_global_task_manager\u001b[0m:\u001b[36m236\u001b[0m - \u001b[34m\u001b[1mCreated global task ID manager\u001b[0m\n", |
49 | | - "\u001b[32m2025-11-03 22:12:09.817\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.task_manager\u001b[0m:\u001b[36mregister_task\u001b[0m:\u001b[36m72\u001b[0m - \u001b[34m\u001b[1mRegistered task 'Most_Common_color_l6ab0lf3xztbyxsu3p' with index 0\u001b[0m\n" |
| 42 | + "\u001b[32m2025-11-18 22:47:09.240\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.dataset_manager\u001b[0m:\u001b[36mvalidate_dataset\u001b[0m:\u001b[36m212\u001b[0m - \u001b[34m\u001b[1mDataset validation passed: /Users/aadam/workspace/JaxARC/data/MiniARC\u001b[0m\n", |
| 43 | + "\u001b[32m2025-11-18 22:47:09.240\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.dataset_manager\u001b[0m:\u001b[36mensure_dataset_available\u001b[0m:\u001b[36m81\u001b[0m - \u001b[34m\u001b[1mDataset 'MiniARC' found at /Users/aadam/workspace/JaxARC/data/MiniARC\u001b[0m\n", |
| 44 | + "\u001b[32m2025-11-18 22:47:09.243\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_validate_grid_constraints\u001b[0m:\u001b[36m104\u001b[0m - \u001b[1mMiniARC parser configured with optimal 5x5 grid constraints\u001b[0m\n", |
| 45 | + "\u001b[32m2025-11-18 22:47:09.245\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_scan_available_tasks\u001b[0m:\u001b[36m131\u001b[0m - \u001b[1mFound 149 tasks in MiniARC dataset (lazy loading - tasks loaded on-demand, optimized for 5x5 grids)\u001b[0m\n", |
| 46 | + "\u001b[32m2025-11-18 22:47:09.246\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_load_task_from_disk\u001b[0m:\u001b[36m171\u001b[0m - \u001b[34m\u001b[1mLoaded MiniARC task 'Most_Common_color_l6ab0lf3xztbyxsu3p' from disk\u001b[0m\n", |
| 47 | + "\u001b[32m2025-11-18 22:47:09.240\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.dataset_manager\u001b[0m:\u001b[36mensure_dataset_available\u001b[0m:\u001b[36m81\u001b[0m - \u001b[34m\u001b[1mDataset 'MiniARC' found at /Users/aadam/workspace/JaxARC/data/MiniARC\u001b[0m\n", |
| 48 | + "\u001b[32m2025-11-18 22:47:09.243\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_validate_grid_constraints\u001b[0m:\u001b[36m104\u001b[0m - \u001b[1mMiniARC parser configured with optimal 5x5 grid constraints\u001b[0m\n", |
| 49 | + "\u001b[32m2025-11-18 22:47:09.245\u001b[0m | \u001b[1mINFO \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_scan_available_tasks\u001b[0m:\u001b[36m131\u001b[0m - \u001b[1mFound 149 tasks in MiniARC dataset (lazy loading - tasks loaded on-demand, optimized for 5x5 grids)\u001b[0m\n", |
| 50 | + "\u001b[32m2025-11-18 22:47:09.246\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.parsers.mini_arc\u001b[0m:\u001b[36m_load_task_from_disk\u001b[0m:\u001b[36m171\u001b[0m - \u001b[34m\u001b[1mLoaded MiniARC task 'Most_Common_color_l6ab0lf3xztbyxsu3p' from disk\u001b[0m\n", |
| 51 | + "\u001b[32m2025-11-18 22:47:09.658\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.parsers.base_parser\u001b[0m:\u001b[36m_log_parsing_stats\u001b[0m:\u001b[36m479\u001b[0m - \u001b[34m\u001b[1mTask Most_Common_color_l6ab0lf3xztbyxsu3p: 3 train pairs, 1 test pairs, max grid size: 5x5\u001b[0m\n", |
| 52 | + "\u001b[32m2025-11-18 22:47:09.658\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.task_manager\u001b[0m:\u001b[36mget_global_task_manager\u001b[0m:\u001b[36m236\u001b[0m - \u001b[34m\u001b[1mCreated global task ID manager\u001b[0m\n", |
| 53 | + "\u001b[32m2025-11-18 22:47:09.659\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.task_manager\u001b[0m:\u001b[36mregister_task\u001b[0m:\u001b[36m72\u001b[0m - \u001b[34m\u001b[1mRegistered task 'Most_Common_color_l6ab0lf3xztbyxsu3p' with index 0\u001b[0m\n", |
| 54 | + "\u001b[32m2025-11-18 22:47:09.658\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.parsers.base_parser\u001b[0m:\u001b[36m_log_parsing_stats\u001b[0m:\u001b[36m479\u001b[0m - \u001b[34m\u001b[1mTask Most_Common_color_l6ab0lf3xztbyxsu3p: 3 train pairs, 1 test pairs, max grid size: 5x5\u001b[0m\n", |
| 55 | + "\u001b[32m2025-11-18 22:47:09.658\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.task_manager\u001b[0m:\u001b[36mget_global_task_manager\u001b[0m:\u001b[36m236\u001b[0m - \u001b[34m\u001b[1mCreated global task ID manager\u001b[0m\n", |
| 56 | + "\u001b[32m2025-11-18 22:47:09.659\u001b[0m | \u001b[34m\u001b[1mDEBUG \u001b[0m | \u001b[36mjaxarc.utils.task_manager\u001b[0m:\u001b[36mregister_task\u001b[0m:\u001b[36m72\u001b[0m - \u001b[34m\u001b[1mRegistered task 'Most_Common_color_l6ab0lf3xztbyxsu3p' with index 0\u001b[0m\n" |
50 | 57 | ] |
51 | 58 | }, |
52 | 59 | { |
|
117 | 124 | "Action keys: ['operation', 'row', 'col']\n", |
118 | 125 | "\n", |
119 | 126 | "Initial observation shape: (5, 5, 1)\n", |
| 127 | + "\n", |
| 128 | + "Initial observation shape: (5, 5, 1)\n", |
| 129 | + "Point action executed: {'operation': 2, 'row': 2, 'col': 3}\n", |
| 130 | + "Reward: -0.005\n", |
120 | 131 | "Point action executed: {'operation': 2, 'row': 2, 'col': 3}\n", |
121 | 132 | "Reward: -0.005\n" |
122 | 133 | ] |
123 | 134 | } |
124 | 135 | ], |
125 | 136 | "source": [ |
126 | | - "from jaxarc.envs import PointActionWrapper\n", |
| 137 | + "from jaxarc.wrappers import PointActionWrapper\n", |
127 | 138 | "\n", |
128 | 139 | "# Wrap environment\n", |
129 | 140 | "point_env = PointActionWrapper(env)\n", |
|
176 | 187 | } |
177 | 188 | ], |
178 | 189 | "source": [ |
179 | | - "from jaxarc.envs import BboxActionWrapper\n", |
| 190 | + "from jaxarc.wrappers import BboxActionWrapper\n", |
180 | 191 | "\n", |
181 | 192 | "# Wrap environment\n", |
182 | 193 | "bbox_env = BboxActionWrapper(env)\n", |
|
226 | 237 | } |
227 | 238 | ], |
228 | 239 | "source": [ |
229 | | - "from jaxarc.envs import FlattenActionWrapper\n", |
| 240 | + "from jaxarc.wrappers import FlattenActionWrapper\n", |
230 | 241 | "\n", |
231 | 242 | "# Wrap environment\n", |
232 | 243 | "# Using PointActionWrapper here to reduce the action space size for demonstration\n", |
|
277 | 288 | "+ AnswerObservationWrapper: (5, 5, 3)\n", |
278 | 289 | "+ ClipboardObservationWrapper: (5, 5, 4)\n", |
279 | 290 | "\n", |
| 291 | + "Total channels so far: 4\n", |
| 292 | + "+ AnswerObservationWrapper: (5, 5, 3)\n", |
| 293 | + "+ ClipboardObservationWrapper: (5, 5, 4)\n", |
| 294 | + "\n", |
280 | 295 | "Total channels so far: 4\n" |
281 | 296 | ] |
282 | 297 | } |
283 | 298 | ], |
284 | 299 | "source": [ |
285 | | - "from jaxarc.envs import (\n", |
| 300 | + "from jaxarc.wrappers import (\n", |
286 | 301 | " AnswerObservationWrapper,\n", |
287 | 302 | " ClipboardObservationWrapper,\n", |
288 | 303 | " InputGridObservationWrapper,\n", |
|
346 | 361 | } |
347 | 362 | ], |
348 | 363 | "source": [ |
349 | | - "from jaxarc.envs import ContextualObservationWrapper\n", |
| 364 | + "from jaxarc.wrappers import ContextualObservationWrapper\n", |
350 | 365 | "\n", |
351 | 366 | "# Add 3 demonstration pairs as context\n", |
352 | 367 | "env_with_context = ContextualObservationWrapper(env_with_clipboard, num_context_pairs=3)\n", |
|
429 | 444 | "| `AnswerObservationWrapper` | Add answer grid channel | Training with supervision |\n", |
430 | 445 | "| `ClipboardObservationWrapper` | Add clipboard channel | Copy-paste operations |\n", |
431 | 446 | "| `ContextualObservationWrapper` | Add demonstration pairs | Few-shot learning, pattern recognition |\n", |
| 447 | + "| **Visualization Wrappers** | | |\n", |
| 448 | + "| `StepVisualizationWrapper` | Enable detailed SVG rendering | Debugging agent actions and transitions |\n", |
432 | 449 | "\n", |
433 | | - "Wrappers enhance environment usability without altering core logic. They enable flexible action formats and richer observations, facilitating effective agent training and evaluation." |
| 450 | + "Wrappers enhance environment usability without altering core logic. They enable flexible action formats, richer observations, and better visualization, facilitating effective agent training and evaluation." |
434 | 451 | ] |
435 | 452 | } |
436 | 453 | ], |
|
0 commit comments