moves-rwth
diff --git a/‎docs/getting_started/grid.ipynb
Lines changed: 113 additions & 30 deletions b/‎docs/getting_started/grid.ipynb
Lines changed: 113 additions & 30 deletions
diff --git a/‎docs/getting_started/pinkgreen.json
Lines changed: 147 additions & 0 deletions b/‎docs/getting_started/pinkgreen.json
Lines changed: 147 additions & 0 deletions
@@ -18,6 +18,7 @@
    "outputs": [],
    "source": [
     "import stormvogel.model\n",
+    "from stormvogel.model import EmptyAction\n",
     "from stormvogel.layout import Layout\n",
     "from stormvogel.show import show"
    ]
@@ -102,19 +103,19 @@
     "    \n",
     "    escaped = pomdp.new_state(\"escaped\")\n",
     "    escaped.set_observation(END)\n",
-    "    reward_model.set(escaped, 0)\n",
+    "    #reward_model.set(escaped, 0)\n",
     "    \n",
     "    grid = [[None for x in range(width)] for y in range(height)]\n",
     "    for x in range(width):\n",
     "        for y in range(height):\n",
     "            if level_list[y][x] == WALKABLE:\n",
     "                grid[y][x] = pomdp.new_state([\"t\", f\"({x},{y})\"])\n",
     "                grid[y][x].set_observation(UNKNOWN)\n",
-    "                reward_model.set(grid[y][x], -1)\n",
+    "                #reward_model.set_state_action_reward(grid[y][x], -1)\n",
     "            if level_list[y][x] == EXIT:\n",
     "                grid[y][x] = pomdp.new_state([\"e\", f\"({x},{y})\"])\n",
     "                grid[y][x].set_observation(UNKNOWN)\n",
-    "                reward_model.set(grid[y][x], 100)\n",
+    "                #reward_model.set_state_action_reward(grid[y][x], 100)\n",
     "                grid[y][x].add_transitions([(1, escaped)])\n",
     "    dirs = {d: pomdp.new_action(d) for d in [UP, DOWN, LEFT, RIGHT]}\n",
     "    positions = {}\n",
@@ -125,14 +126,19 @@
     "                for d,action in dirs.items():\n",
     "                    positions[str(grid[y][x].id)] = {\"x\": x * position_scalar, \"y\": y * position_scalar}\n",
     "                    ((res_x, res_y), observation) = direction_result(x,y,d,level_list,width,height)\n",
+    "\n",
+    "                    \n",
+    "                    \n",
     "                    if not observation == OUT_OF_BOUNDS:\n",
     "                        took_dir = pomdp.new_state([d, f\"({x},{y})\"])\n",
-    "                        reward_model.set(took_dir, 0)\n",
     "                        grid[y][x].add_transitions([(action, took_dir)])\n",
+    "                        reward_model.set_state_action_reward(grid[y][x], action, 0)\n",
     "                        # print(took_dir)\n",
     "                        took_dir.add_transitions([(1, grid[res_y][res_x])])\n",
+    "                        reward_model.set_state_action_reward(took_dir, EmptyAction, -1)\n",
     "                        took_dir.set_observation(observation)\n",
     "    pomdp.add_self_loops()\n",
+    "    reward_model.set_unset_rewards(0)\n",
     "    return pomdp, positions"
    ]
   },
@@ -187,16 +193,82 @@
    "metadata": {},
    "outputs": [
     {
-     "ename": "TypeError",
-     "evalue": "new_pomdp() got an unexpected keyword argument 'create_initial_state'",
-     "output_type": "error",
-     "traceback": [
-      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
-      "\u001b[0;31mTypeError\u001b[0m                                 Traceback (most recent call last)",
-      "Cell \u001b[0;32mIn[4], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m pomdp, positions \u001b[38;5;241m=\u001b[39m \u001b[43mgrid_world\u001b[49m\u001b[43m(\u001b[49m\u001b[43mLEVEL\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m      3\u001b[0m vis \u001b[38;5;241m=\u001b[39m show(pomdp, layout\u001b[38;5;241m=\u001b[39mLayout(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlayouts/grid.json\u001b[39m\u001b[38;5;124m\"\u001b[39m), separate_labels\u001b[38;5;241m=\u001b[39m[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mt\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124me\u001b[39m\u001b[38;5;124m\"\u001b[39m])\n",
-      "Cell \u001b[0;32mIn[2], line 69\u001b[0m, in \u001b[0;36mgrid_world\u001b[0;34m(level, position_scalar)\u001b[0m\n\u001b[1;32m     67\u001b[0m \u001b[38;5;250m\u001b[39m\u001b[38;5;124;03m\"\"\"Create a grid world with an actor.\"\"\"\u001b[39;00m\n\u001b[1;32m     68\u001b[0m level_list, width, height \u001b[38;5;241m=\u001b[39m parse_level(level)\n\u001b[0;32m---> 69\u001b[0m pomdp \u001b[38;5;241m=\u001b[39m \u001b[43mstormvogel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mnew_pomdp\u001b[49m\u001b[43m(\u001b[49m\u001b[43mcreate_initial_state\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mFalse\u001b[39;49;00m\u001b[43m)\u001b[49m\n\u001b[1;32m     70\u001b[0m reward_model \u001b[38;5;241m=\u001b[39m pomdp\u001b[38;5;241m.\u001b[39madd_rewards(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m     72\u001b[0m escaped \u001b[38;5;241m=\u001b[39m pomdp\u001b[38;5;241m.\u001b[39mnew_state(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mescaped\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n",
-      "\u001b[0;31mTypeError\u001b[0m: new_pomdp() got an unexpected keyword argument 'create_initial_state'"
-     ]
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "676e37cbe8a846d19550bccc6d5c4dd5",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Output()"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/html": [
+       "<script>fetch('http://127.0.0.1:8889/vDdOnHCrvh/MESSAGE/' + 'test message')</script>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.HTML object>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/html": [
+       "<script>fetch('http://127.0.0.1:8889/vDdOnHCrvh/MESSAGE/' + 'test message')</script>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.HTML object>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "text/html": [
+       "<script>fetch('http://127.0.0.1:8889/vDdOnHCrvh/MESSAGE/' + 'test message')</script>"
+      ],
+      "text/plain": [
+       "<IPython.core.display.HTML object>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "b3f4a3d048254e1cb8573a25408495ac",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "Output()"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "848d2f62271c4a4488bcebe203d3a59e",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "HBox(children=(Output(), Output()))"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
     }
    ],
    "source": [
@@ -223,37 +295,48 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 35,
+   "execution_count": 6,
    "id": "8d5b0e8e-47db-4dfb-a533-a8181ec04751",
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "ERROR (Model.cpp:71): Invalid size (22) of state action reward vector (expected:34).\n"
-     ]
-    },
-    {
-     "ename": "RuntimeError",
-     "evalue": "IllegalArgumentException: Invalid size (22) of state action reward vector (expected:34).",
-     "output_type": "error",
-     "traceback": [
-      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
-      "\u001b[0;31mRuntimeError\u001b[0m                              Traceback (most recent call last)",
-      "Cell \u001b[0;32mIn[35], line 4\u001b[0m\n\u001b[1;32m      1\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mstormvogel\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mmapping\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m stormvogel_to_stormpy\n\u001b[0;32m----> 4\u001b[0m stormpy_model \u001b[38;5;241m=\u001b[39m \u001b[43mstormvogel_to_stormpy\u001b[49m\u001b[43m(\u001b[49m\u001b[43mpomdp\u001b[49m\u001b[43m)\u001b[49m\n",
-      "File \u001b[0;32m~/git/env/lib/python3.12/site-packages/stormvogel/mapping.py:300\u001b[0m, in \u001b[0;36mstormvogel_to_stormpy\u001b[0;34m(model)\u001b[0m\n\u001b[1;32m    298\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m map_ctmc(model)\n\u001b[1;32m    299\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m model\u001b[38;5;241m.\u001b[39mget_type() \u001b[38;5;241m==\u001b[39m stormvogel\u001b[38;5;241m.\u001b[39mmodel\u001b[38;5;241m.\u001b[39mModelType\u001b[38;5;241m.\u001b[39mPOMDP:\n\u001b[0;32m--> 300\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mmap_pomdp\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    301\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m model\u001b[38;5;241m.\u001b[39mget_type() \u001b[38;5;241m==\u001b[39m stormvogel\u001b[38;5;241m.\u001b[39mmodel\u001b[38;5;241m.\u001b[39mModelType\u001b[38;5;241m.\u001b[39mMA:\n\u001b[1;32m    302\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m map_ma(model)\n",
-      "File \u001b[0;32m~/git/env/lib/python3.12/site-packages/stormvogel/mapping.py:225\u001b[0m, in \u001b[0;36mstormvogel_to_stormpy.<locals>.map_pomdp\u001b[0;34m(model)\u001b[0m\n\u001b[1;32m    223\u001b[0m components\u001b[38;5;241m.\u001b[39mobservability_classes \u001b[38;5;241m=\u001b[39m observations\n\u001b[1;32m    224\u001b[0m components\u001b[38;5;241m.\u001b[39mchoice_labeling \u001b[38;5;241m=\u001b[39m choice_labeling\n\u001b[0;32m--> 225\u001b[0m pomdp \u001b[38;5;241m=\u001b[39m \u001b[43mstormpy\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mstorage\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mSparsePomdp\u001b[49m\u001b[43m(\u001b[49m\u001b[43mcomponents\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    227\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m pomdp\n",
-      "\u001b[0;31mRuntimeError\u001b[0m: IllegalArgumentException: Invalid size (22) of state action reward vector (expected:34)."
+      "-------------------------------------------------------------- \n",
+      "Model type: \tPOMDP (sparse)\n",
+      "States: \t22\n",
+      "Transitions: \t34\n",
+      "Choices: \t34\n",
+      "Observations: \t5\n",
+      "Reward Models:  (default)\n",
+      "State Labels: \t12 labels\n",
+      "   * (1,2) -> 1 item(s)\n",
+      "   * escaped -> 1 item(s)\n",
+      "   * ← -> 4 item(s)\n",
+      "   * (1,1) -> 5 item(s)\n",
+      "   * (2,1) -> 5 item(s)\n",
+      "   * t -> 4 item(s)\n",
+      "   * ↑ -> 4 item(s)\n",
+      "   * (3,2) -> 5 item(s)\n",
+      "   * → -> 4 item(s)\n",
+      "   * e -> 1 item(s)\n",
+      "   * ↓ -> 4 item(s)\n",
+      "   * (3,1) -> 5 item(s)\n",
+      "Choice Labels: \t0 labels\n",
+      "-------------------------------------------------------------- \n",
+      "\n"
      ]
     }
    ],
    "source": [
     "from stormvogel.mapping import stormvogel_to_stormpy\n",
     "\n",
     "stormpy_model = stormvogel_to_stormpy(pomdp)\n",
+    "print(stormpy_model)\n",
     "\n",
-    "# TODO use stormpy to find the best policy/schedule, i.e. escape the maze as quickly as possible."
+    "# TODO use stormpy to find the best policy/schedule, i.e. escape the maze as quickly as possible.\n",
+    "# Ask Pim or Linus for help?"
    ]
   },
   {
 
@@ -0,0 +1,147 @@
+{
+  "__fake_macros": {
+    "__group_macro": {
+      "borderWidth": 1,
+      "color": {
+        "background": "white",
+        "border": "black",
+        "highlight": {
+          "background": "white",
+          "border": "red"
+        }
+      },
+      "shape": "ellipse",
+      "mass": 1,
+      "font": {
+        "color": "black",
+        "size": 14
+      }
+    }
+  },
+  "groups": {
+    "states": {
+      "borderWidth": 1,
+      "color": {
+        "background": "#8ff0a4",
+        "border": "black",
+        "highlight": {
+          "background": "white",
+          "border": "red"
+        }
+      },
+      "shape": "ellipse",
+      "mass": 1,
+      "font": {
+        "color": "black",
+        "size": 14
+      }
+    },
+    "actions": {
+      "borderWidth": 1,
+      "color": {
+        "background": "#ffc0cb",
+        "border": "black",
+        "highlight": {
+          "background": "white",
+          "border": "red"
+        }
+      },
+      "shape": "box",
+      "mass": 1,
+      "font": {
+        "color": "black",
+        "size": 14
+      }
+    },
+    "scheduled_actions": {
+      "borderWidth": 1,
+      "color": {
+        "background": "pink",
+        "border": "black",
+        "highlight": {
+          "background": "white",
+          "border": "red"
+        }
+      },
+      "shape": "box",
+      "mass": 1,
+      "font": {
+        "color": "black",
+        "size": 14
+      },
+      "schedColor": false
+    }
+  },
+  "reload_button": false,
+  "edges": {
+    "arrows": "to",
+    "font": {
+      "color": "black",
+      "size": 14
+    },
+    "color": {
+      "color": "black"
+    }
+  },
+  "numbers": {
+    "fractions": true,
+    "digits": 5
+  },
+  "state_properties": {
+    "show_results": true,
+    "result_symbol": "\u2606",
+    "show_rewards": false,
+    "reward_symbol": "\u20ac",
+    "show_observations": true,
+    "observation_symbol": "\u0298"
+  },
+  "layout": {
+    "randomSeed": 5
+  },
+  "misc": {
+    "enable_physics": true,
+    "width": 800,
+    "height": 600,
+    "explore": false
+  },
+  "saving": {
+    "relative_path": true,
+    "filename": "pinkgreen.json",
+    "save_button": false,
+    "load_button": false
+  },
+  "positions": {
+    "0": {
+      "x": 12,
+      "y": -136
+    },
+    "1": {
+      "x": 96,
+      "y": -33
+    },
+    "2": {
+      "x": -90,
+      "y": -53
+    },
+    "3": {
+      "x": 13,
+      "y": 72
+    },
+    "4": {
+      "x": -19,
+      "y": 26
+    },
+    "5": {
+      "x": -47,
+      "y": 161
+    }
+  },
+  "width": 800,
+  "height": 600,
+  "physics": true,
+  "results_and_rewards": {
+    "show_results": true,
+    "resultSymbol": "\u2606",
+    "show_rewards": true
+  }
+}