cp

daveey · daveey · commit 2ffd88e6f933 · 2025-12-17T22:36:54.000-08:00
diff --git a/packages/mettagrid/cpp/include/mettagrid/objects/chest.hpp b/packages/mettagrid/cpp/include/mettagrid/objects/chest.hpp
@@ -1,6 +1,7 @@
 #ifndef PACKAGES_METTAGRID_CPP_INCLUDE_METTAGRID_OBJECTS_CHEST_HPP_
 #define PACKAGES_METTAGRID_CPP_INCLUDE_METTAGRID_OBJECTS_CHEST_HPP_
 
+#include <algorithm>
 #include <set>
 #include <unordered_map>
 #include <vector>
@@ -121,7 +122,8 @@ class Chest : public GridObject, public Usable, public HasInventory {
       throw std::runtime_error("Observation encoder not set for chest");
     }
     std::vector<PartialObservationToken> features;
-    features.reserve(1 + this->inventory.get().size() + this->tag_ids.size() + (this->vibe != 0 ? 1 : 0));
+    // Capacity hint: 2 tokens per inventory item (base value + optional p1); a p2 token, if emitted, just grows the vector.
+    features.reserve(1 + this->inventory.get().size() * 2 + this->tag_ids.size() + (this->vibe != 0 ? 1 : 0));
 
     if (this->vibe != 0) features.push_back({ObservationFeature::Vibe, static_cast<ObservationType>(this->vibe)});
 
diff --git a/packages/mettagrid/cpp/include/mettagrid/objects/inventory.hpp b/packages/mettagrid/cpp/include/mettagrid/objects/inventory.hpp
@@ -1,6 +1,7 @@
 #ifndef PACKAGES_METTAGRID_CPP_INCLUDE_METTAGRID_OBJECTS_INVENTORY_HPP_
 #define PACKAGES_METTAGRID_CPP_INCLUDE_METTAGRID_OBJECTS_INVENTORY_HPP_
 
+#include <limits>
 #include <string>
 #include <unordered_map>
 #include <vector>
diff --git a/packages/mettagrid/cpp/src/mettagrid/objects/agent.cpp b/packages/mettagrid/cpp/src/mettagrid/objects/agent.cpp
@@ -209,7 +209,7 @@ std::vector<PartialObservationToken> Agent::obs_features() const {
   if (!this->obs_encoder) {
     throw std::runtime_error("Observation encoder not set for agent");
   }
-  const size_t num_tokens = this->inventory.get().size() + this->tag_ids.size() + 5;
+const size_t num_tokens = this->inventory.get().size() * 2 + this->tag_ids.size() + 5;
 
   std::vector<PartialObservationToken> features;
   features.reserve(num_tokens);
diff --git a/packages/mettagrid/docs/observations.md b/packages/mettagrid/docs/observations.md
@@ -103,30 +103,30 @@ The feature set follows this general structure (exact IDs depend on configuratio
 depend on your game configuration (number of resources, whether protocol details are enabled, etc.), so always use
 `IdMap` to get the exact feature IDs for your configuration.
 
-| Feature Name                      | Description                                                                     | Objects with this Feature | Notes                                                                           |
-| --------------------------------- | ------------------------------------------------------------------------------- | ------------------------- | ------------------------------------------------------------------------------- |
-| `agent:group`                     | Agent's group/team identifier                                                   | agents                    |                                                                                 |
-| `agent:frozen`                    | Whether agent is frozen or not. Frozen agents cannot act                        | agents                    |                                                                                 |
-| `episode_completion_pct`          | Portion of the episode completed, from 0 (start) to 255 (end). Not a percentage | self                      |                                                                                 |
-| `last_action`                     | Last action taken by the agent                                                  | self                      |                                                                                 |
-| `last_reward`                     | Last reward received by the agent                                               | self                      |                                                                                 |
-| `vibe`                            | Agent's current vibe                                                            | any object                | Values can be found in `vibes.VIBES`                                            |
-| `agent:compass`                   | Compass direction toward assembler                                              | self                      |                                                                                 |
-| `tag`                             | Tags associated with an object (e.g., "wall", "oxygen_extractor", "blue")       | any object                | Values can be found in `IdMap.tag_names()`. Multiple tags emit multiple tokens. |
-| `cooldown_remaining`              | Remaining cooldown time for objects                                             | assembler, extractors     | Value capped at 255                                                             |
-| `clipped`                         | Whether an assembler is clipped or not                                          | extractors                |                                                                                 |
-| `remaining_uses`                  | Remaining uses for objects with use limits                                      | extractors                | Value capped at 255. Only emitted if `max_uses > 0`                             |
-| `inv:{resource_name}`             | Base inventory amount (amount % token_value_max)                                | agents, chests            | One feature per resource. See [Inventory Encoding](#inventory-encoding) below.  |
-| `inv:{resource_name}:p1`          | Power 1 component ((amount / B) % B)                                            | agents, chests            | Only emitted if amount >= B. See [Inventory Encoding](#inventory-encoding).     |
-| `inv:{resource_name}:p2`          | Power 2 component ((amount / B²) % B)                                           | agents, chests            | Only emitted if amount >= B². See [Inventory Encoding](#inventory-encoding).    |
-| `protocol_input:{resource_name}`  | Required input resource amount for current protocol                             | assembler, extractors     | One feature per resource                                                        |
-| `protocol_output:{resource_name}` | Output resource amount for current protocol                                     | assembler, extractors     | One feature per resource                                                        |
+| Feature Name             | Description                                                                     | Objects with this Feature | Notes                                                                           |
+| ------------------------ | ------------------------------------------------------------------------------- | ------------------------- | ------------------------------------------------------------------------------- |
+| `agent:group`            | Agent's group/team identifier                                                   | agents                    |                                                                                 |
+| `agent:frozen`           | Whether agent is frozen or not. Frozen agents cannot act                        | agents                    |                                                                                 |
+| `episode_completion_pct` | Portion of the episode completed, from 0 (start) to 255 (end). Not a percentage | self                      |                                                                                 |
+| `last_action`            | Last action taken by the agent                                                  | self                      |                                                                                 |
+| `last_reward`            | Last reward received by the agent                                               | self                      |                                                                                 |
+| `vibe`                   | Object's current vibe                                                           | any object                | Values can be found in `vibes.VIBES`                                            |
+| `agent:compass`          | Compass direction toward assembler                                              | self                      |                                                                                 |
+| `tag`                    | Tags associated with an object (e.g., "wall", "oxygen_extractor", "blue")       | any object                | Values can be found in `IdMap.tag_names()`. Multiple tags emit multiple tokens. |
+| `cooldown_remaining`     | Remaining cooldown time for objects                                             | assembler, extractors     | Value capped at 255                                                             |
+| `clipped`                | Whether an assembler is clipped or not                                          | extractors                |                                                                                 |
+| `remaining_uses`         | Remaining uses for objects with use limits                                      | extractors                | Value capped at 255. Only emitted if `max_uses > 0`                             |
+| `inv:{resource_name}` | Base inventory amount (amount % token_value_max) | agents, chests | One feature per resource. See [Inventory Encoding](#inventory-encoding) below. |
+| `inv:{resource_name}:p1` | Power 1 component ((amount / B) % B) | agents, chests | Only emitted if amount >= B. See [Inventory Encoding](#inventory-encoding). |
+| `inv:{resource_name}:p2` | Power 2 component ((amount / B²) % B) | agents, chests | Only emitted if amount >= B². See [Inventory Encoding](#inventory-encoding). |
+| `protocol_input:{resource_name}` | Required input resource amount for current protocol | assembler, extractors | One feature per resource |
+| `protocol_output:{resource_name}` | Output resource amount for current protocol | assembler, extractors | One feature per resource |
 
 ### Inventory Encoding
 
-Inventory values are encoded using a multi-token scheme with a configurable base (`ObsConfig.token_value_max`, default
-255). This allows representing large amounts while keeping individual token values bounded. The number of tokens is
-dynamically computed based on the maximum inventory value (uint16_t max = 65535).
+Inventory values are encoded using a multi-token scheme with a configurable base
+(`ObsConfig.token_value_max`, default 255). This allows representing large amounts while keeping individual token values
+bounded. The number of tokens is dynamically computed based on the maximum inventory value (uint16_t max = 65535).
 
 - **`inv:{resource}`**: Base value = `amount % B` (always emitted if amount > 0)
 - **`inv:{resource}:p1`**: Power 1 = `(amount / B) % B` (only emitted if amount >= B)
diff --git a/packages/mettagrid/docs/simulator_api.md b/packages/mettagrid/docs/simulator_api.md
@@ -265,9 +265,11 @@ obs = agent.observation
 for token in obs.tokens:
     if token.feature.name == "object_type":
         print(f"Object at ({token.col()}, {token.row()}): {token.value}")
-    elif token.feature.name.startswith("inv:"):
-        resource = token.feature.name[4:]  # Remove "inv:" prefix
-        print(f"Inventory {resource}: {token.value}")
+
+# For inventory, use the agent.inventory property which handles the encoding
+inventory = agent.inventory
+for resource, amount in inventory.items():
+    print(f"Inventory {resource}: {amount}")
 ```
 
 ## Event Handling
diff --git a/packages/mettagrid/python/src/mettagrid/config/mettagrid_c_config.py b/packages/mettagrid/python/src/mettagrid/config/mettagrid_c_config.py
@@ -348,9 +348,7 @@ def convert_to_cpp_game_config(mettagrid_config: dict | GameConfig):
                         if name in resource_name_to_id
                     }
                     limit_defs.append(
-                        CppLimitDef(
-                            resources=resource_ids, base_limit=min(resource_limit.limit, 255), modifiers=modifier_ids
-                        )
+                        CppLimitDef(resources=resource_ids, base_limit=resource_limit.limit, modifiers=modifier_ids)
                     )
 
             inventory_config = CppInventoryConfig()

Original file line number	Diff line number	Diff line change
`@@ -209,7 +209,7 @@ std::vector<PartialObservationToken> Agent::obs_features() const {`
`209`	`209`	`if (!this->obs_encoder) {`
`210`	`210`	`throw std::runtime_error("Observation encoder not set for agent");`
`211`	`211`	`}`
`212`		`- const size_t num_tokens = this->inventory.get().size() + this->tag_ids.size() + 5;`
	`212`	`+const size_t num_tokens = this->inventory.get().size() * 2 + this->tag_ids.size() + 5;`
`213`	`213`
`214`	`214`	`std::vector<PartialObservationToken> features;`
`215`	`215`	`features.reserve(num_tokens);`
Original file line number	Diff line number	Diff line change
`@@ -348,9 +348,7 @@ def convert_to_cpp_game_config(mettagrid_config: dict \| GameConfig):`
`348`	`348`	`if name in resource_name_to_id`
`349`	`349`	`}`
`350`	`350`	`limit_defs.append(`
`351`		`- CppLimitDef(`
`352`		`- resources=resource_ids, base_limit=min(resource_limit.limit, 255), modifiers=modifier_ids`
`353`		`- )`
	`351`	`+ CppLimitDef(resources=resource_ids, base_limit=resource_limit.limit, modifiers=modifier_ids)`
`354`	`352`	`)`
`355`	`353`
`356`	`354`	`inventory_config = CppInventoryConfig()`