package fehu

You can search for identifiers within the package.

in-package search v0.2.0

On This Page

Example
Tips

package fehu

fehu
- CHANGES
- README
- Library fehu
  - Fehu
    
    Errors
    
    Info
    
    Metadata
    
    Render
    
    Pixel
    
    Space
    
    Value
    
    Discrete
    
    Box
    
    Multi_binary
    
    Multi_discrete
    
    Tuple
    
    Dict
    
    Sequence
    
    Text
    
    Env
    
    Wrapper
    
    Vector_env
    
    Buffer
    
    Replay
    
    Rollout
    
    Training
    
    Policy
    
    Trajectory
- Library fehu.algorithms
  - Fehu_algorithms
    
    Reinforce
    
    Dqn
- Library fehu.envs
  - Fehu_envs
    
    Random_walk
    
    Grid_world
    
    Cartpole
    
    Mountain_car
- Library fehu.visualize
  - Fehu_visualize
    
    Overlay
    
    Video
    
    Sink
- Sources
  - fehu
    
    buffer.ml
    
    env.ml
    
    errors.ml
    
    fehu.ml
    
    fehu__.ml
    
    info.ml
    
    metadata.ml
    
    policy.ml
    
    render.ml
    
    space.ml
    
    training.ml
    
    trajectory.ml
    
    vector_env.ml
    
    wrapper.ml
  - fehu.algorithms
    
    dqn.ml
    
    fehu_algorithms.ml
    
    fehu_algorithms__.ml
    
    reinforce.ml
  - fehu.envs
    
    cartpole.ml
    
    fehu_envs.ml
    
    fehu_envs__.ml
    
    grid_world.ml
    
    mountain_car.ml
    
    random_walk.ml
  - fehu.visualize
    
    fehu_visualize.ml
    
    fehu_visualize__.ml
    
    overlay.ml
    
    sink.ml
    
    utils.ml
    
    wrapper_video.ml

Legend:
Page
Library
Module
Module type
Parameter
Class
Class type
Source

Module `Fehu_envs.Grid_world`Source

Two-dimensional grid world with goal and obstacles.

ID: GridWorld-v0

Observation Space: Fehu.Space.Multi_discrete with shape [5; 5]. Represents the agent's (row, column) position as two discrete coordinates, each in range [0, 5).

Action Space: Fehu.Space.Discrete with 4 choices:

0: Move up (row -= 1)
1: Move down (row += 1)
2: Move left (col -= 1)
3: Move right (col += 1)

Rewards:

+10.0: Reaching the goal at position (4, 4)
-1.0: Every other step (encourages shortest path)

Episode Termination:

Terminated: Agent reaches the goal position (4, 4)
Truncated: Episode exceeds 200 steps

Obstacles: Position (2, 2) is blocked. Actions attempting to move into obstacles or outside the grid leave the agent's position unchanged.

Rendering: ASCII grid visualization:

'A': Agent position
'G': Goal position (4, 4)
'#': Obstacle at (2, 2)
'.': Empty cells

Example

Navigate to the goal while avoiding obstacles:

  let rng = Rune.Rng.create () in
  let env = Fehu_envs.Grid_world.make ~rng () in
  let obs, _ = Fehu.Env.reset env () in
  let rec run_episode steps =
    if steps >= 200 then ()
    else begin
      let action = (* policy maps (row, col) to action 0-3 *) in
      let t = Fehu.Env.step env action in
      match Fehu.Env.render env with
      | Some grid -> print_endline grid
      | None -> ();
      if t.terminated then
        Printf.printf "Goal reached in %d steps!\n" steps
      else
        run_episode (steps + 1)
    end
  in
  run_episode 0

Tips

Optimal policy requires approximately 8 steps (Manhattan distance from (0,0) to (4,4))
Obstacle at (2, 2) forces agents to plan around it
Good for testing Q-learning, DQN, or policy gradient methods on discrete spaces

Sourcetype observation = (int32, Rune.int32_elt) Rune.t

Sourcetype action = (int32, Rune.int32_elt) Rune.t

Sourcetype render = Fehu.Render.t

Sourcetype state = {

mutable position : int * int;
mutable steps : int;

}

Sourceval grid_size : int

Sourceval observation_space : Fehu.Space.Multi_discrete.element Fehu__Space.t

Sourceval action_space : Fehu.Space.Discrete.element Fehu__Space.t

Sourceval metadata : Fehu.Metadata.t

Sourceval is_goal : (int * int) -> bool

Sourceval is_obstacle : (int * int) -> bool

Sourceval is_valid_pos : (int * int) -> bool

Source

val reset : 
  'a ->
  ?options:'b ->
  unit ->
  state ->
  (int32, Rune.int32_elt) Rune.t * Fehu.Info.t

Source

val step : 
  'a ->
  (Int32.t, 'b) Rune.t ->
  state ->
  ((int32, Rune.int32_elt) Rune.t, 'c, 'd) Fehu.Env.transition

Sourceval render_text : state -> string

Sourceval cell_size : int

Sourceval frame_width : int

Sourceval frame_height : int

Sourceval clamp_color : int -> int

Source

val fill_rect : 
  (char, 'a, 'b) Bigarray.Array1.t ->
  width:int ->
  x0:int ->
  y0:int ->
  w:int ->
  h:int ->
  (int * int * int) ->
  unit

Sourceval render_image : state -> Fehu.Render.image

Sourceval render : ('a, 'b, 'c) Fehu.Env.t -> state -> Fehu.Render.frame option

Source

val make : 
  rng:Rune.Rng.key ->
  ?render_mode:Fehu.Env.render_mode ->
  unit ->
  (Fehu.Space.Multi_discrete.element,
    Fehu.Space.Discrete.element,
    Fehu.Render.frame)
    Fehu.Env.t

package fehu

Module Fehu_envs.Grid_worldSource

Example

Tips

Module `Fehu_envs.Grid_world`Source