ReCo.jl/src/RL/EnvHelper.jl

# Abstract supertype for environment helpers.
# `get_env_agent_hook` in this file reads `shared.env`, `shared.agent` and `shared.hook`
# from any `EnvHelper`, so concrete subtypes are expected to expose a `shared` property
# (presumably an `EnvHelperSharedProps` — confirm against the concrete subtypes).
abstract type EnvHelper end

"""
    EnvHelperSharedProps(
        env, agent, hook,
        n_steps_before_actions_update, n_actions_updates_per_episode,
        elliptical_a_b_ratio, n_particles,
    )

Bundle the environment, agent and hook together with the step/update counters and the
per-particle buffers stored alongside them.

`reward_normalization` is not passed in; it is derived as
`n_particles * n_actions_updates_per_episode`. All four per-particle buffers are created
with length `n_particles` and zero-initialised. The struct itself is immutable, but the
buffers are ordinary `Vector`s and can be written to in place.
"""
struct EnvHelperSharedProps{H<:AbstractHook}
    # Core RL objects.
    env::Env
    agent::Agent
    hook::H

    # Counters supplied by the caller, plus the normalization factor derived from them.
    n_steps_before_actions_update::Int64
    n_actions_updates_per_episode::Int64
    reward_normalization::Float64

    elliptical_a_b_ratio::Float64

    n_particles::Int64

    # Per-particle buffers (one entry per particle).
    old_states_id::Vector{Int64}
    states_id::Vector{Int64}

    actions::Vector{SVector{2,Float64}}
    actions_id::Vector{Int64}

    function EnvHelperSharedProps(
        env::Env,
        agent::Agent,
        hook::H,
        n_steps_before_actions_update::Int64,
        n_actions_updates_per_episode::Int64,
        elliptical_a_b_ratio::Float64,
        n_particles::Int64,
    ) where {H<:AbstractHook}
        # Integer product, stored as Float64 to match the field type.
        normalization = Float64(n_particles * n_actions_updates_per_episode)

        # Every buffer starts zeroed with one slot per particle.
        previous_ids = zeros(Int64, n_particles)
        current_ids = zeros(Int64, n_particles)
        action_vectors = fill(zero(SVector{2,Float64}), n_particles)
        action_ids = zeros(Int64, n_particles)

        return new{H}(
            env,
            agent,
            hook,
            n_steps_before_actions_update,
            n_actions_updates_per_episode,
            normalization,
            elliptical_a_b_ratio,
            n_particles,
            previous_ids,
            current_ids,
            action_vectors,
            action_ids,
        )
    end
end

"""
    gen_env_helper(::Env, env_helper_params::EnvHelperSharedProps; args...)

Fallback method for environments that have no specialised `gen_env_helper`.

It ignores its arguments and delegates to `ReCo.method_not_implemented()`.

# Keywords
- `args...`: any keyword arguments are accepted and ignored, so that the fallback body is
  reached no matter which keywords the caller passes.
"""
function gen_env_helper(::Env, env_helper_params::EnvHelperSharedProps; args...)
    # The former signature `; args` declared a single *required* keyword named `args`.
    # Calls without it raised `UndefKeywordError`, and calls with any other keyword
    # raised a `MethodError`, so this body was never reached. Slurping the keywords
    # keeps `args = x` working while letting every other call get here.
    return ReCo.method_not_implemented()
end

"""
    get_env_agent_hook(env_helper::EnvHelper)

Return the tuple `(env, agent, hook)` read from `env_helper.shared`.
"""
function get_env_agent_hook(env_helper::EnvHelper)
    shared_props = env_helper.shared
    env = shared_props.env
    agent = shared_props.agent
    hook = shared_props.hook

    return (env, agent, hook)
end
RL code organization 2022-01-11 18:00:41 +00:00			`abstract type EnvHelper end`

			`struct EnvHelperSharedProps{H<:AbstractHook}`
			`env::Env`
			`agent::Agent`
			`hook::H`

			`n_steps_before_actions_update::Int64`
Added reward normalization 2022-01-30 02:20:45 +00:00			`n_actions_updates_per_episode::Int64`
Fixed normalization 2022-01-30 02:32:47 +00:00			`reward_normalization::Float64`
RL code organization 2022-01-11 18:00:41 +00:00
Replaced goal ratio with a_b_ratio and added abs to eigvals ratio 2022-01-25 23:20:53 +00:00			`elliptical_a_b_ratio::Float64`
RL code organization 2022-01-11 18:00:41 +00:00
			`n_particles::Int64`

Added state_id_tensor 2022-01-15 20:27:15 +00:00			`old_states_id::Vector{Int64}`
			`states_id::Vector{Int64}`
RL code organization 2022-01-11 18:00:41 +00:00
			`actions::Vector{SVector{2,Float64}}`
Added state_id_tensor 2022-01-15 20:27:15 +00:00			`actions_id::Vector{Int64}`
RL code organization 2022-01-11 18:00:41 +00:00
			`function EnvHelperSharedProps(`
			`env::Env,`
			`agent::Agent,`
Fixed constructor 2022-01-18 01:25:28 +00:00			`hook::H,`
RL code organization 2022-01-11 18:00:41 +00:00			`n_steps_before_actions_update::Int64,`
Added reward normalization 2022-01-30 02:20:45 +00:00			`n_actions_updates_per_episode::Int64,`
Replaced goal ratio with a_b_ratio and added abs to eigvals ratio 2022-01-25 23:20:53 +00:00			`elliptical_a_b_ratio::Float64,`
RL code organization 2022-01-11 18:00:41 +00:00			`n_particles::Int64,`
Fixed constructor 2022-01-18 01:25:28 +00:00			`) where {H<:AbstractHook}`
Fixed normalization 2022-01-30 02:32:47 +00:00			`reward_normalization = n_particles * n_actions_updates_per_episode`

Fixed constructor 2022-01-18 01:25:28 +00:00			`return new{H}(`
RL code organization 2022-01-11 18:00:41 +00:00			`env,`
			`agent,`
			`hook,`
			`n_steps_before_actions_update,`
Added reward normalization 2022-01-30 02:20:45 +00:00			`n_actions_updates_per_episode,`
Fixed normalization 2022-01-30 02:32:47 +00:00			`reward_normalization,`
Replaced goal ratio with a_b_ratio and added abs to eigvals ratio 2022-01-25 23:20:53 +00:00			`elliptical_a_b_ratio,`
RL code organization 2022-01-11 18:00:41 +00:00			`n_particles,`
			`fill(0, n_particles),`
			`fill(0, n_particles),`
			`fill(SVector(0.0, 0.0), n_particles),`
			`fill(0, n_particles),`
			`)`
			`end`
			`end`

Added shape reward term 2022-01-14 11:28:47 +00:00			`function gen_env_helper(::Env, env_helper_params::EnvHelperSharedProps; args)`
Fixed elliptical_distance 2022-01-14 12:01:14 +00:00			`return ReCo.method_not_implemented()`
RL code organization 2022-01-11 18:00:41 +00:00			`end`

			`function get_env_agent_hook(env_helper::EnvHelper)`
			`return (env_helper.shared.env, env_helper.shared.agent, env_helper.shared.hook)`
			`end`