Skip to content

Commit

Permalink
Merge pull request #65 from lkruse/master
Browse files Browse the repository at this point in the history
upgraded to POMDPTools
  • Loading branch information
zsunberg authored Jul 25, 2022
2 parents a348215 + 3464c39 commit 5e8608e
Show file tree
Hide file tree
Showing 8 changed files with 12 additions and 15 deletions.
8 changes: 3 additions & 5 deletions Project.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "DeepQLearning"
uuid = "de0a67f4-c691-11e8-0034-5fc6e16e22d3"
repo = "https://github.com/JuliaPOMDP/DeepQLearning.jl"
version = "0.6.4"
version = "0.6.5"

[deps]
BSON = "fbb218c0-5317-5bc6-957e-2ee96dd4b1f0"
Expand All @@ -10,8 +10,7 @@ EllipsisNotation = "da5c29d0-fa7d-589e-88eb-ea29b0a81949"
Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
POMDPLinter = "f3bd98c0-eb40-45e2-9eb1-f2763262d755"
POMDPModelTools = "08074719-1b2a-587c-a292-00f91cc44415"
POMDPPolicies = "182e52fb-cfd0-5e46-8c26-fd0667c990f4"
POMDPTools = "7588e00f-9cae-40de-98dc-e0c70c48cdd7"
POMDPs = "a93abf59-7444-517b-a68a-c42f96afdd7d"
Parameters = "d96e819e-fc66-5662-9728-84c9c7592b0a"
Printf = "de0858da-6303-5e67-8744-51eddeeeb8d7"
Expand All @@ -25,8 +24,7 @@ CommonRLInterface = "0.2, 0.3"
EllipsisNotation = "0.4, 1.0"
Flux = "0.10, 0.11, 0.12"
POMDPLinter = "0.1"
POMDPModelTools = "0.3.4"
POMDPPolicies = "0.3, 0.4"
POMDPTools = "0.1"
POMDPs = "0.9"
Parameters = "0.12"
StatsBase = "0.32, 0.33"
Expand Down
2 changes: 1 addition & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ using POMDPs
using Flux
using POMDPModels
using POMDPSimulators
using POMDPPolicies
using POMDPTools

# load MDP model from POMDPModels or define your own!
mdp = SimpleGridWorld();
Expand Down
3 changes: 1 addition & 2 deletions src/DeepQLearning.jl
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,7 @@ using Printf
using Parameters
using Flux
using BSON
using POMDPModelTools
using POMDPPolicies
using POMDPTools
using POMDPLinter
using LinearAlgebra
using TensorBoardLogger: TBLogger, log_value
Expand Down
6 changes: 3 additions & 3 deletions src/policy.jl
Original file line number Diff line number Diff line change
Expand Up @@ -67,9 +67,9 @@ POMDPs.action(policy::NNPolicy, o) = _action(policy, o)
POMDPs.action(policy::NNPolicy{P}, s) where {P <: MDP} = _action(policy, POMDPs.convert_s(Array{Float32}, s, policy.problem))
POMDPs.action(policy::NNPolicy{P}, o) where {P <: POMDP} = _action(policy, POMDPs.convert_o(Array{Float32}, o, policy.problem))

POMDPPolicies.actionvalues(policy::NNPolicy, o) = _actionvalues(policy, o)
POMDPPolicies.actionvalues(policy::NNPolicy{P}, s) where {P<:MDP} = _actionvalues(policy, POMDPs.convert_s(Array{Float32}, s, policy.problem))
POMDPPolicies.actionvalues(policy::NNPolicy{P}, o) where {P<:POMDP} = _actionvalues(policy, POMDPs.convert_o(Array{Float32}, o, policy.problem))
POMDPTools.actionvalues(policy::NNPolicy, o) = _actionvalues(policy, o)
POMDPTools.actionvalues(policy::NNPolicy{P}, s) where {P<:MDP} = _actionvalues(policy, POMDPs.convert_s(Array{Float32}, s, policy.problem))
POMDPTools.actionvalues(policy::NNPolicy{P}, o) where {P<:POMDP} = _actionvalues(policy, POMDPs.convert_o(Array{Float32}, o, policy.problem))

POMDPs.value(policy::NNPolicy, o) = _value(policy, o)
POMDPs.value(policy::NNPolicy{P}, s) where {P <: MDP} = _value(policy, POMDPs.convert_s(Array{Float32}, s, policy.problem))
Expand Down
2 changes: 1 addition & 1 deletion test/flux_test.jl
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,8 @@ using Random
using DeepQLearning
using POMDPModels
using POMDPSimulators
using POMDPTools
using RLInterface
using POMDPPolicies
using Test
using Flux

Expand Down
2 changes: 1 addition & 1 deletion test/prototype.jl
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@ using Revise
using Random
using BenchmarkTools
using POMDPs
using POMDPModelTools
using POMDPTools
# using CuArrays
using Flux
using DeepQLearning
Expand Down
2 changes: 1 addition & 1 deletion test/runtests.jl
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
using DeepQLearning
using POMDPModels
using POMDPSimulators
using POMDPPolicies
using POMDPTools
using Flux
using Random
using StaticArrays
Expand Down
2 changes: 1 addition & 1 deletion test/test_env.jl
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
using POMDPs
using POMDPModelTools
using POMDPTools

# Define a test environment
# it has 2 states and ends after taking 5 actions
Expand Down

2 comments on commit 5e8608e

@zsunberg
Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@JuliaRegistrator
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Registration pull request created: JuliaRegistries/General/64954

After the above pull request is merged, it is recommended that a tag is created on this repository for the registered package version.

This will be done automatically if the Julia TagBot GitHub Action is installed, or can be done manually through the GitHub interface, or via:

git tag -a v0.6.5 -m "<description of version>" 5e8608e10e5a29c937e2d587a010b59911e20b61
git push origin v0.6.5

Please sign in to comment.