Skip to content
This repository was archived by the owner on May 6, 2021. It is now read-only.

Commit 8c293d4

Browse files
authored
Reorganize code structure to support distributed reinforcement learning (#169)
* bugfixes with trajectory
* simplify trajectories
* clean up utils
* revisit extensions
* update processors
* pass tests
* reorganize code structure
* fix training/testing mode
* fix problems found in BasicDQN
* improve trajectories
* support PrioritizedTrajectory
* resolve comments
1 parent a6a3c44 commit 8c293d4

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

59 files changed

+706
-1798
lines changed

.gitignore

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
.DS_Store
2-
/Manifest.toml
2+
Manifest.toml
33
/dev/
44
/checkpoints/
55
/logs/

Project.toml

Lines changed: 4 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -6,12 +6,14 @@ version = "0.5.1"
66
[deps]
77
AbstractTrees = "1520ce14-60c1-5f80-bbc7-55ef81b5835c"
88
Adapt = "79e6a3ab-5dfb-504d-930d-738a2a938a0e"
9-
BSON = "fbb218c0-5317-5bc6-957e-2ee96dd4b1f0"
109
CUDA = "052768ef-5323-5732-b1bb-66c8b64840ba"
10+
CircularArrayBuffers = "9de3a189-e0c0-4e15-ba3b-b14b9fb0aec1"
11+
Dates = "ade2ca70-3891-5945-98fb-dc099432e06a"
1112
Distributions = "31c24e10-a181-5473-b8eb-7969acd0382f"
1213
ElasticArrays = "fdbdab4c-e67f-52f5-8c3f-e7b388dad3d4"
1314
FillArrays = "1a297f60-69ca-5386-bcde-b61e274b549b"
1415
Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
16+
Functors = "d9f16b24-f501-4c13-a1f2-28368ffc5196"
1517
GPUArrays = "0c68f7d7-f131-5f86-a1c3-88cf8149b2d7"
1618
ImageTransformations = "02fcd773-0e25-5acc-982a-7f6622650795"
1719
JLD = "4138dd39-2aa7-5051-a626-17a0bb65d9c8"
@@ -28,7 +30,7 @@ Zygote = "e88e6eb3-aa80-5325-afca-941959d7151f"
2830
[compat]
2931
AbstractTrees = "0.3"
3032
Adapt = "2"
31-
BSON = "0.2"
33+
CircularArrayBuffers = "0.1"
3234
CUDA = "1, 2.1"
3335
Distributions = "0.24"
3436
ElasticArrays = "1.2"
@@ -44,10 +46,3 @@ Setfield = "0.6, 0.7"
4446
StatsBase = "0.32, 0.33"
4547
Zygote = "0.5"
4648
julia = "1.4"
47-
48-
[extras]
49-
ReinforcementLearningEnvironments = "25e41dd2-4622-11e9-1641-f1adca772921"
50-
Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
51-
52-
[targets]
53-
test = ["Test", "ReinforcementLearningEnvironments"]

src/ReinforcementLearningCore.jl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@ export RLCore
1313

1414
include("utils/utils.jl")
1515
include("extensions/extensions.jl")
16-
include("components/components.jl")
16+
include("policies/policies.jl")
1717
include("core/core.jl")
1818

1919
end # module

src/components/agents/abstract_agent.jl

Lines changed: 0 additions & 78 deletions
This file was deleted.

src/components/agents/agent.jl

Lines changed: 0 additions & 137 deletions
This file was deleted.

src/components/agents/agents.jl

Lines changed: 0 additions & 3 deletions
This file was deleted.

src/components/agents/dyna_agent.jl

Lines changed: 0 additions & 71 deletions
This file was deleted.

src/components/components.jl

Lines changed: 0 additions & 7 deletions
This file was deleted.

0 commit comments

Comments
 (0)