Skip to content

Commit c0d1d20

Browse files
authored
update Pluto version (#65)
* update Pluto version
* pass local test
1 parent 6f7f368 commit c0d1d20

24 files changed

+514
-12234
lines changed

Manifest.toml

+415 -605
Large diffs are not rendered by default.

Project.toml

+3 -2
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,7 @@
11
[deps]
22
Distributions = "31c24e10-a181-5473-b8eb-7969acd0382f"
33
Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
4+
Measures = "442fdcdd-2543-5da2-b0f3-8c86c306513e"
45
Plots = "91a5bcdd-55d7-5caf-9e0b-520d859cae80"
56
PlutoUI = "7f904dfe-b85e-4ff6-b463-dae2292396a8"
67
ReinforcementLearning = "158674fc-8238-5cab-b5ba-03dfc80d1318"
@@ -10,9 +11,9 @@ StatsPlots = "f3b207a7-027a-5e70-b257-86293d7955fd"
1011

1112
[compat]
1213
Distributions = "0.24"
13-
Flux = "0.11"
14+
Flux = "0.12"
1415
Plots = "1.10"
1516
PlutoUI = "0.7"
16-
ReinforcementLearning = "0.8"
17+
ReinforcementLearning = "0.10"
1718
StatsBase = "0.33"
1819
StatsPlots = "0.14"

notebooks/Chapter01_Tic_Tac_Toe.jl

+6 -2
Original file line number | Diff line number | Diff line change
@@ -1,11 +1,15 @@
11
### A Pluto.jl notebook ###
2-
# v0.14.3
2+
# v0.16.4
33

44
using Markdown
55
using InteractiveUtils
66

77
# ╔═╡ 9b8c8d1a-481e-11eb-1b85-91264e100b12
8-
using ReinforcementLearning
8+
begin
9+
import Pkg
10+
Pkg.activate(Base.current_project())
11+
using ReinforcementLearning
12+
end
913

1014
# ╔═╡ 7441759c-4853-11eb-3d63-2be1f95f59fe
1115
using Plots

notebooks/Chapter02_Ten_Armed_Testbed.jl

+8 -4
Original file line number | Diff line number | Diff line change
@@ -1,11 +1,15 @@
11
### A Pluto.jl notebook ###
2-
# v0.14.3
2+
# v0.16.4
33

44
using Markdown
55
using InteractiveUtils
66

77
# ╔═╡ dab179ae-4a5a-11eb-317c-c7fa9d9ccf8f
8-
using ReinforcementLearning
8+
begin
9+
import Pkg
10+
Pkg.activate(Base.current_project())
11+
using ReinforcementLearning
12+
end
913

1014
# ╔═╡ 109c4fb2-4a5b-11eb-08d5-bd6b1eb0ebe9
1115
using Plots
@@ -110,7 +114,7 @@ function bandit_testbed(
110114
trajectory=VectorSARTTrajectory()
111115
)
112116
h1 = CollectBestActions(;best_action=findmax(env.true_values)[2])
113-
h2 = TotalRewardPerEpisode()
117+
h2 = TotalRewardPerEpisode(;is_display_on_exit=false)
114118
run(agent, env, StopAfterStep(1000), ComposedHook(h1, h2))
115119
h1.isbest, h2.rewards
116120
end
@@ -198,7 +202,7 @@ function gb_bandit_testbed(
198202
)
199203

200204
h1 = CollectBestActions(;best_action=findmax(env.true_values)[2])
201-
h2 = TotalRewardPerEpisode()
205+
h2 = TotalRewardPerEpisode(;is_display_on_exit=false)
202206
run(agent, env, StopAfterStep(1000), ComposedHook(h1, h2))
203207
h1.isbest, h2.rewards
204208
end

notebooks/Chapter03_Grid_World.jl

+3 -1
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,13 @@
11
### A Pluto.jl notebook ###
2-
# v0.12.18
2+
# v0.16.4
33

44
using Markdown
55
using InteractiveUtils
66

77
# ╔═╡ bd94028c-5d8e-11eb-22b6-5fa384999fdb
88
begin
9+
import Pkg
10+
Pkg.activate(Base.current_project())
911
using ReinforcementLearning
1012
using Flux
1113
using Statistics

notebooks/Chapter04_Car_Rental.jl

+3 -1
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,13 @@
11
### A Pluto.jl notebook ###
2-
# v0.12.18
2+
# v0.16.4
33

44
using Markdown
55
using InteractiveUtils
66

77
# ╔═╡ 92081fb8-5d90-11eb-2078-ddbf87421051
88
begin
9+
import Pkg
10+
Pkg.activate(Base.current_project())
911
using ReinforcementLearning
1012
using Flux
1113
using Statistics

notebooks/Chapter04_Gambler_Problem.jl

+3 -1
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,13 @@
11
### A Pluto.jl notebook ###
2-
# v0.12.18
2+
# v0.16.4
33

44
using Markdown
55
using InteractiveUtils
66

77
# ╔═╡ f5cc0f04-5d99-11eb-3abe-bf3fccdac9e6
88
begin
9+
import Pkg
10+
Pkg.activate(Base.current_project())
911
using ReinforcementLearning
1012
using Flux
1113
using Statistics

notebooks/Chapter04_Grid_World.jl

+3 -1
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,13 @@
11
### A Pluto.jl notebook ###
2-
# v0.12.18
2+
# v0.16.4
33

44
using Markdown
55
using InteractiveUtils
66

77
# ╔═╡ 604afcfc-5d9d-11eb-0e2d-4971e8c87824
88
begin
9+
import Pkg
10+
Pkg.activate(Base.current_project())
911
using ReinforcementLearning
1012
using Flux
1113
using Statistics

0 commit comments

Comments
 (0)