gokererdogan's
repositories
|
data
|
old
|
EvaluateGradientApproximation.ipynb
|
LearningImportanceSamplers.ipynb
|
.gitignore
|
__init__.py
|
calculate_optimal_w_1d_adjust_mean.py
|
find_the_dot_problem.py
|
find_the_square_problem.py
|
ftd_estimate_gradient.py
|
ftd_estimate_reward.py
|
ftd_plot_learned_policy.py
|
ftd_run_chain.py
|
ftd_run_experiment.py
|
ftd_supervised.py
|
fts_estimate_gradient.py
|
fts_estimate_reward.py
|
fts_plot_learned_policy.py
|
fts_run_chain.py
|
fts_run_experiment.py
|
fts_supervised.py
|
g1d_estimate_gradient.py
|
g1d_run_chain.py
|
g1d_run_experiment.py
|
gradient_estimator.py
|
ideas.md
|
init_plotting.py
|
lddp_1d_gaussian_reference_implementation.py
|
lddp_sampler.py
|
occluding_tiles_problem.py
|
optimizer.py
|
otp_move_tile_supervised.py
|
otp_pick_tile_supervised.py
|
otp_plot_learned_policy.py
|
otp_plot_performance.py
|
otp_run_chain.py
|
otp_run_experiment.py
|
parameter_schedule.py
|
plot_manuscript_figures.py
|
plot_reward_surfaces.py
|
policy.py
|
ref_g1d.txt
|
reward.py
|
run_experiment.py
|
target_distribution.py
|
workspace.py
|