gusucode.com > 马尔科夫决策过程包括一些例程源码程序 > test1.m
nrows = 5; ncols = 5; obstacle = zeros(nrows, ncols); terminal = zeros(nrows, ncols); psucc_act = 1.0; absorb = 0; wrap_around = 0; noop = 0; nrows = 4; ncols = 3; obstacle = zeros(nrows, ncols); obstacle(2,2) = 1; obstacle(4,3)=1; terminal = zeros(nrows, ncols); psucc_act = 0.8; absorb = 0; wrap_around = 1; noop = 0; [T, T2] = mk_grid_world(nrows, ncols, psucc_act, obstacle, terminal, absorb, wrap_around, noop); [A, A2] = mk_grid2(nrows, ncols, psucc_act, obstacle, terminal, absorb, wrap_around, noop);