Commit 1ed489c

author

Shunichi09

committed

Update: Cartpole Env and Cartpole models

1 parent e523720 commit 1ed489cCopy full SHA for 1ed489c

File tree

12 files changed

+475

-43

lines changed

Environments.md
PythonLinearNonlinearControl
- configs
- controllers
  - ilqr.py
- envs
  - cartpole.py
- models
  - cartpole.py
scripts
- simple_run.py
tests
- configs
  - test_cartpole.py
  - test_two_wheeled.py
- models
  - test_cartpole.py
  - test_two_wheeled.py

12 files changed

+475

-43

lines changed

`‎Environments.md‎`

Lines changed: 1 addition & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -41,7 +41,7 @@ X_g denote the goal states.`
`41`	`41`
`42`	`42`	`## [CatpoleEnv (Swing up)](PythonLinearNonlinearControl/envs/cartpole.py)`
`43`	`43`
`44`		`-System equation.`
	`44`	`+## System equation.`
`45`	`45`
`46`	`46`	`<img src="assets/cartpole.png" width="600">`
`47`	`47`

`‎PythonLinearNonlinearControl/configs/cartpole.py‎`

Lines changed: 49 additions & 11 deletions

Original file line number	Diff line number	Diff line change
`@@ -10,7 +10,11 @@ class CartPoleConfigModule():`
`10`	`10`	`INPUT_SIZE = 1`
`11`	`11`	`DT = 0.02`
`12`	`12`	`# cost parameters`
`13`		`- R = np.diag([0.01])`
	`13`	`+ R = np.diag([1.]) # 0.01 is worked for MPPI and CEM and MPPIWilliams`
	`14`	`+ # 1. is worked for iLQR`
	`15`	`+ Terminal_Weight = 1.`
	`16`	`+ Q = None`
	`17`	`+ Sf = None`
`14`	`18`	`# bounds`
`15`	`19`	`INPUT_LOWER_BOUND = np.array([-3.])`
`16`	`20`	`INPUT_UPPER_BOUND = np.array([3.])`
`@@ -128,12 +132,14 @@ def terminal_state_cost_fn(terminal_x, terminal_g_x):`
`128`	`132`	`return (6. * (terminal_x[:, 0]**2) \`
`129`	`133`	`+ 12. * ((np.cos(terminal_x[:, 2]) + 1.)**2) \`
`130`	`134`	`+ 0.1 * (terminal_x[:, 1]**2) \`
`131`		`- + 0.1 * (terminal_x[:, 3]**2))[:, np.newaxis]`
	`135`	`+ + 0.1 * (terminal_x[:, 3]**2))[:, np.newaxis] \`
	`136`	`+ * CartPoleConfigModule.Terminal_Weight`
`132`	`137`
`133`		`- return 6. * (terminal_x[0]**2) \`
	`138`	`+ return (6. * (terminal_x[0]**2) \`
`134`	`139`	`+ 12. * ((np.cos(terminal_x[2]) + 1.)**2) \`
`135`	`140`	`+ 0.1 * (terminal_x[1]**2) \`
`136`		`- + 0.1 * (terminal_x[3]**2)`
	`141`	`+ + 0.1 * (terminal_x[3]**2)) \`
	`142`	`+ * CartPoleConfigModule.Terminal_Weight`
`137`	`143`
`138`	`144`	`@staticmethod`
`139`	`145`	`def gradient_cost_fn_with_state(x, g_x, terminal=False):`
`@@ -148,9 +154,21 @@ def gradient_cost_fn_with_state(x, g_x, terminal=False):`
`148`	`154`	`or shape(1, state_size)`
`149`	`155`	`"""`
`150`	`156`	`if not terminal:`
`151`		`- return None`
	`157`	`+ cost_dx0 = 12. * x[:, 0]`
	`158`	`+ cost_dx1 = 0.2 * x[:, 1]`
	`159`	`+ cost_dx2 = 24. * (1 + np.cos(x[:, 2])) * -np.sin(x[:, 2])`
	`160`	`+ cost_dx3 = 0.2 * x[:, 3]`
	`161`	`+ cost_dx = np.stack((cost_dx0, cost_dx1,\`
	`162`	`+ cost_dx2, cost_dx3), axis=1)`
	`163`	`+ return cost_dx`
`152`	`164`
`153`		`- return None`
	`165`	`+ cost_dx0 = 12. * x[0]`
	`166`	`+ cost_dx1 = 0.2 * x[1]`
	`167`	`+ cost_dx2 = 24. * (1 + np.cos(x[2])) * -np.sin(x[2])`
	`168`	`+ cost_dx3 = 0.2 * x[3]`
	`169`	`+ cost_dx = np.array([[cost_dx0, cost_dx1, cost_dx2, cost_dx3]])`
	`170`	`+`
	`171`	`+ return cost_dx * CartPoleConfigModule.Terminal_Weight`
`154`	`172`
`155`	`173`	`@staticmethod`
`156`	`174`	`def gradient_cost_fn_with_input(x, u):`
`@@ -163,7 +181,7 @@ def gradient_cost_fn_with_input(x, u):`
`163`	`181`	`Returns:`
`164`	`182`	`l_u (numpy.ndarray): gradient of cost, shape(pred_len, input_size)`
`165`	`183`	`"""`
`166`		`- return None`
	`184`	`+ return 2.*u*np.diag(CartPoleConfigModule.R)`
`167`	`185`
`168`	`186`	`@staticmethod`
`169`	`187`	`def hessian_cost_fn_with_state(x, g_x, terminal=False):`
`@@ -179,10 +197,30 @@ def hessian_cost_fn_with_state(x, g_x, terminal=False):`
`179`	`197`	`shape(1, state_size, state_size) or`
`180`	`198`	`"""`
`181`	`199`	`if not terminal:`
`182`		`- (pred_len, _) = x.shape`
`183`		`- return None`
	`200`	`+ (pred_len, state_size) = x.shape`
	`201`	`+ hessian = np.eye(state_size)`
	`202`	`+ hessian = np.tile(hessian, (pred_len, 1, 1))`
	`203`	`+ hessian[:, 0, 0] = 12.`
	`204`	`+ hessian[:, 1, 1] = 0.2`
	`205`	`+ hessian[:, 2, 2] = 24. * -np.sin(x[:, 2]) \`
	`206`	`+ * (-np.sin(x[:, 2])) \`
	`207`	`+ + 24. * (1. + np.cos(x[:, 2])) \`
	`208`	`+ * -np.cos(x[:, 2])`
	`209`	`+ hessian[:, 3, 3] = 0.2`
	`210`	`+`
	`211`	`+ return hessian`
`184`	`212`
`185`		`- return None`
	`213`	`+ state_size = len(x)`
	`214`	`+ hessian = np.eye(state_size)`
	`215`	`+ hessian[0, 0] = 12.`
	`216`	`+ hessian[1, 1] = 0.2`
	`217`	`+ hessian[2, 2] = 24. * -np.sin(x[2]) \`
	`218`	`+ * (-np.sin(x[2])) \`
	`219`	`+ + 24. * (1. + np.cos(x[2])) \`
	`220`	`+ * -np.cos(x[2])`
	`221`	`+ hessian[3, 3] = 0.2`
	`222`	`+`
	`223`	`+ return hessian[np.newaxis, :, :] * CartPoleConfigModule.Terminal_Weight`
`186`	`224`
`187`	`225`	`@staticmethod`
`188`	`226`	`def hessian_cost_fn_with_input(x, u):`
`@@ -198,7 +236,7 @@ def hessian_cost_fn_with_input(x, u):`
`198`	`236`	`"""`
`199`	`237`	`(pred_len, _) = u.shape`
`200`	`238`
`201`		`- return None`
	`239`	`+ return np.tile(2.*CartPoleConfigModule.R, (pred_len, 1, 1))`
`202`	`240`
`203`	`241`	`@staticmethod`
`204`	`242`	`def hessian_cost_fn_with_input_state(x, u):`

`‎PythonLinearNonlinearControl/configs/first_order_lag.py‎`

Lines changed: 2 additions & 4 deletions

Original file line number	Diff line number	Diff line change
`@@ -159,11 +159,9 @@ def hessian_cost_fn_with_state(x, g_x, terminal=False):`
`159`	`159`	`"""`
`160`	`160`	`if not terminal:`
`161`	`161`	`(pred_len, _) = x.shape`
`162`		`- return -g_x[:, :, np.newaxis] \`
`163`		`- * np.tile(2.*FirstOrderLagConfigModule.Q, (pred_len, 1, 1))`
	`162`	`+ return np.tile(2.*FirstOrderLagConfigModule.Q, (pred_len, 1, 1))`
`164`	`163`
`165`		`- return -g_x[:, np.newaxis] \`
`166`		`- * np.tile(2.*FirstOrderLagConfigModule.Sf, (1, 1, 1))`
	`164`	`+ return np.tile(2.*FirstOrderLagConfigModule.Sf, (1, 1, 1))`
`167`	`165`
`168`	`166`	`@staticmethod`
`169`	`167`	`def hessian_cost_fn_with_input(x, u):`

`‎PythonLinearNonlinearControl/configs/two_wheeled.py‎`

Lines changed: 2 additions & 4 deletions

Original file line number	Diff line number	Diff line change
`@@ -153,11 +153,9 @@ def hessian_cost_fn_with_state(x, g_x, terminal=False):`
`153`	`153`	`"""`
`154`	`154`	`if not terminal:`
`155`	`155`	`(pred_len, _) = x.shape`
`156`		`- return -g_x[:, :, np.newaxis] \`
`157`		`- * np.tile(2.*TwoWheeledConfigModule.Q, (pred_len, 1, 1))`
	`156`	`+ return np.tile(2.*TwoWheeledConfigModule.Q, (pred_len, 1, 1))`
`158`	`157`
`159`		`- return -g_x[:, np.newaxis] \`
`160`		`- * np.tile(2.*TwoWheeledConfigModule.Sf, (1, 1, 1))`
	`158`	`+ return np.tile(2.*TwoWheeledConfigModule.Sf, (1, 1, 1))`
`161`	`159`
`162`	`160`	`@staticmethod`
`163`	`161`	`def hessian_cost_fn_with_input(x, u):`

`‎PythonLinearNonlinearControl/controllers/ilqr.py‎`

Lines changed: 0 additions & 5 deletions

Original file line number	Diff line number	Diff line change
`@@ -50,11 +50,6 @@ def __init__(self, config, model):`
`50`	`50`	`self.input_size = config.INPUT_SIZE`
`51`	`51`	`self.dt = config.DT`
`52`	`52`
`53`		`- # cost parameters`
`54`		`- self.Q = config.Q`
`55`		`- self.R = config.R`
`56`		`- self.Sf = config.Sf`
`57`		`-`
`58`	`53`	`# initialize`
`59`	`54`	`self.prev_sol = np.zeros((self.pred_len, self.input_size))`
`60`	`55`

`‎PythonLinearNonlinearControl/envs/cartpole.py‎`

Lines changed: 2 additions & 1 deletion

Original file line number	Diff line number	Diff line change
`@@ -37,7 +37,8 @@ def reset(self, init_x=None):`
`37`	`37`	`"""`
`38`	`38`	`self.step_count = 0`
`39`	`39`
`40`		`- self.curr_x = np.array([0., 0., 0., 0.])`
	`40`	`+ theta = np.random.randn(1)`
	`41`	`+ self.curr_x = np.array([0., 0., theta[0], 0.])`
`41`	`42`
`42`	`43`	`if init_x is not None:`
`43`	`44`	`self.curr_x = init_x`

`‎PythonLinearNonlinearControl/models/cartpole.py‎`

Lines changed: 38 additions & 11 deletions

Original file line number	Diff line number	Diff line change
`@@ -90,8 +90,41 @@ def calc_f_x(self, xs, us, dt):`
`90`	`90`
`91`	`91`	`f_x = np.zeros((pred_len, state_size, state_size))`
`92`	`92`
`93`		`- f_x[:, 0, 2] = -np.sin(xs[:, 2]) * us[:, 0]`
`94`		`- f_x[:, 1, 2] = np.cos(xs[:, 2]) * us[:, 0]`
	`93`	`+ # f_x_dot`
	`94`	`+ f_x[:, 0, 1] = np.ones(pred_len)`
	`95`	`+`
	`96`	`+ # f_theta`
	`97`	`+ tmp = ((self.mc + self.mp * np.sin(xs[:, 2])2)(-2)) \`
	`98`	`+ * self.mp * 2. * np.sin(xs[:, 2]) * np.cos(xs[:, 2])`
	`99`	`+ tmp2 = 1. / (self.mc + self.mp * (np.sin(xs[:, 2])**2))`
	`100`	`+`
	`101`	`+ f_x[:, 1, 2] = - us[:, 0] * tmp \`
	`102`	`+ - tmp * (self.mp * np.sin(xs[:, 2]) \`
	`103`	`+ * (self.l * xs[:, 3]**2 \`
	`104`	`+ + self.g * np.cos(xs[:, 2]))) \`
	`105`	`+ + tmp2 * (self.mp * np.cos(xs[:, 2]) * self.l \`
	`106`	`+ * xs[:, 3]**2 \`
	`107`	`+ + self.mp * self.g * (np.cos(xs[:, 2])**2 \`
	`108`	`+ - np.sin(xs[:, 2])**2))`
	`109`	`+ f_x[:, 3, 2] = - 1. / self.l * tmp \`
	`110`	`+ * (-us[:, 0] * np.cos(xs[:, 2]) \`
	`111`	`+ - self.mp * self.l * (xs[:, 3]**2) \`
	`112`	`+ * np.cos(xs[:, 2]) * np.sin(xs[:, 2]) \`
	`113`	`+ - (self.mc + self.mp) * self.g * np.sin(xs[:, 2])) \`
	`114`	`+ + 1. / self.l * tmp2 \`
	`115`	`+ * (us[:, 0] * np.sin(xs[:, 2]) \`
	`116`	`+ - self.mp * self.l * xs[:, 3]**2 \`
	`117`	`+ * (np.cos(xs[:, 2])2 - np.sin(xs[:, 2])2) \`
	`118`	`+ - (self.mc + self.mp) \`
	`119`	`+ * self.g * np.cos(xs[:, 2]))`
	`120`	`+`
	`121`	`+ # f_theta_dot`
	`122`	`+ f_x[:, 1, 3] = tmp2 * (self.mp * np.sin(xs[:, 2]) \`
	`123`	`+ * self.l * 2 * xs[:, 3])`
	`124`	`+ f_x[:, 2, 3] = np.ones(pred_len)`
	`125`	`+ f_x[:, 3, 3] = 1. / self.l * tmp2 \`
	`126`	`+ * (-2. * self.mp * self.l * xs[:, 3] \`
	`127`	`+ * np.cos(xs[:, 2]) * np.sin(xs[:, 2]))`
`95`	`128`
`96`	`129`	`return f_x * dt + np.eye(state_size) # to discrete form`
`97`	`130`
`@@ -139,10 +172,7 @@ def calc_f_xx(self, xs, us, dt):`
`139`	`172`
`140`	`173`	`f_xx = np.zeros((pred_len, state_size, state_size, state_size))`
`141`	`174`
`142`		`- f_xx[:, 0, 2, 2] = -np.cos(xs[:, 2]) * us[:, 0]`
`143`		`- f_xx[:, 1, 2, 2] = -np.sin(xs[:, 2]) * us[:, 0]`
`144`		`-`
`145`		`- return f_xx * dt`
	`175`	`+ raise NotImplementedError`
`146`	`176`
`147`	`177`	`def calc_f_ux(self, xs, us, dt):`
`148`	`178`	`""" hessian of model with respect to state and input in batch form`
`@@ -161,11 +191,8 @@ def calc_f_ux(self, xs, us, dt):`
`161`	`191`
`162`	`192`	`f_ux = np.zeros((pred_len, state_size, input_size, state_size))`
`163`	`193`
`164`		`- f_ux[:, 0, 0, 2] = -np.sin(xs[:, 2])`
`165`		`- f_ux[:, 1, 0, 2] = np.cos(xs[:, 2])`
	`194`	`+ raise NotImplementedError`
`166`	`195`
`167`		`- return f_ux * dt`
`168`		`-`
`169`	`196`	`def calc_f_uu(self, xs, us, dt):`
`170`	`197`	`""" hessian of model with respect to input in batch form`
`171`	`198`
`@@ -183,4 +210,4 @@ def calc_f_uu(self, xs, us, dt):`
`183`	`210`
`184`	`211`	`f_uu = np.zeros((pred_len, state_size, input_size, input_size))`
`185`	`212`
`186`		`- return f_uu * dt`
	`213`	`+ raise NotImplementedError`

`‎scripts/simple_run.py‎`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -42,9 +42,9 @@ def run(args):`
`42`	`42`	`def main():`
`43`	`43`	`parser = argparse.ArgumentParser()`
`44`	`44`
`45`		`- parser.add_argument("--controller_type", type=str, default="CEM")`
	`45`	`+ parser.add_argument("--controller_type", type=str, default="DDP")`
`46`	`46`	`parser.add_argument("--planner_type", type=str, default="const")`
`47`		`- parser.add_argument("--env", type=str, default="TwoWheeledConst")`
	`47`	`+ parser.add_argument("--env", type=str, default="CartPole")`
`48`	`48`	`parser.add_argument("--result_dir", type=str, default="./result")`
`49`	`49`
`50`	`50`	`args = parser.parse_args()`

0 commit comments

Comments

(0)

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit 1ed489c

File tree

12 files changed

12 files changed

`‎Environments.md‎`

`‎PythonLinearNonlinearControl/configs/cartpole.py‎`

`‎PythonLinearNonlinearControl/configs/first_order_lag.py‎`

`‎PythonLinearNonlinearControl/configs/two_wheeled.py‎`

`‎PythonLinearNonlinearControl/controllers/ilqr.py‎`

`‎PythonLinearNonlinearControl/envs/cartpole.py‎`

`‎PythonLinearNonlinearControl/models/cartpole.py‎`

`‎scripts/simple_run.py‎`

0 commit comments