LEO Satellite Channel Allocation Scheme Based on Reinforcement Learning

<table class="table-group" id="tab1"><tr><td><table class="table">
<tr><td class="thead-hr" colspan="2"><hr/></td></tr>
<tr class="thead"><td class="align_left" colspan="2">Initialize system parameters</td></tr>
<tr><td class="thead-hr" colspan="2"><hr/></td></tr>
<tr><td class="align_left">1</td><td class="align_center">Preallocation: Assign <i>M</i> channels to each beam</td></tr>
<tr><td class="align_left">2</td><td class="align_center"><b>for</b> Business request time <i>t</i> = 1 : <i>T</i></td></tr>
<tr><td class="align_left">3</td><td class="align_center"> <b>if</b> resource is rich: recycle surplus resources</td></tr>
<tr><td class="align_left">4</td><td class="align_center"> <b>else</b> resource is poor: dynamic allocation</td></tr>
<tr><td class="align_left">5</td><td class="align_center"> Allocate resources from resource pool</td></tr>
<tr><td class="align_left">6</td><td class="align_center"> Initialize parameters: learning rate <span class="nowrap"><i>α</i>,</span> discount factor <span class="nowrap"><i>γ</i>,</span> initial explore probability <span class="nowrap"><i>ε</i><sub>0</sub>,</span> <i>Q</i> table</td></tr>
<tr><td class="align_left">7</td><td class="align_center"> Reconstruct state based on business request <i>s</i> = <i>I</i></td></tr>
<tr><td class="align_left">8</td><td class="align_center"> <b>for</b> Episode = 1:max_episode</td></tr>
<tr><td class="align_left">9</td><td class="align_center">  <b>while</b> (<i>s</i><sub><i>t</i>+1</sub> is terminal state)</td></tr>
<tr><td class="align_left">10</td><td class="align_center">  Confirm initial state <i>s</i><sub><i>t</i></sub></td></tr>
<tr><td class="align_left">11</td><td class="align_center">  Update explore probability <i>ε</i></td></tr>
<tr><td class="align_left">12</td><td class="align_center">  Choose best <i>a</i><sub><i>t</i></sub><sup>*</sup> or choose randomly <i>a</i><sub><i>t</i></sub></td></tr>
<tr><td class="align_left">13</td><td class="align_center">  Execute action, get reward <i>r</i><sub><i>t</i></sub></td></tr>
<tr><td class="align_left">14</td><td class="align_center">  Update <i>Q</i> table</td></tr>
<tr><td class="align_left">15</td><td class="align_center">  Jump to next state <i>s</i><sub><i>t</i>+1</sub></td></tr>
<tr><td class="align_left">16</td><td class="align_center">  <b>End</b></td></tr>
<tr><td class="align_left">17</td><td class="align_center">  End of training, output <i>Q</i> table</td></tr>
<tr><td class="align_left">18</td><td class="align_center">  Choose best strategy according to <i>Q</i> table <i>π</i><sup>*</sup></td></tr>
<tr><td class="align_left">19</td><td class="align_center">  Channel allocation</td></tr>
<tr><td class="align_left">20</td><td class="align_center"> <b>End</b></td></tr>
<tr><td class="align_left">21</td><td class="align_center"><b>End</b></td></tr>
<tr class="table-tr"><td colspan="2"><hr class="tbody-hr"/></td></tr>
</table></td></tr></table>

Mobile Information Systems

tab1

Table 1

Table 1: LEO Satellite Channel Allocation Scheme Based on Reinforcement Learning