IoT-Based Reinforcement Learning Using Probabilistic Model for Determining Extensive Exploration through Computational Intelligence for Next-Generation Techniques

<table class="table-group" id="tab1"><tr><td><table class="table"><tr><td class="thead-hr" colspan="2"><hr/></td></tr><tr class="thead"><td class="align_left">Hyperparameters</td><td class="align_center">Value</td></tr><tr><td class="thead-hr" colspan="2"><hr/></td></tr><tr><td class="align_left">Discount parameters <svg height="9.39034pt" id="M94" style="vertical-align:-3.42943pt" version="1.1" viewbox="-0.0498162 -5.96091 6.63704 9.39034" width="6.63704pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M478 372C478 418 458 448 431 448C409 448 389 431 389 410C389 404 391 400 394 395C398 388 406 371 406 348C406 253 308 122 251 51H249C254 122 249 257 231 336C212 421 189 448 159 448C126 448 75 412 23 327L48 306C83 354 103 371 115 371C125 371 134 360 144 334C185 224 192 64 183 -19C146 -100 116 -202 110 -244L125 -261C154 -259 208 -234 222 -220C222 -194 225 -84 235 -23C247 -3 273 36 308 79C379 165 478 288 478 372Z"></path></g></svg></td><td class="align_center">0.99</td></tr><tr><td class="align_left">Batch size <svg height="6.1673pt" id="M95" style="vertical-align:-0.2063904pt" version="1.1" viewbox="-0.0498162 -5.96091 6.6501 6.1673" width="6.6501pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M495 86L479 114C446 82 419 66 409 66C401 66 401 72 406 97C420 166 436 231 453 297C489 435 454 448 428 448C406 448 384 439 354 422C305 394 222 327 161 247H159L183 345C200 415 194 448 173 448C143 448 82 410 23 351L38 325C64 349 95 371 105 371C111 371 116 365 109 336L25 -4L31 -12C50 -4 77 3 107 9C119 69 132 122 145 168C197 254 321 381 370 381C387 381 393 374 378 305L329 95C309 17 320 -12 345 -12C372 -12 430 19 495 86Z"></path></g></svg></td><td class="align_center">128</td></tr><tr><td class="align_left">Memory pool capacity</td><td class="align_center">100</td></tr><tr><td class="align_left">Number of learners <svg 
height="8.68572pt" id="M96" style="vertical-align:-0.0498209pt" version="1.1" viewbox="-0.0498162 -8.6359 9.95144 8.68572" width="9.95144pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M743 650H503L496 622L527 618C563 613 564 603 532 573C449 495 371 431 323 392C301 374 272 355 246 346L280 522C297 609 300 614 379 622L385 650H135L129 622C209 614 215 609 198 522L124 133C106 39 99 35 23 28L17 0H271L277 28C193 35 192 39 208 133L239 316C264 328 280 325 303 288C368 183 435 90 502 0H652L659 28C602 34 584 43 543 94C495 154 403 283 347 369L574 554C634 603 659 612 735 624L743 650Z"></path></g></svg></td><td class="align_center">10</td></tr><tr><td class="align_left">Parameter prior mean \(\bar{\theta}\)</td><td class="align_center">0</td></tr>
<tr><td class="align_left">Parameter prior variance <svg height="9.49473pt" id="M98" style="vertical-align:-0.2063999pt" version="1.1" viewbox="-0.0498162 -9.28833 7.30254 9.49473" width="7.30254pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M529 97L508 118C475 75 449 58 438 58C428 58 421 66 415 104C393 234 374 403 364 496C345 670 307 712 254 712C220 712 174 691 153 669L161 645C176 653 194 658 206 658C237 658 261 640 278 562C287 522 290 483 293 434C223 269 110 105 23 9L32 -12C59 -6 85 0 108 7C152 64 251 252 300 366C307 297 315 221 337 82C346 24 363 -12 393 -12C425 -12 475 13 529 97Z"></path></g></svg></td><td class="align_center">10</td></tr><tr><td class="align_left">Sampling interval <svg height="12.2075pt" id="M99" style="vertical-align:-0.04980087pt" version="1.1" viewbox="-0.0498162 -12.1577 34.9876 12.2075" width="34.9876pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M620 675H597C578 656 570 650 541 650H144C112 650 104 653 94 675H72C59 618 42 552 23 493L53 491C71 534 88 564 105 585C124 608 144 615 238 615H290L197 121C182 40 174 34 88 28L82 0H361L367 28C275 34 266 38 281 121L374 615H441C522 615 543 608 553 583C562 560 566 531 565 493L597 494C603 551 612 629 620 675Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,8.285,-5.741)"><path d="M327 325C324 350 312 408 304 433C283 442 256 451 213 451C120 451
59 391 59 320C59 243 125 210 188 181C237 158 266 136 266 93C266 52 231 24 195 24C134 24 93 81 74 148L42 143C42 106 51 37 59 23C78 8 125 -12 177 -12C257 -12 345 35 345 127C345 198 292 234 216 264C171 283 131 305 131 348C131 387 156 416 195 416C243 416 277 378 297 317L327 325Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,11.743,-5.741)"><path d="M442 39L431 68C420 63 406 57 394 57C377 57 359 71 359 118V301C359 353 349 393 314 424C291 443 261 451 230 451C171 438 107 401 79 381C59 366 46 355 46 340C46 316 72 295 91 295C106 295 117 303 122 319C131 350 139 371 152 384C163 397 178 404 197 404C246 404 281 365 281 293V278C260 262 186 232 124 213C69 194 41 161 41 112C41 47 92 -12 163 -12C195 -12 243 25 283 51C288 35 293 22 308 7C319 -4 339 -12 354 -12L442 39ZM281 87C262 68 226 51 199 51C169 51 129 74 129 126C129 162 151 181 190 198C211 208 259 229 281 240V87Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,15.747,-5.741)"><path d="M810 0V30C751 35 744 40 744 106V296C744 396 694 451 614 451C583 451 558 438 537 425C512 409 485 391 454 368C434 420 390 451 342 451C309 451 285 439 260 424C228 405 206 387 185 372V453C141 434 90 421 43 413V386C102 378 105 373 105 309V106C105 41 96 35 29 30V0H243V30C194 35 185 41 185 106V335C216 360 256 389 297 389C357 389 384 348 384 275V106C384 41 374 35 312 30V0H530V30C475 35 465 41 465 104V294C465 313 464 324 463 336C502 367 539 389 576 389C637 389 663 346 663 274V109C663 41 653 35 593 30V0H810Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,23.154,-5.741)"><path d="M173 382V461C125 442 68 425 25 418V390C88 382 92 382 92 317V-127C92 -191 84 -199 18 -204V-235H259V-204C180 -196 173 -192 173 -120V7C188 -1 212 -11 243 -12C375 12 495 109 495 261C495 361 427 451 316 451C303 451 283 446 266 435L173 382ZM173 345C200 365 243 388 274 388C346 388 409 329 409 222C409 111 353 40 266 40C231 40 196 56 173 79V345Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,27.949,-5.741)"><path d="M244 0V30C178 35 170 41 170 107V710C136 697 72 680 18 
675V647C83 642 89 639 89 572V107C89 43 80 35 16 30V0H244Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,30.315,-5.741)"><path d="M384 109C349 76 310 59 268 59C197 59 123 113 120 245C240 248 367 259 384 262C403 266 407 275 407 296C407 376 338 451 254 451H253C201 451 148 425 105 378C65 334 39 272 39 203C39 88 112 -12 235 -12C266 -12 339 5 402 84L384 109ZM230 411C285 411 319 365 319 313C319 298 313 293 294 293C236 291 180 290 125 290C141 370 185 411 230 411Z"></path></g></svg></td><td class="align_center">20</td></tr><tr><td class="align_left">Target network update interval <svg height="11.2576pt" id="M100" style="vertical-align:-0.04979992pt" version="1.1" viewbox="-0.0498162 -11.2078 30.3566 11.2576" width="30.3566pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M620 675H597C578 656 570 650 541 650H144C112 650 104 653 94 675H72C59 618 42 552 23 493L53 491C71 534 88 564 105 585C124 608 144 615 238 615H290L197 121C182 40 174 34 88 28L82 0H361L367 28C275 34 266 38 281 121L374 615H441C522 615 543 608 553 583C562 560 566 531 565 493L597 494C603 551 612 629 620 675Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,8.285,-5.741)"><path d="M303 37L293 66C280 59 256 49 231 49S173 63 173 143V396H281C294 404 298 428 287 439H173V575L158 577L92 509V439H46L17 408L22 396H92V107C92 27 128 -12 192 -12C203 -12 218 -9 237 2L303 37Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,11.179,-5.741)"><path d="M442 39L431 68C420 63 406 57 394 57C377 57 359 71 359 118V301C359 353 349 393 314 424C291 443 261 451 230 451C171 438 107 401 79 381C59 366 46 355 46 340C46 316 72 295 91 295C106 295 117 303 122 319C131 350 139 371 152 384C163 397 178 404 197 404C246 404 281 365 281 293V278C260 262 186 232 124 213C69 194 41 161 41 112C41 47 92 -12 163 -12C195 -12 243 25 283 51C288 35 293 22 308 7C319 -4 339 -12 354 -12L442 39ZM281 87C262 68 226 51 199 51C169 51 129 74 129 126C129 162 151 181 190 198C211 208 
259 229 281 240V87Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,15.183,-5.741)"><path d="M185 344V453C137 433 92 421 41 413V386C100 378 104 375 104 310V106C104 41 97 35 33 30V0H268V30C190 35 185 41 185 107V283C206 340 240 371 267 371C282 371 296 364 310 351C316 344 325 343 336 348C357 357 369 378 369 399C369 424 345 451 310 451C262 451 219 397 187 344H185Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,18.568,-5.741)"><path d="M472 439C432 432 382 428 334 425C303 442 271 451 236 451H235C158 451 54 398 54 285C54 216 97 171 140 152C124 133 93 105 53 90C52 81 55 63 64 48C77 27 102 5 137 -6C115 -22 77 -53 57 -73C40 -88 32 -107 32 -130C32 -189 96 -253 208 -253C340 -253 461 -159 461 -56C461 44 378 63 314 63C281 63 246 62 207 62C163 62 145 80 145 99C145 114 160 130 175 141C191 138 210 136 226 136C314 136 405 188 405 294C405 329 393 359 376 382L433 378C448 387 469 415 477 430L472 439ZM226 417C282 417 320 364 320 288S281 172 236 171C180 171 142 224 142 300S182 417 226 417ZM248 -9C291 -9 319 -11 346 -22S390 -57 390 -90C390 -151 339 -199 246 -199C171 -199 114 -159 114 -106C114 -79 132 -53 159 -30C178 -15 200 -9 248 -9Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,22.863,-5.741)"><path d="M384 109C349 76 310 59 268 59C197 59 123 113 120 245C240 248 367 259 384 262C403 266 407 275 407 296C407 376 338 451 254 451H253C201 451 148 425 105 378C65 334 39 272 39 203C39 88 112 -12 235 -12C266 -12 339 5 402 84L384 109ZM230 411C285 411 319 365 319 313C319 298 313 293 294 293C236 291 180 290 125 290C141 370 185 411 230 411Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,26.812,-5.741)"><path d="M303 37L293 66C280 59 256 49 231 49S173 63 173 143V396H281C294 404 298 428 287 439H173V575L158 577L92 509V439H46L17 408L22 396H92V107C92 27 128 -12 192 -12C203 -12 218 -9 237 2L303 37Z"></path></g></svg></td><td class="align_center">20</td></tr><tr class="table-tr"><td colspan="2"><hr class="tbody-hr"/></td></tr></table></td></tr></table>

Computational Intelligence and Neuroscience

tab1

Table 1

Table 1: IoT-Based Reinforcement Learning Using Probabilistic Model for Determining Extensive Exploration through Computational Intelligence for Next-Generation Techniques 

Table 1 | IoT-Based Reinforcement Learning Using Probabilistic Model for Determining Extensive Exploration through Computational Intelligence for Next-Generation Techniques