@comment{scholars17688: journal article; record exported from Scopus (see the url field).}
@article{scholars17688,
  author    = {Khan, F. S. and Mohd, M. N. H. and Zulkifli, S. A. B. M. and Abro, G. E. M. and Kazi, S. and Soomro, D. M.},
  title     = {Deep Reinforcement Learning Based Unmanned Aerial Vehicle ({UAV}) Control Using {3D} Hand Gestures},
  journal   = {Computers, Materials and Continua},
  publisher = {Tech Science Press},
  volume    = {72},
  number    = {3},
  pages     = {5741--5759},
  year      = {2022},
  doi       = {10.32604/cmc.2022.024927},
  issn      = {1546-2218},
  url       = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85128625765&doi=10.32604\%2fcmc.2022.024927&partnerID=40&md5=0ca90aa48129e8bdb703f0dcbca329ad},
  note      = {cited By 2},
  keywords  = {Aircraft control; Aircraft detection; Antennas; Collision avoidance; Controllers; Deep learning; Proportional control systems; Reinforcement learning; Two term control systems; 3d hand gesture; Autopilot systems; Flight controllers; Hand gesture; Hybrid framework; Maximum accuracies; Obstacles detection; Polar mask; Reinforcement learnings; Reward function; Unmanned aerial vehicles (UAV)},
  abstract  = {The evident change in the design of the autopilot system produced massive help for the aviation industry and it required frequent upgrades. Reinforcement learning delivers appropriate outcomes when considering a continuous environment where the controlling Unmanned Aerial Vehicle (UAV) required maximum accuracy. In this paper, we designed a hybrid framework, which is based on Reinforcement Learning and Deep Learning where the traditional electronic flight controller is replaced by using 3D hand gestures. The algorithm is designed to take the input from 3D hand gestures and integrate with the Deep Deterministic Policy Gradient (DDPG) to receive the best reward and take actions according to 3D hand gestures input. The UAV consist of a Jetson Nano embedded testbed, Global Positioning System (GPS) sensor module, and Intel depth camera. The collision avoidance system based on the polar mask segmentation technique detects the obstacles and decides the best path according to the designed reward function. The analysis of the results has been observed providing best accuracy and computational time using novel design framework when compared with traditional Proportional Integral Derivatives (PID) flight controller. There are six reward functions estimated for 2500, 5000, 7500, and 10000 episodes of training, which have been normalized between 0 to -4000. The best observation has been captured on 2500 episodes where the rewards are calculated for maximum value. The achieved training accuracy of polar mask segmentation for collision avoidance is 86.36. {\copyright} 2022 Tech Science Press. All rights reserved.},
}