@article{M7F9A5072, title = "Directional Autonomous Torpedo Maneuver Control Using Reinforcement Learning", journal = "The Journal of Korean Institute of Communications and Information Sciences", year = "2024", issn = "1226-4717", doi = "10.7840/kics.2024.49.5.752", author = "Emily Jimin Roh, Hyunsoo Lee, Soohyun Park, Joongheon Kim, Keonhyung Kim, Seunghwan Kim", keywords = "MDP, Reinforcement Learning, Q-Learning, Autonomous Torpedo, Directional Control", abstract = "This paper proposes a method to optimize the autonomous torpedo maneuver path for reaching the target of torpedoes, which are explosive projectile weapons in naval operations. For flexible maneuvering of torpedoes, movement in various directions is considered. Also, the obstacles in the actual marine environment and the minimization of the waypoint that occurs when the angle of the torpedoes is changed considered to increase the efficiency of torpedo maneuvering. Consequently, this study presents the environment that reflects the action of the torpedo in various directions according to the maximum rotation angle. Torpedo maneuver strategy is formulated by applying a Markov Decision Process based reinforcement learning algorithm, Q-Learning. Compared to the general Q-Learning algorithm, the superiority of the proposed algorithm is assessed and its applicability in the actual marine environment, through the success rate of reaching the target point and the number of waypoints." }