% Qiao et al., "Deep Reinforcement Learning for Cooperative Content Caching in
% Vehicular Edge Computing and Networks", IEEE Internet of Things Journal 7 (2020).
@article{15819,
  author    = {Qiao, G. and Leng, Supeng and Maharjan, Sabita and Zhang, Yan and Ansari, Nirwan},
  title     = {Deep Reinforcement Learning for Cooperative Content Caching in Vehicular Edge Computing and Networks},
  journal   = {{IEEE} Internet of Things Journal},
  volume    = {7},
  pages     = {247--257},
  year      = {2020},
  month     = jan,
  publisher = {IEEE},
  doi       = {10.1109/JIOT.2019.2945640},
  url       = {https://ieeexplore.ieee.org/abstract/document/8879573},
  abstract  = {In this article, we propose a cooperative edge caching scheme, a new paradigm to jointly optimize the content placement and content delivery in the vehicular edge computing and networks, with the aid of the flexible trilateral cooperations among a macro-cell station, roadside units, and smart vehicles. We formulate the joint optimization problem as a double time-scale Markov decision process (DTS-MDP), based on the fact that the time-scale of content timeliness changes less frequently as compared to the vehicle mobility and network states during the content delivery process. At the beginning of the large time-scale, the content placement/updating decision can be obtained according to the content popularity, vehicle driving paths, and resource availability. On the small time-scale, the joint vehicle scheduling and bandwidth allocation scheme is designed to minimize the content access cost while satisfying the constraint on content delivery latency. To solve the long-term mixed integer linear programming (LT-MILP) problem, we propose a nature-inspired method based on the deep deterministic policy gradient (DDPG) framework to obtain a suboptimal solution with a low computation complexity. The simulation results demonstrate that the proposed cooperative caching system can reduce the system cost, as well as the content delivery latency, and improve content hit ratio, as compared to the noncooperative and random edge caching schemes.},
}