mirror of
https://github.com/wassname/ray.git
synced 2026-06-28 21:46:57 +08:00
[rllib] replace the assertion in SyncReplayOptimizer by a warning (#4534)
This commit is contained in:
@@ -2,6 +2,7 @@ from __future__ import absolute_import
|
||||
from __future__ import division
|
||||
from __future__ import print_function
|
||||
|
||||
import logging
|
||||
import collections
|
||||
import numpy as np
|
||||
|
||||
@@ -17,6 +18,8 @@ from ray.rllib.utils.compression import pack_if_needed
|
||||
from ray.rllib.utils.timer import TimerStat
|
||||
from ray.rllib.utils.schedules import LinearSchedule
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
|
||||
class SyncReplayOptimizer(PolicyOptimizer):
|
||||
"""Variant of the local sync optimizer that supports replay (for DQN).
|
||||
@@ -69,7 +72,9 @@ class SyncReplayOptimizer(PolicyOptimizer):
|
||||
|
||||
self.replay_buffers = collections.defaultdict(new_buffer)
|
||||
|
||||
assert buffer_size >= self.replay_starts
|
||||
if buffer_size < self.replay_starts:
|
||||
logger.warning("buffer_size={} < replay_starts={}".format(
|
||||
buffer_size, self.replay_starts))
|
||||
|
||||
@override(PolicyOptimizer)
|
||||
def step(self):
|
||||
|
||||
Reference in New Issue
Block a user