Skip to content
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions fastdeploy/engine/common_engine.py
Original file line number Diff line number Diff line change
Expand Up @@ -687,6 +687,7 @@ def _fetch_request():
else:
max_num_batched_tokens = self.cfg.model_config.max_model_len

self.check_and_free_block_tables()
tasks = self.scheduler.get_requests(
available_blocks=self.cfg.cache_config.max_block_num_per_seq,
block_size=self.cfg.cache_config.block_size,
Expand Down
2 changes: 0 additions & 2 deletions fastdeploy/engine/sched/resource_manager_v1.py
Original file line number Diff line number Diff line change
Expand Up @@ -515,8 +515,6 @@ def schedule(self):
error_reqs: list[tuple[str, str]] = []
token_budget = self.config.scheduler_config.max_num_batched_tokens

self.check_and_free_block_tables()

# First, schedule the RUNNING requests.
req_index = 0
num_decoding_req_nums = 0
Expand Down
Loading