Skip to content

Commit

Permalink
share gpu fix
Browse files (browse the repository at this point in the history)
  • Loading branch information
mitya52 committed Jan 22, 2025
1 parent f75e1e8 commit 1a321e8
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions refact_webgui/webgui/selfhost_model_assigner.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -196,10 +196,10 @@ def _model_inference_setup(self, inference_config: Dict[str, Any]) -> Dict[str,
n_ctx=assignment.get("n_ctx", None),
has_loras=self._has_loras(model_name),
))
for _ in range(model_group.gpus_shard()):
if gpus[cursor]["mem_total_mb"] < model_group.required_memory_mb(self.models_db):
required_memory_exceed_available = True
cursor += 1
for _ in range(model_group.gpus_shard()):
if gpus[cursor]["mem_total_mb"] < model_group.required_memory_mb(self.models_db):
required_memory_exceed_available = True
cursor += 1

# dump configs
allowed_to_exist = set()
Expand Down

0 comments on commit 1a321e8

Please sign in to comment.