Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions vllm/compilation/backends.py
Original file line number Diff line number Diff line change
Expand Up @@ -624,9 +624,12 @@ def __call__(self, graph: fx.GraphModule, example_inputs) -> Callable:
]

# indices of the tensors that have symbolic shapes (batch size).
# weights and static buffers have concrete shapes, so for them
# x.numel() is a plain int and they are filtered out below.
self.sym_tensor_indices = [
i for i, x in enumerate(fake_args)
if isinstance(x, torch._subclasses.fake_tensor.FakeTensor)
and not isinstance(x.numel(), int)
]

# compiler managed cudagraph input buffers
Expand Down
Loading