Skip to content
Open
Show file tree
Hide file tree
Changes from 5 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 6 additions & 0 deletions src/neural/backends/cuda/network_cuda.cc
Original file line number Diff line number Diff line change
Expand Up @@ -893,6 +893,12 @@ class CudaNetwork : public Network {
return 2 * sm_count_;
}

// Returns the preferred batch-size step for this backend: the smallest
// divisor of sm_count_ that is at least kMinPreferredStep.
//
// If sm_count_ has no such divisor (it is below kMinPreferredStep, or not
// positive), kMinPreferredStep itself is returned. The previous unbounded
// search never terminated in that case and ran into signed-integer overflow.
// NOTE(review): sm_count_ is presumably the device's multiprocessor count, and
// the fallback value for small devices is a judgement call - confirm with the
// callers of GetPreferredBatchStep().
int GetPreferredBatchStep() const override {
  constexpr int kMinPreferredStep = 7;
  // A divisor of a positive sm_count_ can never exceed sm_count_, so bounding
  // the search there keeps results identical for sm_count_ >= 7 while
  // guaranteeing termination for every other value.
  for (int step = kMinPreferredStep; step <= sm_count_; ++step) {
    if (sm_count_ % step == 0) return step;
  }
  return kMinPreferredStep;
}

// Reports the thread count for this backend: one, plus the value of
// multi_stream_.
// NOTE(review): multi_stream_ looks like a 0/1 flag, which would make the
// result 1 or 2 - confirm against its declaration.
int GetThreads() const override {
  const int thread_count = 1 + multi_stream_;
  return thread_count;
}

std::unique_ptr<NetworkComputation> NewComputation() override {
Expand Down
Loading