Skip to content

Commit 4ff44cf

Browse files
committed
Removing buffers
Signed-off-by: Linda-Stadter <[email protected]>
1 parent 0159d90 commit 4ff44cf

File tree

6 files changed: 2 additions and 142 deletions.

cpp/include/tensorrt_llm/batch_manager/runtimeBuffers.h

Lines changed: 1 addition & 1 deletion
@@ -168,7 +168,7 @@ class RuntimeBuffers
 
 public:
     //! Additional buffers depending on model type
-    std::shared_ptr<TransformerBuffers> transformerBuffers;
+    std::unique_ptr<TransformerBuffers> transformerBuffers;
     std::unique_ptr<RnnStateBuffers> rnnStateBuffers;
 
     //! Encoder-Decoder

cpp/tensorrt_llm/batch_manager/runtimeBuffers.cpp

Lines changed: 1 addition & 1 deletion
@@ -84,7 +84,7 @@ void RuntimeBuffers::create(SizeType32 maxBatchSize, SizeType32 maxBeamWidth,
 
     if (modelConfig.isTransformerBased())
     {
-        transformerBuffers = std::make_shared<TransformerBuffers>(maxBatchSize, maxBeamWidth, maxAttentionWindowVec,
+        transformerBuffers = std::make_unique<TransformerBuffers>(maxBatchSize, maxBeamWidth, maxAttentionWindowVec,
             maxAttentionWindow, sinkTokenLen, runtime, modelConfig, worldConfig);
     }
     if (modelConfig.isRnnBased())

cpp/tensorrt_llm/nanobind/CMakeLists.txt

Lines changed: 0 additions & 1 deletion
@@ -6,7 +6,6 @@ set(TRTLLM_NB_MODULE
 set(SRCS
     batch_manager/algorithms.cpp
     batch_manager/bindings.cpp
-    batch_manager/buffers.cpp
     batch_manager/cacheTransceiver.cpp
     batch_manager/kvCacheManager.cpp
     batch_manager/llmRequest.cpp

cpp/tensorrt_llm/nanobind/batch_manager/buffers.cpp

Lines changed: 0 additions & 108 deletions
This file was deleted.

cpp/tensorrt_llm/nanobind/batch_manager/buffers.h

Lines changed: 0 additions & 29 deletions
This file was deleted.

cpp/tensorrt_llm/nanobind/bindings.cpp

Lines changed: 0 additions & 2 deletions
@@ -33,7 +33,6 @@
 #include "tensorrt_llm/common/quantization.h"
 #include "tensorrt_llm/nanobind/batch_manager/algorithms.h"
 #include "tensorrt_llm/nanobind/batch_manager/bindings.h"
-#include "tensorrt_llm/nanobind/batch_manager/buffers.h"
 #include "tensorrt_llm/nanobind/batch_manager/cacheTransceiver.h"
 #include "tensorrt_llm/nanobind/batch_manager/kvCacheManager.h"
 #include "tensorrt_llm/nanobind/batch_manager/llmRequest.h"
@@ -474,7 +473,6 @@ NB_MODULE(TRTLLM_NB_MODULE, m)
     tb::kv_cache_manager::KVCacheManagerBindings::initBindings(mInternalBatchManager);
     tb::BasePeftCacheManagerBindings::initBindings(mInternalBatchManager);
     tb::CacheTransceiverBindings::initBindings(mInternalBatchManager);
-    tpb::Buffers::initBindings(mInternalBatchManager);
 
     auto mInternalAlgorithms = mInternal.def_submodule("algorithms", "Algorithms internal bindings");
     tpb::algorithms::initBindings(mInternalAlgorithms);

0 commit comments

Comments
 (0)