summaryrefslogtreecommitdiffstats
path: root/searchlib
diff options
context:
space:
mode:
authorArne Juul <arnej@verizonmedia.com>2020-12-02 11:06:28 +0000
committerArne Juul <arnej@verizonmedia.com>2020-12-02 11:06:28 +0000
commit2f96f28106d79001c6a6eb2662ca6378912e7266 (patch)
treeb3415ddfefa5545946396ce5a059fa43750106a8 /searchlib
parentfdbcea7e4213e5e452729f133afe85939fe4271c (diff)
remove padding for alignment
* we have control of alignment up to 8 bytes, so we can remove padding. Put in extra asserts to make sure.
Diffstat (limited to 'searchlib')
-rw-r--r--searchlib/src/vespa/searchlib/tensor/streamed_value_store.cpp27
1 files changed, 10 insertions, 17 deletions
diff --git a/searchlib/src/vespa/searchlib/tensor/streamed_value_store.cpp b/searchlib/src/vespa/searchlib/tensor/streamed_value_store.cpp
index ae2e0e7ed10..2e5e5a60b34 100644
--- a/searchlib/src/vespa/searchlib/tensor/streamed_value_store.cpp
+++ b/searchlib/src/vespa/searchlib/tensor/streamed_value_store.cpp
@@ -34,17 +34,12 @@ struct CellsMemBlock {
};
template<typename T>
-T *fix_alignment(T *ptr, size_t align)
+void check_alignment(T *ptr, size_t align)
{
static_assert(sizeof(T) == 1);
- assert((align & (align-1)) == 0); // must be 2^N
size_t ptr_val = (size_t)ptr;
size_t unalign = ptr_val & (align - 1);
- if (unalign == 0) {
- return ptr;
- } else {
- return ptr + (align - unalign);
- }
+ assert(unalign == 0);
}
} // namespace <unnamed>
@@ -60,6 +55,11 @@ StreamedValueStore::StreamedValueStore(const ValueType &tensor_type)
{
_store.addType(&_bufferType);
_store.initActiveBuffers();
+ size_t align = CellTypeUtils::alignment(_data_from_type.cell_type);
+ // max alignment we can handle is 8:
+ assert(align <= 8);
+ // alignment must be a power of two:
+ assert((align & (align-1)) == 0);
}
StreamedValueStore::~StreamedValueStore()
@@ -132,12 +132,7 @@ StreamedValueStore::get_tensor_data(EntryRef ref) const
}
vespalib::nbostream source(raw.first, raw.second);
uint32_t num_cells = source.readValue<uint32_t>();
- {
- uint32_t alignment = CellTypeUtils::alignment(_data_from_type.cell_type);
- const char *aligned_ptr = fix_alignment(source.peek(), alignment);
- size_t adjustment = aligned_ptr - source.peek();
- source.adjustReadPos(adjustment);
- }
+ check_alignment(source.peek(), CellTypeUtils::alignment(_data_from_type.cell_type));
retval.cells_ref = TypedCells(source.peek(), _data_from_type.cell_type, num_cells);
source.adjustReadPos(CellTypeUtils::mem_size(_data_from_type.cell_type, num_cells));
retval.num_subspaces = source.readValue<uint32_t>();
@@ -197,18 +192,16 @@ StreamedValueStore::store_tensor(const Value &tensor)
{
assert(tensor.type() == _tensor_type);
CellsMemBlock cells_mem(tensor.cells());
- size_t alignment = CellTypeUtils::alignment(_data_from_type.cell_type);
- size_t padding = alignment - 1;
vespalib::nbostream stream;
stream << uint32_t(cells_mem.num);
serialize_labels(tensor.index(), stream);
- size_t mem_size = stream.size() + cells_mem.total_sz + padding;
+ size_t mem_size = stream.size() + cells_mem.total_sz;
auto raw = allocRawBuffer(mem_size);
char *target = raw.data;
memcpy(target, stream.peek(), sizeof(uint32_t));
stream.adjustReadPos(sizeof(uint32_t));
target += sizeof(uint32_t);
- target = fix_alignment(target, alignment);
+ check_alignment(target, CellTypeUtils::alignment(_data_from_type.cell_type));
memcpy(target, cells_mem.ptr, cells_mem.total_sz);
target += cells_mem.total_sz;
memcpy(target, stream.peek(), stream.size());