// Iterate over the tuples in the sorter in batches/vectors of the given size void Sorter::VectorizedIterate( CodeGen &codegen, llvm::Value *sorter_ptr, uint32_t vector_size, uint64_t offset, Sorter::VectorizedIterateCallback &callback) const { llvm::Value *start_pos = codegen.Load(SorterProxy::tuples_start, sorter_ptr); llvm::Value *num_tuples = NumTuples(codegen, sorter_ptr); num_tuples = codegen->CreateTrunc(num_tuples, codegen.Int32Type()); if (offset != 0) { start_pos = codegen->CreateConstInBoundsGEP1_32(codegen.CharPtrType(), start_pos, offset); num_tuples = codegen->CreateSub(num_tuples, codegen.Const32(offset)); } lang::VectorizedLoop loop(codegen, num_tuples, vector_size, {}); { // Current loop range auto curr_range = loop.GetCurrentRange(); // Provide an accessor into the sorted space SorterAccess sorter_access(*this, start_pos); // Issue the callback callback.ProcessEntries(codegen, curr_range.start, curr_range.end, sorter_access); // That's it loop.LoopEnd(codegen, {}); } }
llvm::Value *Sorter::NumTuples(CodeGen &codegen, llvm::Value *sorter_ptr) const { // Pull out start and end (char **) auto *start = codegen.Load(SorterProxy::tuples_start, sorter_ptr); auto *end = codegen.Load(SorterProxy::tuples_end, sorter_ptr); // Convert both to uint64_t start = codegen->CreatePtrToInt(start, codegen.Int64Type()); end = codegen->CreatePtrToInt(end, codegen.Int64Type()); // Subtract (end - start) auto *diff = codegen->CreateSub(end, start); // Divide by pointer size (diff >> 3, or div / 8) return codegen->CreateAShr(diff, 3, "numTuples", true); }