sglang_v0.5.2/flashinfer_0.3.1/include/flashinfer/attention/heap.h

67 lines
1.7 KiB
C++

/*
* Copyright (c) 2023 by FlashInfer team.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef FLASHINFER_ATTENTION_HEAP_H
#define FLASHINFER_ATTENTION_HEAP_H
#include <algorithm>
#include <stdexcept>
#include <utility>
#include <vector>
namespace flashinfer {
/*!
* \brief Heap data structure for (index, value) pairs
* \note minimal element on top
*/
class MinHeap {
public:
// first: index, second: cost
using Element = std::pair<int, float>;
MinHeap(int capacity) : heap_(capacity) {
for (int i = 0; i < capacity; ++i) {
heap_[i] = std::make_pair(i, 0.f);
}
}
void insert(const Element& element) {
heap_.push_back(element);
std::push_heap(heap_.begin(), heap_.end(), compare);
}
Element pop() {
std::pop_heap(heap_.begin(), heap_.end(), compare);
Element minElement = heap_.back();
heap_.pop_back();
return minElement;
}
std::vector<Element> getHeap() const { return heap_; }
private:
// Custom comparator for the min-heap: compare based on 'val' in the pair
static bool compare(const Element& a, const Element& b) {
return a.second > b.second; // create a min-heap based on val
}
std::vector<Element> heap_;
};
} // namespace flashinfer
#endif // FLASHINFER_ATTENTION_HEAP_H