algo/python/28_binary_heap/binary_heap.py

218 lines
4.7 KiB
Python
Raw Normal View History

2018-11-26 20:03:25 +08:00
#!/usr/bin/python
# -*- coding: UTF-8 -*-
import math
import random
class BinaryHeap:
"""
大顶堆
"""
2018-11-28 15:30:36 +08:00
def __init__(self, data=None, capacity=100):
2018-11-26 20:03:25 +08:00
self._data = []
2018-11-28 15:30:36 +08:00
self._capacity = capacity
2018-11-26 20:03:25 +08:00
if type(data) is list:
2018-11-28 15:30:36 +08:00
if len(data) > self._capacity:
raise Exception('Heap oversize, capacity:{}, data size:{}'.format(self._capacity, len(data)))
2018-11-27 10:53:31 +08:00
self._type_assert(data)
2018-11-26 20:03:25 +08:00
self._data = data
self._length = len(self._data)
def heapify(self):
"""
堆化
:return:
"""
self._heapify(self._data, self._length-1)
def _heapify(self, data, tail_idx):
"""
堆化内部实现
:param data: 需要堆化的数据
:param tail_idx: 尾元素的索引
:return:
"""
# heapify data[:tail_idx+1]
if tail_idx <= 0:
return
# idx of the Last Parent node
lp = (tail_idx - 1) // 2
for i in range(lp, -1, -1):
self._heap_down(data, i, tail_idx)
@staticmethod
def _heap_down(data, idx, tail_idx):
"""
将指定的位置堆化
:param data: 需要堆化的数据
:param idx: data: 中需要堆化的位置
:param tail_idx: 尾元素的索引
:return:
"""
assert type(data) is list
lp = (tail_idx - 1) // 2
# top-down
while idx <= lp:
# Left and Right Child index
lc = 2 * idx + 1
rc = lc + 1
# right child exists
if rc <= tail_idx:
tmp = lc if data[lc] > data[rc] else rc
else:
tmp = lc
if data[tmp] > data[idx]:
data[tmp], data[idx] = data[idx], data[tmp]
idx = tmp
else:
break
def insert(self, num):
"""
插入
:param num:
:return:
"""
2018-11-28 15:30:36 +08:00
if self._length < self._capacity:
if self._insert(self._data, num):
self._length += 1
return True
return False
2018-11-26 20:03:25 +08:00
@staticmethod
def _insert(data, num):
"""
堆中插入元素的内部实现
:param data:
:param num:
:return:
"""
assert type(data) is list
assert type(num) is int
data.append(num)
length = len(data)
# idx of New Node
nn = length - 1
# bottom-up
while nn > 0:
p = (nn-1) // 2
if data[nn] > data[p]:
data[nn], data[p] = data[p], data[nn]
nn = p
else:
break
return True
2018-11-28 15:30:36 +08:00
def get_top(self):
2018-11-26 20:03:25 +08:00
"""
2018-11-28 15:30:36 +08:00
取堆顶
2018-11-26 20:03:25 +08:00
:return:
"""
2018-11-28 15:30:36 +08:00
if self._length <= 0:
return None
return self._data[0]
def remove_top(self):
"""
取堆顶
:return:
"""
ret = None
if self._length > 0:
ret = self._remove_top(self._data)
2018-11-26 20:03:25 +08:00
self._length -= 1
2018-11-28 15:30:36 +08:00
return ret
2018-11-26 20:03:25 +08:00
@staticmethod
2018-11-28 15:30:36 +08:00
def _remove_top(data):
2018-11-26 20:03:25 +08:00
"""
2018-11-28 15:30:36 +08:00
取堆顶内部实现
2018-11-26 20:03:25 +08:00
:param data:
:return:
"""
assert type(data) is list
length = len(data)
if length == 0:
2018-11-28 15:30:36 +08:00
return None
2018-11-26 20:03:25 +08:00
data[0], data[-1] = data[-1], data[0]
2018-11-28 15:30:36 +08:00
ret = data.pop()
2018-11-26 20:03:25 +08:00
length -= 1
# length == 0 or == 1, return
if length > 1:
BinaryHeap._heap_down(data, 0, length-1)
2018-11-28 15:30:36 +08:00
return ret
2018-11-26 20:03:25 +08:00
@staticmethod
2018-11-27 10:53:31 +08:00
def _type_assert(nums):
assert type(nums) is list
for n in nums:
assert type(n) is int
2018-11-26 20:03:25 +08:00
@staticmethod
def _draw_heap(data):
"""
格式化打印
:param data:
:return:
"""
length = len(data)
if length == 0:
return 'empty heap'
ret = ''
for i, n in enumerate(data):
ret += str(n)
# 每行最后一个换行
if i == 2**int(math.log(i+1, 2)+1) - 2 or i == len(data) - 1:
ret += '\n'
else:
ret += ', '
return ret
def __repr__(self):
return self._draw_heap(self._data)
if __name__ == '__main__':
nums = list(range(10))
random.shuffle(nums)
bh = BinaryHeap(nums)
print('--- before heapify ---')
print(bh)
# heapify
bh.heapify()
print('--- after heapify ---')
print(bh)
# insert
print('--- insert ---')
2018-11-28 15:30:36 +08:00
if bh.insert(8):
print('insert success')
else:
print('insert fail')
2018-11-26 20:03:25 +08:00
print(bh)
2018-11-28 15:30:36 +08:00
# get top
print('--- get top ---')
print('get top of the heap: {}'.format(bh.get_top()))
bh.remove_top()
2018-11-26 20:03:25 +08:00
print(bh)