2020-12-09 14:01:58 +00:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
|
2016-07-29 13:03:20 +00:00
|
|
|
"""
|
2023-10-21 18:53:34 +00:00
|
|
|
Pure Python implementations of binary search algorithms
|
2016-07-29 13:03:20 +00:00
|
|
|
|
2023-10-21 18:53:34 +00:00
|
|
|
For doctests run the following command:
|
2016-07-29 20:06:49 +00:00
|
|
|
python3 -m doctest -v binary_search.py
|
2016-07-29 13:03:20 +00:00
|
|
|
|
|
|
|
For manual testing run:
|
2020-12-09 14:01:58 +00:00
|
|
|
python3 binary_search.py
|
2016-07-29 13:03:20 +00:00
|
|
|
"""
|
2021-09-07 11:37:03 +00:00
|
|
|
from __future__ import annotations
|
|
|
|
|
2016-07-29 14:12:51 +00:00
|
|
|
import bisect
|
|
|
|
|
|
|
|
|
2020-12-09 14:01:58 +00:00
|
|
|
def bisect_left(
    sorted_collection: list[int], item: int, lo: int = 0, hi: int = -1
) -> int:
    """
    Locates the first element in a sorted array that is larger or equal to a given
    value.

    It has the same interface as
    https://docs.python.org/3/library/bisect.html#bisect.bisect_left .

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item to bisect
    :param lo: lowest index to consider (as in sorted_collection[lo:hi]); must be
        non-negative
    :param hi: past the highest index to consider (as in sorted_collection[lo:hi]);
        any negative value (including the default -1) means
        len(sorted_collection)
    :return: index i such that all values in sorted_collection[lo:i] are < item and all
        values in sorted_collection[i:hi] are >= item.
    :raises ValueError: if lo is negative

    Examples:
    >>> bisect_left([0, 5, 7, 10, 15], 0)
    0
    >>> bisect_left([0, 5, 7, 10, 15], 6)
    2
    >>> bisect_left([0, 5, 7, 10, 15], 20)
    5
    >>> bisect_left([0, 5, 7, 10, 15], 15, 1, 3)
    3
    >>> bisect_left([0, 5, 7, 10, 15], 6, 2)
    2
    >>> bisect_left([0, 5, 7, 10, 15], 6, -1)
    Traceback (most recent call last):
        ...
    ValueError: lo must be non-negative
    """
    # A negative lo would make the midpoint probe index from the end of the
    # list; reject it the same way the standard library does.
    if lo < 0:
        raise ValueError("lo must be non-negative")
    if hi < 0:
        hi = len(sorted_collection)

    while lo < hi:
        mid = lo + (hi - lo) // 2
        if sorted_collection[mid] < item:
            # Everything up to and including mid is strictly smaller than item.
            lo = mid + 1
        else:
            hi = mid

    return lo
|
|
|
|
|
|
|
|
|
2020-12-09 14:01:58 +00:00
|
|
|
def bisect_right(
    sorted_collection: list[int], item: int, lo: int = 0, hi: int = -1
) -> int:
    """
    Locates the first element in a sorted array that is larger than a given value.

    It has the same interface as
    https://docs.python.org/3/library/bisect.html#bisect.bisect_right .

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item to bisect
    :param lo: lowest index to consider (as in sorted_collection[lo:hi]); must be
        non-negative
    :param hi: past the highest index to consider (as in sorted_collection[lo:hi]);
        any negative value (including the default -1) means
        len(sorted_collection)
    :return: index i such that all values in sorted_collection[lo:i] are <= item and
        all values in sorted_collection[i:hi] are > item.
    :raises ValueError: if lo is negative

    Examples:
    >>> bisect_right([0, 5, 7, 10, 15], 0)
    1
    >>> bisect_right([0, 5, 7, 10, 15], 15)
    5
    >>> bisect_right([0, 5, 7, 10, 15], 6)
    2
    >>> bisect_right([0, 5, 7, 10, 15], 15, 1, 3)
    3
    >>> bisect_right([0, 5, 7, 10, 15], 6, 2)
    2
    >>> bisect_right([0, 5, 7, 10, 15], 6, -1)
    Traceback (most recent call last):
        ...
    ValueError: lo must be non-negative
    """
    # A negative lo would make the midpoint probe index from the end of the
    # list; reject it the same way the standard library does.
    if lo < 0:
        raise ValueError("lo must be non-negative")
    if hi < 0:
        hi = len(sorted_collection)

    while lo < hi:
        mid = lo + (hi - lo) // 2
        if sorted_collection[mid] <= item:
            # Everything up to and including mid is not larger than item.
            lo = mid + 1
        else:
            hi = mid

    return lo
|
|
|
|
|
|
|
|
|
2020-12-09 14:01:58 +00:00
|
|
|
def insort_left(
    sorted_collection: list[int], item: int, lo: int = 0, hi: int = -1
) -> None:
    """
    Insert ``item`` into an ascending sorted list in place, placing it ahead of any
    existing elements that compare equal to it.

    Mirrors the interface of
    https://docs.python.org/3/library/bisect.html#bisect.insort_left .

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item to insert
    :param lo: lowest index to consider (as in sorted_collection[lo:hi])
    :param hi: past the highest index to consider (as in sorted_collection[lo:hi])

    Examples:
    >>> sorted_collection = [0, 5, 7, 10, 15]
    >>> insort_left(sorted_collection, 6)
    >>> sorted_collection
    [0, 5, 6, 7, 10, 15]
    >>> sorted_collection = [(0, 0), (5, 5), (7, 7), (10, 10), (15, 15)]
    >>> item = (5, 5)
    >>> insort_left(sorted_collection, item)
    >>> sorted_collection
    [(0, 0), (5, 5), (5, 5), (7, 7), (10, 10), (15, 15)]
    >>> item is sorted_collection[1]
    True
    >>> item is sorted_collection[2]
    False
    >>> sorted_collection = [0, 5, 7, 10, 15]
    >>> insort_left(sorted_collection, 20)
    >>> sorted_collection
    [0, 5, 7, 10, 15, 20]
    >>> sorted_collection = [0, 5, 7, 10, 15]
    >>> insort_left(sorted_collection, 15, 1, 3)
    >>> sorted_collection
    [0, 5, 7, 15, 10, 15]
    """
    # The leftmost valid position keeps the new item before its equals.
    insertion_point = bisect_left(sorted_collection, item, lo, hi)
    sorted_collection.insert(insertion_point, item)
|
|
|
|
|
|
|
|
|
2020-12-09 14:01:58 +00:00
|
|
|
def insort_right(
    sorted_collection: list[int], item: int, lo: int = 0, hi: int = -1
) -> None:
    """
    Insert ``item`` into an ascending sorted list in place, placing it behind any
    existing elements that compare equal to it.

    Mirrors the interface of
    https://docs.python.org/3/library/bisect.html#bisect.insort_right .

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item to insert
    :param lo: lowest index to consider (as in sorted_collection[lo:hi])
    :param hi: past the highest index to consider (as in sorted_collection[lo:hi])

    Examples:
    >>> sorted_collection = [0, 5, 7, 10, 15]
    >>> insort_right(sorted_collection, 6)
    >>> sorted_collection
    [0, 5, 6, 7, 10, 15]
    >>> sorted_collection = [(0, 0), (5, 5), (7, 7), (10, 10), (15, 15)]
    >>> item = (5, 5)
    >>> insort_right(sorted_collection, item)
    >>> sorted_collection
    [(0, 0), (5, 5), (5, 5), (7, 7), (10, 10), (15, 15)]
    >>> item is sorted_collection[1]
    False
    >>> item is sorted_collection[2]
    True
    >>> sorted_collection = [0, 5, 7, 10, 15]
    >>> insort_right(sorted_collection, 20)
    >>> sorted_collection
    [0, 5, 7, 10, 15, 20]
    >>> sorted_collection = [0, 5, 7, 10, 15]
    >>> insort_right(sorted_collection, 15, 1, 3)
    >>> sorted_collection
    [0, 5, 7, 15, 10, 15]
    """
    # The rightmost valid position keeps the new item after its equals.
    insertion_point = bisect_right(sorted_collection, item, lo, hi)
    sorted_collection.insert(insertion_point, item)
|
|
|
|
|
|
|
|
|
2023-10-21 18:53:34 +00:00
|
|
|
def binary_search(sorted_collection: list[int], item: int) -> int:
    """Iterative binary search over an ascending sorted collection.

    The collection is first compared against a sorted copy of itself; if the two
    differ, a ValueError is raised instead of searching.

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item value to search
    :return: index of the found item or -1 if the item is not found
    :raises ValueError: if sorted_collection is not sorted in ascending order

    Examples:
    >>> binary_search([0, 5, 7, 10, 15], 0)
    0
    >>> binary_search([0, 5, 7, 10, 15], 15)
    4
    >>> binary_search([0, 5, 7, 10, 15], 5)
    1
    >>> binary_search([0, 5, 7, 10, 15], 6)
    -1
    """
    if list(sorted_collection) != sorted(sorted_collection):
        raise ValueError("sorted_collection must be sorted in ascending order")

    # [low, high] is the inclusive window that may still contain item.
    low, high = 0, len(sorted_collection) - 1
    while low <= high:
        middle = low + (high - low) // 2
        candidate = sorted_collection[middle]
        if candidate == item:
            return middle
        if item < candidate:
            high = middle - 1
        else:
            low = middle + 1
    return -1
|
2016-07-29 13:03:20 +00:00
|
|
|
|
|
|
|
|
2023-10-21 18:53:34 +00:00
|
|
|
def binary_search_std_lib(sorted_collection: list[int], item: int) -> int:
    """Binary search built on the standard library's ``bisect.bisect_left``.

    The collection is first compared against a sorted copy of itself; if the two
    differ, a ValueError is raised instead of searching.

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item value to search
    :return: index of the found item or -1 if the item is not found
    :raises ValueError: if sorted_collection is not sorted in ascending order

    Examples:
    >>> binary_search_std_lib([0, 5, 7, 10, 15], 0)
    0
    >>> binary_search_std_lib([0, 5, 7, 10, 15], 15)
    4
    >>> binary_search_std_lib([0, 5, 7, 10, 15], 5)
    1
    >>> binary_search_std_lib([0, 5, 7, 10, 15], 6)
    -1
    """
    if list(sorted_collection) != sorted(sorted_collection):
        raise ValueError("sorted_collection must be sorted in ascending order")

    position = bisect.bisect_left(sorted_collection, item)
    # bisect_left only reports where item would go; confirm it is really there.
    is_match = (
        position != len(sorted_collection) and sorted_collection[position] == item
    )
    return position if is_match else -1
|
2016-07-29 14:12:51 +00:00
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
|
2020-12-09 14:01:58 +00:00
|
|
|
def binary_search_by_recursion(
    sorted_collection: list[int], item: int, left: int = 0, right: int = -1
) -> int:
    """Pure implementation of a binary search algorithm in Python by recursion

    The collection must be sorted in ascending order; this is checked once, up
    front, and a ValueError is raised if it is not.

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item value to search
    :param left: lowest index to consider (inclusive)
    :param right: highest index to consider (inclusive); any negative value
        (including the default -1) means len(sorted_collection) - 1
    :return: index of the found item or -1 if the item is not found
    :raises ValueError: if sorted_collection is not sorted in ascending order

    Examples:
    >>> binary_search_by_recursion([0, 5, 7, 10, 15], 0, 0, 4)
    0
    >>> binary_search_by_recursion([0, 5, 7, 10, 15], 15, 0, 4)
    4
    >>> binary_search_by_recursion([0, 5, 7, 10, 15], 5, 0, 4)
    1
    >>> binary_search_by_recursion([0, 5, 7, 10, 15], 6, 0, 4)
    -1
    >>> binary_search_by_recursion([0, 5, 7, 10, 15], -5, 0, 4)
    -1
    >>> binary_search_by_recursion([0, 5, 7, 10, 15], 10)
    3
    """
    # The negative-right sentinel and the sortedness check apply to the
    # caller's request only. Re-applying them inside the recursion would turn
    # the legitimate empty window (left=0, right=-1) back into the whole list
    # and recurse forever when item is smaller than every element.
    if right < 0:
        right = len(sorted_collection) - 1
    if list(sorted_collection) != sorted(sorted_collection):
        raise ValueError("sorted_collection must be sorted in ascending order")
    return _recursive_search(sorted_collection, item, left, right)


def _recursive_search(
    sorted_collection: list[int], item: int, left: int, right: int
) -> int:
    """Search the inclusive window [left, right] of an already validated collection."""
    if right < left:
        return -1

    midpoint = left + (right - left) // 2

    if sorted_collection[midpoint] == item:
        return midpoint
    if sorted_collection[midpoint] > item:
        return _recursive_search(sorted_collection, item, left, midpoint - 1)
    return _recursive_search(sorted_collection, item, midpoint + 1, right)
|
|
|
|
|
2019-08-19 13:37:49 +00:00
|
|
|
|
2023-10-21 18:53:34 +00:00
|
|
|
def exponential_search(sorted_collection: list[int], item: int) -> int:
    """Pure implementation of an exponential search algorithm in Python

    Resources used:
    https://en.wikipedia.org/wiki/Exponential_search

    The collection must be sorted in ascending order; this is checked up front
    and a ValueError is raised if it is not.

    :param sorted_collection: some ascending sorted collection with comparable items
    :param item: item value to search
    :return: index of the found item or -1 if the item is not found
    :raises ValueError: if sorted_collection is not sorted in ascending order

    The search phase probes O(lg I) elements, where I is the index position of
    item if it exists; the up-front sortedness check still visits every element.

    Examples:
    >>> exponential_search([0, 5, 7, 10, 15], 0)
    0
    >>> exponential_search([0, 5, 7, 10, 15], 15)
    4
    >>> exponential_search([0, 5, 7, 10, 15], 5)
    1
    >>> exponential_search([0, 5, 7, 10, 15], 6)
    -1
    >>> exponential_search([0, 5, 7, 10, 15], -1)
    -1
    """
    if list(sorted_collection) != sorted(sorted_collection):
        raise ValueError("sorted_collection must be sorted in ascending order")

    size = len(sorted_collection)

    # Double the probe index until it passes the end of the collection or
    # reaches an element that is not smaller than item.
    bound = 1
    while bound < size and sorted_collection[bound] < item:
        bound *= 2

    # item, if present, lies in the inclusive window [bound // 2, bound].
    left = bound // 2
    right = min(bound, size - 1)

    # Binary search that window directly, so an empty window (right < left)
    # simply ends the loop and the collection is validated only once.
    while left <= right:
        midpoint = left + (right - left) // 2
        current_item = sorted_collection[midpoint]
        if current_item == item:
            return midpoint
        if current_item > item:
            right = midpoint - 1
        else:
            left = midpoint + 1
    return -1
|
|
|
|
|
|
|
|
|
|
|
|
# Search implementations exercised by the demo and benchmark loops in the
# ``__main__`` section below; each one is called there as
# ``search(collection, item)``.
searches = (  # Fastest to slowest...
    binary_search_std_lib,
    binary_search,
    exponential_search,
    binary_search_by_recursion,
)
|
|
|
|
|
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
if __name__ == "__main__":
    import doctest
    import timeit

    # Run the doctests embedded in this module first.
    doctest.testmod()

    # Show what every implementation returns for one small fixed input.
    for search in searches:
        label = search.__name__.rjust(26)
        print(f"{label}: {search([0, 5, 7, 10, 15], 10) = }")  # type: ignore[operator]

    print("\nBenchmarks...")
    setup = "collection = range(1000)"
    for search in searches:
        name = search.__name__
        elapsed = timeit.timeit(
            f"{name}(collection, 500)", setup=setup, number=5_000, globals=globals()
        )
        print(f"{name:>26}:", elapsed)

    # Interactive check: the entered numbers are sorted before searching.
    user_input = input("\nEnter numbers separated by comma: ").strip()
    collection = sorted(map(int, user_input.split(",")))
    target = int(input("Enter a single number to be found in the list: "))
    result = binary_search(sorted_collection=collection, item=target)
    if result != -1:
        print(f"{target} was found at position {result} of {collection}.")
    else:
        print(f"{target} was not found in {collection}.")
|