2017-10-15 16:11:10 +00:00
|
|
|
"""
|
2020-03-04 12:40:28 +00:00
|
|
|
This is a pure Python implementation of the interpolation search algorithm.
|
2017-10-15 16:11:10 +00:00
|
|
|
"""
|
2017-11-25 09:23:50 +00:00
|
|
|
|
2017-10-15 16:11:10 +00:00
|
|
|
|
2024-07-25 15:56:31 +00:00
|
|
|
def interpolation_search(sorted_collection: list[int], item: int) -> int | None:
|
|
|
|
"""
|
|
|
|
Searches for an item in a sorted collection by interpolation search algorithm.
|
|
|
|
|
|
|
|
Args:
|
|
|
|
sorted_collection: sorted list of integers
|
|
|
|
item: item value to search
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
int: The index of the found item, or None if the item is not found.
|
|
|
|
Examples:
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 2)
|
|
|
|
1
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 4)
|
|
|
|
3
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 6) is None
|
|
|
|
True
|
|
|
|
>>> interpolation_search([], 1) is None
|
|
|
|
True
|
|
|
|
>>> interpolation_search([100], 100)
|
|
|
|
0
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 0) is None
|
|
|
|
True
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 7) is None
|
|
|
|
True
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 2)
|
|
|
|
1
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 0) is None
|
|
|
|
True
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 7) is None
|
|
|
|
True
|
|
|
|
>>> interpolation_search([1, 2, 3, 4, 5], 2)
|
|
|
|
1
|
|
|
|
>>> interpolation_search([5, 5, 5, 5, 5], 3) is None
|
|
|
|
True
|
2017-10-15 16:11:10 +00:00
|
|
|
"""
|
|
|
|
left = 0
|
|
|
|
right = len(sorted_collection) - 1
|
|
|
|
|
|
|
|
while left <= right:
|
2020-01-18 12:24:33 +00:00
|
|
|
# avoid divided by 0 during interpolation
|
2019-10-05 05:14:13 +00:00
|
|
|
if sorted_collection[left] == sorted_collection[right]:
|
|
|
|
if sorted_collection[left] == item:
|
Interpolation search - fix endless loop bug, divide 0 bug and update description (#793)
* fix endless loop bug, divide 0 bug and update description
fix an endless bug, for example, if collection = [10,30,40,45,50,66,77,93], item = 67.
fix divide 0 bug, when right=left it is not OK to point = left + ((item - sorted_collection[left]) * (right - left)) // (sorted_collection[right] - sorted_collection[left])
update 'sorted' to 'ascending sorted' in description to avoid confusion
* delete swap files
* delete 'address' and add input validation
2019-05-18 02:59:12 +00:00
|
|
|
return left
|
2024-07-25 15:56:31 +00:00
|
|
|
return None
|
Interpolation search - fix endless loop bug, divide 0 bug and update description (#793)
* fix endless loop bug, divide 0 bug and update description
fix an endless bug, for example, if collection = [10,30,40,45,50,66,77,93], item = 67.
fix divide 0 bug, when right=left it is not OK to point = left + ((item - sorted_collection[left]) * (right - left)) // (sorted_collection[right] - sorted_collection[left])
update 'sorted' to 'ascending sorted' in description to avoid confusion
* delete swap files
* delete 'address' and add input validation
2019-05-18 02:59:12 +00:00
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
point = left + ((item - sorted_collection[left]) * (right - left)) // (
|
|
|
|
sorted_collection[right] - sorted_collection[left]
|
|
|
|
)
|
2019-08-19 13:37:49 +00:00
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
# out of range check
|
|
|
|
if point < 0 or point >= len(sorted_collection):
|
2017-10-15 16:11:10 +00:00
|
|
|
return None
|
|
|
|
|
|
|
|
current_item = sorted_collection[point]
|
|
|
|
if current_item == item:
|
|
|
|
return point
|
2024-07-25 15:56:31 +00:00
|
|
|
if point < left:
|
2024-03-28 17:25:41 +00:00
|
|
|
right = left
|
|
|
|
left = point
|
|
|
|
elif point > right:
|
|
|
|
left = right
|
|
|
|
right = point
|
|
|
|
elif item < current_item:
|
|
|
|
right = point - 1
|
2017-10-15 16:11:10 +00:00
|
|
|
else:
|
2024-03-28 17:25:41 +00:00
|
|
|
left = point + 1
|
2017-10-15 16:11:10 +00:00
|
|
|
return None
|
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
|
2024-07-25 15:56:31 +00:00
|
|
|
def interpolation_search_by_recursion(
|
|
|
|
sorted_collection: list[int], item: int, left: int = 0, right: int | None = None
|
|
|
|
) -> int | None:
|
2017-10-15 16:11:10 +00:00
|
|
|
"""Pure implementation of interpolation search algorithm in Python by recursion
|
Interpolation search - fix endless loop bug, divide 0 bug and update description (#793)
* fix endless loop bug, divide 0 bug and update description
fix an endless bug, for example, if collection = [10,30,40,45,50,66,77,93], item = 67.
fix divide 0 bug, when right=left it is not OK to point = left + ((item - sorted_collection[left]) * (right - left)) // (sorted_collection[right] - sorted_collection[left])
update 'sorted' to 'ascending sorted' in description to avoid confusion
* delete swap files
* delete 'address' and add input validation
2019-05-18 02:59:12 +00:00
|
|
|
Be careful collection must be ascending sorted, otherwise result will be
|
2017-10-15 16:11:10 +00:00
|
|
|
unpredictable
|
|
|
|
First recursion should be started with left=0 and right=(len(sorted_collection)-1)
|
|
|
|
|
2024-07-25 15:56:31 +00:00
|
|
|
Args:
|
|
|
|
sorted_collection: some sorted collection with comparable items
|
|
|
|
item: item value to search
|
|
|
|
left: left index in collection
|
|
|
|
right: right index in collection
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
index of item in collection or None if item is not present
|
|
|
|
|
|
|
|
Examples:
|
|
|
|
>>> interpolation_search_by_recursion([0, 5, 7, 10, 15], 0)
|
|
|
|
0
|
|
|
|
>>> interpolation_search_by_recursion([0, 5, 7, 10, 15], 15)
|
|
|
|
4
|
|
|
|
>>> interpolation_search_by_recursion([0, 5, 7, 10, 15], 5)
|
|
|
|
1
|
|
|
|
>>> interpolation_search_by_recursion([0, 5, 7, 10, 15], 100) is None
|
|
|
|
True
|
|
|
|
>>> interpolation_search_by_recursion([5, 5, 5, 5, 5], 3) is None
|
|
|
|
True
|
|
|
|
"""
|
|
|
|
if right is None:
|
|
|
|
right = len(sorted_collection) - 1
|
2020-01-18 12:24:33 +00:00
|
|
|
# avoid divided by 0 during interpolation
|
2019-10-05 05:14:13 +00:00
|
|
|
if sorted_collection[left] == sorted_collection[right]:
|
|
|
|
if sorted_collection[left] == item:
|
Interpolation search - fix endless loop bug, divide 0 bug and update description (#793)
* fix endless loop bug, divide 0 bug and update description
fix an endless bug, for example, if collection = [10,30,40,45,50,66,77,93], item = 67.
fix divide 0 bug, when right=left it is not OK to point = left + ((item - sorted_collection[left]) * (right - left)) // (sorted_collection[right] - sorted_collection[left])
update 'sorted' to 'ascending sorted' in description to avoid confusion
* delete swap files
* delete 'address' and add input validation
2019-05-18 02:59:12 +00:00
|
|
|
return left
|
2024-07-25 15:56:31 +00:00
|
|
|
return None
|
Interpolation search - fix endless loop bug, divide 0 bug and update description (#793)
* fix endless loop bug, divide 0 bug and update description
fix an endless bug, for example, if collection = [10,30,40,45,50,66,77,93], item = 67.
fix divide 0 bug, when right=left it is not OK to point = left + ((item - sorted_collection[left]) * (right - left)) // (sorted_collection[right] - sorted_collection[left])
update 'sorted' to 'ascending sorted' in description to avoid confusion
* delete swap files
* delete 'address' and add input validation
2019-05-18 02:59:12 +00:00
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
point = left + ((item - sorted_collection[left]) * (right - left)) // (
|
|
|
|
sorted_collection[right] - sorted_collection[left]
|
|
|
|
)
|
2019-08-19 13:37:49 +00:00
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
# out of range check
|
|
|
|
if point < 0 or point >= len(sorted_collection):
|
2017-10-15 16:11:10 +00:00
|
|
|
return None
|
|
|
|
|
|
|
|
if sorted_collection[point] == item:
|
|
|
|
return point
|
2024-07-25 15:56:31 +00:00
|
|
|
if point < left:
|
Interpolation search - fix endless loop bug, divide 0 bug and update description (#793)
* fix endless loop bug, divide 0 bug and update description
fix an endless bug, for example, if collection = [10,30,40,45,50,66,77,93], item = 67.
fix divide 0 bug, when right=left it is not OK to point = left + ((item - sorted_collection[left]) * (right - left)) // (sorted_collection[right] - sorted_collection[left])
update 'sorted' to 'ascending sorted' in description to avoid confusion
* delete swap files
* delete 'address' and add input validation
2019-05-18 02:59:12 +00:00
|
|
|
return interpolation_search_by_recursion(sorted_collection, item, point, left)
|
2024-07-25 15:56:31 +00:00
|
|
|
if point > right:
|
Interpolation search - fix endless loop bug, divide 0 bug and update description (#793)
* fix endless loop bug, divide 0 bug and update description
fix an endless bug, for example, if collection = [10,30,40,45,50,66,77,93], item = 67.
fix divide 0 bug, when right=left it is not OK to point = left + ((item - sorted_collection[left]) * (right - left)) // (sorted_collection[right] - sorted_collection[left])
update 'sorted' to 'ascending sorted' in description to avoid confusion
* delete swap files
* delete 'address' and add input validation
2019-05-18 02:59:12 +00:00
|
|
|
return interpolation_search_by_recursion(sorted_collection, item, right, left)
|
2024-07-25 15:56:31 +00:00
|
|
|
if sorted_collection[point] > item:
|
2024-03-28 17:25:41 +00:00
|
|
|
return interpolation_search_by_recursion(
|
|
|
|
sorted_collection, item, left, point - 1
|
|
|
|
)
|
2024-07-25 15:56:31 +00:00
|
|
|
return interpolation_search_by_recursion(sorted_collection, item, point + 1, right)
|
2017-10-15 16:11:10 +00:00
|
|
|
|
|
|
|
|
2019-10-05 05:14:13 +00:00
|
|
|
if __name__ == "__main__":
    # Executed as a script: run the doctest examples embedded in this module.
    from doctest import testmod

    testmod()
|