2019-10-05 05:14:13 +00:00
|
|
|
"""
|
2020-06-16 08:09:19 +00:00
|
|
|
Algorithm for calculating the most cost-efficient sequence for converting one string
|
|
|
|
into another.
|
2018-03-20 19:23:09 +00:00
|
|
|
The only allowed operations are copy, replace, delete and insert, priced as follows:
|
2020-10-01 01:04:31 +00:00
|
|
|
--- Cost to copy a character is copy_cost
|
|
|
|
--- Cost to replace a character is replace_cost
|
|
|
|
--- Cost to delete a character is delete_cost
|
|
|
|
--- Cost to insert a character is insert_cost
|
2019-10-05 05:14:13 +00:00
|
|
|
"""
|
|
|
|
|
|
|
|
|
2020-10-01 01:04:31 +00:00
|
|
|
def compute_transform_tables(
    source_string: str,
    destination_string: str,
    copy_cost: int,
    replace_cost: int,
    delete_cost: int,
    insert_cost: int,
) -> tuple[list[list[int]], list[list[str]]]:
    """
    Build the dynamic-programming tables for the cheapest conversion of
    ``source_string`` into ``destination_string``.

    ``costs[r][c]`` is the minimum cost of turning the first ``r`` source
    characters into the first ``c`` destination characters, and ``ops[r][c]``
    is the last operation on that cheapest path:

    * ``"C<x>"``    -- copy character ``x``
    * ``"R<x><y>"`` -- replace ``x`` with ``y``
    * ``"D<x>"``    -- delete ``x``
    * ``"I<y>"``    -- insert ``y``
    * ``"0"``       -- the empty starting cell

    Ties are resolved in favour of copy/replace, then delete, then insert,
    because a later candidate only wins when it is strictly cheaper.

    >>> costs, operations = compute_transform_tables("cat", "cut", 1, 2, 3, 3)
    >>> costs[0][:4]
    [0, 3, 6, 9]
    >>> costs[2][:4]
    [6, 4, 3, 6]
    >>> operations[0][:4]
    ['0', 'Ic', 'Iu', 'It']
    >>> operations[3][:4]
    ['Dt', 'Dt', 'Rtu', 'Ct']

    >>> compute_transform_tables("", "", 1, 2, 3, 3)
    ([[0]], [['0']])
    """
    source_chars = [*source_string]
    destination_chars = [*destination_string]
    row_count = len(source_chars) + 1
    col_count = len(destination_chars) + 1

    costs = [[0] * col_count for _ in range(row_count)]
    ops = [["0"] * col_count for _ in range(row_count)]

    # First column: reaching an empty destination means deleting every character.
    for row, src_char in enumerate(source_chars, start=1):
        costs[row][0] = row * delete_cost
        ops[row][0] = f"D{src_char}"

    # First row: starting from an empty source means inserting every character.
    for col, dst_char in enumerate(destination_chars, start=1):
        costs[0][col] = col * insert_cost
        ops[0][col] = f"I{dst_char}"

    for row, src_char in enumerate(source_chars, start=1):
        previous_costs = costs[row - 1]
        current_costs = costs[row]
        current_ops = ops[row]

        for col, dst_char in enumerate(destination_chars, start=1):
            # Diagonal move: copy when the characters agree, otherwise replace.
            if src_char == dst_char:
                best_cost = previous_costs[col - 1] + copy_cost
                best_op = f"C{src_char}"
            else:
                best_cost = previous_costs[col - 1] + replace_cost
                best_op = f"R{src_char}" + str(dst_char)

            # Vertical move: drop the current source character.
            delete_total = previous_costs[col] + delete_cost
            if delete_total < best_cost:
                best_cost = delete_total
                best_op = f"D{src_char}"

            # Horizontal move: add the current destination character.
            insert_total = current_costs[col - 1] + insert_cost
            if insert_total < best_cost:
                best_cost = insert_total
                best_op = f"I{dst_char}"

            current_costs[col] = best_cost
            current_ops[col] = best_op

    return costs, ops
|
2018-03-20 19:23:09 +00:00
|
|
|
|
|
|
|
|
2021-08-25 11:35:36 +00:00
|
|
|
def assemble_transformation(ops: list[list[str]], i: int, j: int) -> list[str]:
    """
    Assembles the transformations based on the ops table.

    Starting at cell ``(i, j)`` the table is walked back to ``(0, 0)``:
    a copy (``C``) or replace (``R``) steps diagonally, a delete (``D``)
    steps up one row and anything else (an insert) steps left one column.
    The operations met on the way are returned in forward order, i.e. the
    order in which they have to be applied to the source string.

    The walk is iterative, so the length of the path is not limited by the
    interpreter's recursion limit.

    >>> ops = [['0', 'Ic', 'Iu', 'It'],
    ...        ['Dc', 'Cc', 'Iu', 'It'],
    ...        ['Da', 'Da', 'Rau', 'Rat'],
    ...        ['Dt', 'Dt', 'Rtu', 'Ct']]
    >>> x = len(ops) - 1
    >>> y = len(ops[0]) - 1
    >>> assemble_transformation(ops, x, y)
    ['Cc', 'Rau', 'Ct']

    >>> ops1 = [['0']]
    >>> x1 = len(ops1) - 1
    >>> y1 = len(ops1[0]) - 1
    >>> assemble_transformation(ops1, x1, y1)
    []

    >>> ops2 = [['0', 'I1', 'I2', 'I3'],
    ...         ['D1', 'C1', 'I2', 'I3'],
    ...         ['D2', 'D2', 'R23', 'R23']]
    >>> x2 = len(ops2) - 1
    >>> y2 = len(ops2[0]) - 1
    >>> assemble_transformation(ops2, x2, y2)
    ['C1', 'I2', 'R23']

    >>> long_ops = [['0'] + ['Ia'] * 5000]
    >>> len(assemble_transformation(long_ops, 0, 5000))
    5000
    """
    # Operations are collected from the last one to the first one and flipped
    # once at the end, which avoids repeated front insertions.
    backwards: list[str] = []

    while i != 0 or j != 0:
        op = ops[i][j]
        backwards.append(op)

        kind = op[0]
        if kind in {"C", "R"}:
            i -= 1
            j -= 1
        elif kind == "D":
            i -= 1
        else:
            j -= 1

    backwards.reverse()
    return backwards
|
2019-10-05 05:14:13 +00:00
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
    # Demo: convert "Python" into "Algorithms", print every intermediate string
    # to stdout and write a step-by-step log to min_cost.txt.
    # The same cost values feed both the table computation and the running
    # total below, so the two cannot drift apart.
    copy_cost, replace_cost, delete_cost, insert_cost = -1, 1, 2, 2
    _, operations = compute_transform_tables(
        "Python", "Algorithms", copy_cost, replace_cost, delete_cost, insert_cost
    )

    m = len(operations)
    n = len(operations[0])
    sequence = assemble_transformation(operations, m - 1, n - 1)

    string = list("Python")
    i = 0  # cursor: index in ``string`` of the next character to process
    cost = 0

    with open("min_cost.txt", "w") as file:
        for op in sequence:
            print("".join(string))

            if op[0] == "C":
                # ``%`` is left-associative: the template is padded to 16
                # columns first and the character is substituted afterwards.
                file.write("%-16s" % "Copy %c" % op[1])  # noqa: UP031
                file.write("\t\t\t" + "".join(string))
                file.write("\r\n")

                cost += copy_cost
                i += 1
            elif op[0] == "R":
                string[i] = op[2]

                file.write("%-16s" % ("Replace %c" % op[1] + " with " + str(op[2])))  # noqa: UP031
                file.write("\t\t" + "".join(string))
                file.write("\r\n")

                cost += replace_cost
                i += 1
            elif op[0] == "D":
                string.pop(i)

                file.write("%-16s" % "Delete %c" % op[1])  # noqa: UP031
                file.write("\t\t\t" + "".join(string))
                file.write("\r\n")

                cost += delete_cost
                # The cursor stays put: after ``pop(i)`` the next unprocessed
                # character already sits at index ``i``.
            else:
                string.insert(i, op[1])

                file.write("%-16s" % "Insert %c" % op[1])  # noqa: UP031
                file.write("\t\t\t" + "".join(string))
                file.write("\r\n")

                cost += insert_cost
                i += 1

        print("".join(string))
        print("Cost: ", cost)

        file.write("\r\nMinimum cost: " + str(cost))
|