Longest Common Subsequence (LCS)
Posted by Dustin Boston .
Source Code Listing
code.ts
/**
* @file Longest Common Subsequence (LCS)
* @author Dustin Boston
* @see Cormen, T, Leiserson, C, Rivest, R, and Stein, C. (2001).
* _Introduction to Algorithms_. (2nd ed). The MIT Press.
*/
/**
* Computes the longest common subsequence (LCS) length and the optimal path
* matrix between two sequences. This function uses dynamic programming to build
* a table that stores the lengths of LCSs for different segments of the two
* input arrays.
*
* @template T - The type of elements in the input arrays.
* @param arrayX - The first sequence of elements.
* @param arrayY - The second sequence of elements.
* @returns A tuple containing two matrices:
*
* - `computed`: A matrix of LCS lengths for subarrays at the coordinate.
* - `trace`: A matrix of directions to trace back the LCS.
*/
export function lcsLength<T>(
arrayX: T[],
arrayY: T[],
): [computed: number[][], trace: string[][]] {
const lengthX = arrayX.length;
const lengthY = arrayY.length;
const computed: number[][] = [];
const trace: string[][] = [];
for (let i = 0; i <= lengthX; i++) {
computed[i] = Array.from({length: lengthY + 1}, () => 0);
trace[i] = Array.from({length: lengthY + 1}, () => "");
}
for (let i = 1; i <= lengthX; i++) {
for (let index = 1; index <= lengthY; index++) {
if (arrayX[i - 1] === arrayY[index - 1]) {
computed[i][index] = computed[i - 1][index - 1] + 1;
trace[i][index] = "↖";
} else if (computed[i - 1][index] >= computed[i][index - 1]) {
computed[i][index] = computed[i - 1][index];
trace[i][index] = "↑";
} else {
computed[i][index] = computed[i][index - 1];
trace[i][index] = "←";
}
}
}
return [computed, trace];
}
/**
* Recursively reconstructs the longest common subsequence (LCS) from the trace
* matrix generated by the `lcsLength` function. This function traces the
* optimal path from the bottom-right corner of the matrix to the top-left,
* building the LCS string by following the directions stored in the matrix.
*
* @template T - The type of elements in the input array.
* @param trace - The matrix containing the optimal path directions.
* @param arrayX - The sequence of elements used to generate the trace matrix.
* @param i - The current row index in the `trace` matrix to be considered.
* @param j - The current column index in the `trace` matrix to be considered.
* @returns The longest common subsequence as a string.
*/
export function printLcs<T>(
trace: string[][],
arrayX: T[],
i: number,
index: number,
): string {
if (i === 0 || index === 0) {
// Return empty when we reach the edge of the table.
return "";
}
if (trace[i][index] === "↖") {
// Include this character and continue recursion
return printLcs(trace, arrayX, i - 1, index - 1) + arrayX[i - 1];
}
if (trace[i][index] === "↑") {
// Recurse upwards
return printLcs(trace, arrayX, i - 1, index);
}
// Recurse leftwards
return printLcs(trace, arrayX, i, index - 1);
}
(() => {
const arrayX = "ABCBDAB".split("");
const arrayY = "BDCABA".split("");
const [_computed, trace] = lcsLength<string>(arrayX, arrayY);
const result = printLcs<string>(trace, arrayX, arrayX.length, arrayY.length);
if (result !== "BCBA" && result !== "BDAB") {
console.log("Did not find expected result");
}
console.log(`Longest common subsequence: ${result}`);
})();
longest_common_subsequence_test.ts
import {assertEquals} from "https://deno.land/std@0.202.0/assert/assert_equals.ts";
import {
lcsLength,
printLCS,
} from "../../../../data/algorithms/src/longest_common_subsequence.ts";
test(function lcsCase1() {
const arrayX = "ABCBDAB".split("");
const arrayY = "BDCABA".split("");
const [_computed, trace] = lcsLength<string>(arrayX, arrayY);
// Console.table(computed);
// console.table(trace);
const result = printLCS<string>(trace, arrayX, arrayX.length, arrayY.length);
assertEquals(result, "BCBA"); // OR BDAB
});
test(function numericLCS() {
const arrayX = "10010101".split("").map(Number);
const arrayY = "010110110".split("").map(Number);
const [_computed, trace] = lcsLength<number>(arrayX, arrayY);
const result = printLCS<number>(trace, arrayX, arrayX.length, arrayY.length);
assertEquals(result, "100110"); // OR 101010
});