原文链接: https://leetcode-cn.com/problems/find-the-shortest-superstring
Given an array of strings `words`, return the smallest string that contains each string in `words` as a substring. If there are multiple valid strings of the smallest length, return any of them.
You may assume that no string in `words` is a substring of another string in `words`.
Example 1:
Input: words = ["alex","loves","leetcode"] Output: "alexlovesleetcode" Explanation: All permutations of "alex","loves","leetcode" would also be accepted.
Example 2:
Input: words = ["catg","ctaagt","gcta","ttca","atgcatc"] Output: "gctaagttcatgcatc"
1 <= words.length <= 12
1 <= words[i].length <= 20
`words[i]` consists of lowercase English letters.
All the strings of `words` are unique.
给定一个字符串数组 `words`,找到以 `words` 中每个字符串作为子字符串的最短字符串。如果有多个有效最短字符串满足题目条件,返回其中 任意一个 即可。
我们可以假设 `words` 中没有字符串是 `words` 中另一个字符串的子字符串。
示例 1:
输入:words = ["alex","loves","leetcode"] 输出:"alexlovesleetcode" 解释:"alex","loves","leetcode" 的所有排列都会被接受。
示例 2:
输入:words = ["catg","ctaagt","gcta","ttca","atgcatc"] 输出:"gctaagttcatgcatc"
1 <= words.length <= 12
1 <= words[i].length <= 20
`words[i]` 由小写英文字母组成
`words` 中的所有字符串 互不相同
假设我们已经选出了若干个字符串,将它们排成一行并合并了重复部分,并且最后一个选出的字符串是 `A[i]`,那么如果我们现在选出一个新的字符串 `A[j]`,重复部分的长度会增加 `overlap(A[i], A[j])`,而与在 `A[i]` 之前选出了哪些字符串、以什么顺序选出无关。
因此我们可以使用动态规划来解决这个问题。设 `dp(mask, i)` 表示已经选出的字符串为 `mask`(`mask` 是一个长度为 `A.length` 的二进制数,它的第 `k` 位如果为 `1`,则表示第 `k` 个字符串已经选出,否则表示第 `k` 个字符串没有被选出),且最后一个选出的字符串是 `A[i]` 时的重复部分的最大长度。在状态转移时,我们枚举下一个选出的字符串 `j`(`j` 尚未出现在 `mask` 中),则有:
`dp(mask ^ (1 << j), j) = max{overlap(A[i], A[j]) + dp(mask, i)}`
当然 `dp(mask, i)` 只记录了重复部分的最大长度。为了得到对应的字符串,我们需要预先计算出所有的 `overlap(A[i], A[j])`,并记录每个状态 `dp(mask, i)` 是由哪个状态转移而来,最后从最优状态逆推出字符串的排列顺序。
class Solution {
    /**
     * Returns a shortest string that contains every string of {@code A} as a
     * substring, using a bitmask dynamic program over "set of words used so
     * far" x "last word used".
     *
     * <p>The result is optimal under the problem's assumption that no word is
     * a substring of another word. Time is O(N^2 * (2^N + W)) and space is
     * O(N * (2^N + W)) for N words of maximum length W.
     *
     * @param A the words to cover
     * @return a shortest superstring of all words; the empty string when
     *         {@code A} is empty
     */
    public String shortestSuperstring(String[] A) {
        int N = A.length;
        if (N == 0) {
            // Nothing to cover; also avoids indexing perm[0] below.
            return "";
        }

        // overlaps[i][j] = length of the longest suffix of A[i] that is also
        // a prefix of A[j] (0 when there is none, and for i == j).
        int[][] overlaps = new int[N][N];
        for (int i = 0; i < N; ++i) {
            for (int j = 0; j < N; ++j) {
                if (i == j) {
                    continue;
                }
                int m = Math.min(A[i].length(), A[j].length());
                for (int k = m; k > 0; --k) {
                    if (A[i].endsWith(A[j].substring(0, k))) {
                        overlaps[i][j] = k;
                        break;
                    }
                }
            }
        }

        // dp[mask][i] = most total overlap achievable using exactly the words
        // in mask, with word i placed last. parent[mask][i] is the word placed
        // just before i on such a best arrangement, or -1 when no predecessor
        // yields a strictly positive total overlap.
        int[][] dp = new int[1 << N][N];
        int[][] parent = new int[1 << N][N];
        for (int mask = 0; mask < (1 << N); ++mask) {
            java.util.Arrays.fill(parent[mask], -1);
            for (int bit = 0; bit < N; ++bit) {
                if (((mask >> bit) & 1) == 0) {
                    continue;
                }
                // pmask is the set of words chosen before 'bit' was appended.
                int pmask = mask ^ (1 << bit);
                if (pmask == 0) {
                    continue;
                }
                for (int i = 0; i < N; ++i) {
                    if (((pmask >> i) & 1) == 0) {
                        continue;
                    }
                    // End with word i, then append word 'bit'.
                    int val = dp[pmask][i] + overlaps[i][bit];
                    if (val > dp[mask][bit]) {
                        dp[mask][bit] = val;
                        parent[mask][bit] = i;
                    }
                }
            }
        }

        // The answer has length sum(len(A[i])) - max(dp[full]).
        // Rebuild the word order: start from the best last word and follow
        // the parent links backwards.
        int full = (1 << N) - 1;
        int[] perm = new int[N];
        boolean[] seen = new boolean[N];
        int t = 0;
        int mask = full;

        // p: the last word of the arrangement (first index wins on ties).
        int p = 0;
        for (int j = 0; j < N; ++j) {
            if (dp[full][j] > dp[full][p]) {
                p = j;
            }
        }

        while (p != -1) {
            perm[t++] = p;
            seen[p] = true;
            int p2 = parent[mask][p];
            mask ^= 1 << p;
            p = p2;
        }

        // The path was collected last-to-first; reverse it in place.
        for (int i = 0; i < t / 2; ++i) {
            int v = perm[i];
            perm[i] = perm[t - 1 - i];
            perm[t - 1 - i] = v;
        }

        // The walk stops once the remaining prefix contributes zero overlap,
        // so the words it never reached can be appended in any order.
        for (int i = 0; i < N; ++i) {
            if (!seen[i]) {
                perm[t++] = i;
            }
        }

        // Glue the words together, skipping each overlapping prefix.
        StringBuilder ans = new StringBuilder(A[perm[0]]);
        for (int i = 1; i < N; ++i) {
            int overlap = overlaps[perm[i - 1]][perm[i]];
            ans.append(A[perm[i]].substring(overlap));
        }
        return ans.toString();
    }
}
class Solution(object):
    """Shortest common superstring via bitmask dynamic programming."""

    def shortestSuperstring(self, A):
        """Return a shortest string containing every word of ``A`` as a substring.

        The search runs a dynamic program over (set of words used, last word
        used) and maximises the total overlap between consecutive words. The
        result is optimal under the problem's assumption that no word is a
        substring of another word.

        Args:
            A: list of words to cover.

        Returns:
            A shortest superstring of all words, or ``""`` when ``A`` is empty.
            When several shortest superstrings exist, any one may be returned.
        """
        N = len(A)
        if N == 0:
            # Nothing to cover; max() below would fail on an empty range.
            return ""

        # overlaps[i][j] = length of the longest suffix of A[i] that is also
        # a prefix of A[j] (0 when there is none, and for i == j).
        overlaps = [[0] * N for _ in range(N)]
        for i, x in enumerate(A):
            for j, y in enumerate(A):
                if i == j:
                    continue
                for size in range(min(len(x), len(y)), 0, -1):
                    if x.endswith(y[:size]):
                        overlaps[i][j] = size
                        break

        # dp[mask][i] = most total overlap using exactly the words in mask,
        # with word i placed last. parent[mask][i] is the word placed just
        # before i on such a best arrangement, or None when no predecessor
        # yields a strictly positive total overlap.
        full = (1 << N) - 1
        dp = [[0] * N for _ in range(1 << N)]
        parent = [[None] * N for _ in range(1 << N)]
        for mask in range(1, 1 << N):
            for bit in range(N):
                if not (mask >> bit) & 1:
                    continue
                # pmask is the set of words chosen before 'bit' was appended.
                pmask = mask ^ (1 << bit)
                if pmask == 0:
                    continue
                for i in range(N):
                    if (pmask >> i) & 1:
                        # End with word i, then append word 'bit'.
                        value = dp[pmask][i] + overlaps[i][bit]
                        if value > dp[mask][bit]:
                            dp[mask][bit] = value
                            parent[mask][bit] = i

        # The answer has length sum(len(w) for w in A) - max(dp[full]).
        # Start from the best last word (first index wins on ties) and follow
        # the parent links backwards.
        perm = []
        mask = full
        i = max(range(N), key=dp[full].__getitem__)
        while i is not None:
            perm.append(i)
            prev = parent[mask][i]
            mask ^= 1 << i
            i = prev

        # The path was collected last-to-first.
        perm.reverse()

        # The walk stops once the remaining prefix contributes zero overlap,
        # so the words it never reached can be appended in any order.
        seen = [False] * N
        for idx in perm:
            seen[idx] = True
        perm.extend(idx for idx in range(N) if not seen[idx])

        # Glue the words together, skipping each overlapping prefix.
        pieces = [A[perm[0]]]
        for before, after in zip(perm, perm[1:]):
            pieces.append(A[after][overlaps[before][after]:])
        return "".join(pieces)
时间复杂度:$O(N^2 * (2^N + W))$,其中 $N$ 是字符串的数目,$W$ 是字符串的最大长度。
空间复杂度:$O(N * (2^N + W))$。
通过次数 | 提交次数 | AC比率 |
1998 | 4366 | 45.8% |
提交时间 | 提交结果 | 执行时间 | 内存消耗 | 语言 |