comments | difficulty | edit_url |
---|---|---|
true |
Medium |
Oh, no! You have accidentally removed all spaces, punctuation, and capitalization in a lengthy document. A sentence like "I reset the computer. It still didn't boot!" became "iresetthecomputeritstilldidntboot''. You'll deal with the punctuation and capitalization later; right now you need to re-insert the spaces. Most of the words are in a dictionary but a few are not. Given a dictionary (a list of strings) and the document (a string), design an algorithm to unconcatenate the document in a way that minimizes the number of unrecognized characters. Return the number of unrecognized characters.
Note: This problem is slightly different from the original one in the book.
Example:
Input: dictionary = ["looked","just","like","her","brother"] sentence = "jesslookedjustliketimherbrother" Output: 7 Explanation: After unconcatenating, we got "jess looked just like tim her brother", which containing 7 unrecognized characters.
Note:
0 <= len(sentence) <= 1000
The total number of characters in dictionary
is less than or equal to 150000.- There are only lowercase letters in
dictionary
andsentence
.
class Solution:
def respace(self, dictionary: List[str], sentence: str) -> int:
s = set(dictionary)
n = len(sentence)
dp = [0] * (n + 1)
for i in range(1, n + 1):
dp[i] = dp[i - 1] + 1
for j in range(i):
if sentence[j:i] in s:
dp[i] = min(dp[i], dp[j])
return dp[-1]
class Solution {
public int respace(String[] dictionary, String sentence) {
Set<String> dict = new HashSet<>(Arrays.asList(dictionary));
int n = sentence.length();
int[] dp = new int[n + 1];
for (int i = 1; i <= n; i++) {
dp[i] = dp[i - 1] + 1;
for (int j = 0; j < i; ++j) {
if (dict.contains(sentence.substring(j, i))) {
dp[i] = Math.min(dp[i], dp[j]);
}
}
}
return dp[n];
}
}
class Solution {
public:
int respace(vector<string>& dictionary, string sentence) {
unordered_set<string> s(dictionary.begin(), dictionary.end());
int n = sentence.size();
vector<int> dp(n + 1);
for (int i = 1; i <= n; ++i) {
dp[i] = dp[i - 1] + 1;
for (int j = 0; j < i; ++j) {
if (s.count(sentence.substr(j, i - j))) {
dp[i] = min(dp[i], dp[j]);
}
}
}
return dp[n];
}
};
func respace(dictionary []string, sentence string) int {
s := map[string]bool{}
for _, v := range dictionary {
s[v] = true
}
n := len(sentence)
dp := make([]int, n+1)
for i := 1; i <= n; i++ {
dp[i] = dp[i-1] + 1
for j := 0; j < i; j++ {
if s[sentence[j:i]] {
dp[i] = min(dp[i], dp[j])
}
}
}
return dp[n]
}
class TrieNode {
var children: [TrieNode?] = Array(repeating: nil, count: 26)
var isEndOfWord = false
}
class Trie {
private let root = TrieNode()
func insert(_ word: String) {
var node = root
for char in word {
let index = Int(char.asciiValue! - Character("a").asciiValue!)
if node.children[index] == nil {
node.children[index] = TrieNode()
}
node = node.children[index]!
}
node.isEndOfWord = true
}
func search(_ sentence: Array<Character>, start: Int, end: Int) -> Bool {
var node = root
for i in start...end {
let index = Int(sentence[i].asciiValue! - Character("a").asciiValue!)
guard let nextNode = node.children[index] else {
return false
}
node = nextNode
}
return node.isEndOfWord
}
}
class Solution {
func respace(_ dictionary: [String], _ sentence: String) -> Int {
let n = sentence.count
guard n > 0 else { return 0 }
let trie = Trie()
dictionary.forEach { trie.insert($0) }
let chars = Array(sentence)
var dp = Array(repeating: Int.max, count: n + 1)
dp[0] = 0
for i in 1...n {
dp[i] = dp[i - 1] + 1
for j in 0..<i {
if trie.search(chars, start: j, end: i - 1) {
dp[i] = min(dp[i], dp[j])
}
}
}
return dp[n]
}
}