LintCode 107: Word Break (DFS, DP经典题!)

2023-12-08 03:35:16

Word Break
Given a string s and a dictionary of words dict, determine if s can be break into a space-separated sequence of one or more dictionary words.

Example
Given s = “lintcode”, dict = [“lint”, “code”].

Return true because “lintcode” can be break as “lint code”.

解法1：DFS。超时 (95%的时候)

class Solution {
public:/** @param s: A string* @param dict: A dictionary of words dict* @return: A boolean*/bool wordBreak(string &s, unordered_set &dict) {int lenS = s.size();int lenD = dict.size();maxWordLen = 0;minWordLen = lenS;for (auto w : dict) {maxWordLen = max(maxWordLen, (int)w.size());minWordLen = min(minWordLen, (int)w.size());}vector sol;vector> result;helper(s, dict, sol, result);if (result.size() > 0) return true;return false;}private:void helper(string &s, unordered_set &dict, vector &sol, vector> &result) {int len = s.size();if (len == 0) {result.push_back(sol);return;}if (len < minWordLen) return;for (int i = minWordLen; i <= maxWordLen; ++i) {string w = s.substr(0, i);if (dict.find(w) == dict.end()) continue;sol.push_back(w);string newStr = s.substr(i, len - i);helper(newStr, dict, sol, result);sol.pop_back();}}int minWordLen;int maxWordLen;
};

解法2：还是DFS，s不动index动。Pass。

class Solution {
public:/** @param s: A string* @param dict: A dictionary of words dict* @return: A boolean*/bool wordBreak(string &s, unordered_set &dict) {int lenS = s.size();int lenD = dict.size();maxWordLen = 0;minWordLen = lenS;for (auto w : dict) {maxWordLen = max(maxWordLen, (int)w.size());minWordLen = min(minWordLen, (int)w.size());}vector sol;vector> result;helper(s, 0, dict, sol, result);if (result.size() > 0) return true;return false;}private:void helper(string &s, int index, unordered_set &dict, vector &sol, vector> &result) {int len = s.size();if (index == len) {result.push_back(sol);return;}if (index + minWordLen > len)    //剪枝return;for (int i = minWordLen; i <= maxWordLen; ++i) {string w = s.substr(index, i);if (dict.find(w) == dict.end()) continue;sol.push_back(w);helper(s, index + i, dict, sol, result);sol.pop_back();}}int minWordLen;int maxWordLen;
};

解法3：DFS+Memorization
即把s分成str1和str2，如果str1在dict中则可调用子问题，输入为str2。
Memozation可以减枝。
代码如下：

class Solution {
public:/** @param s: A string* @param dict: A dictionary of words dict* @return: A boolean*/bool wordBreak(string &s, unordered_set<string> &dict) {if (s.size() == 0 && dict.size() == 0) return true;unordered_map<string, bool> memo;return helper(s, dict, memo);}private:bool helper(string &s, unordered_set<string> &dict, unordered_map<string, bool> & memo) {if (s.size() == 0) return false;if (memo.find(s) != memo.end()) return memo[s];int len = s.size();for (int i = 1; i <= len; ++i) {string subStr1 = s.substr(0, i);if (dict.find(subStr1) != dict.end()) {if (subStr1 == s) {memo[s] = true;return true;}string subStr2 = s.substr(i);bool result = helper(subStr2, dict, memo);if (result) {memo[s] = true;    return true;}}}memo[s] = false;return false;}};

二刷：还是DFS+memorization。上面那个过不了96%。这个能过。

class Solution {
public:/** @param s: A string* @param dict: A dictionary of words dict* @return: A boolean*/bool wordBreak(string &s, unordered_set<string> &dict) {map<int, int> memo; //0: uninitialized, 1: true, -1: falseminLen = dict.size() == 0 ? 0 : INT_MAX;maxLen = dict.size() == 0 ? 0 : INT_MIN;memo[0] = 1;for (auto w : dict) {maxLen = max(maxLen, (int)w.size());minLen = min(minLen, (int)w.size());}return dfs(s, dict, s.size(), memo); //也可以先dfs(s, dict, s.size(), memo)，然后return memo[s.size()];}
private:    bool dfs(string &s, unordered_set<string> &dict, int pos, map<int, int> &memo) {if (pos == 0){return true;}        int upperlimit = min(maxLen, pos);//  |------------------------pos-----------|//                      <-----//                      len    for (int len = minLen; len <= upperlimit; len++){string str = s.substr(pos - len, len);if (dict.find(str) == dict.end() || memo[pos - len] == -1){continue;}if (memo[pos - len] == 1 || dfs(s, dict, pos - len, memo)) {memo[pos] = 1;return true;}}memo[pos] = 0;return false;}int maxLen, minLen;
};

用map也可以。但是要注意map[pos] == false有两种情况，一种是map[pos]确实是false，另一种是map[pos]还未赋值，但默认为false。当然，如果用unordered_map会更快。

class Solution {
public:/** @param s: A string* @param dict: A dictionary of words dict* @return: A boolean*/bool wordBreak(string &s, unordered_set<string> &dict) {//map memo; //0: uninitialized, 1: true, -1: falsemap<int, bool> memo; //minLen = dict.size() == 0 ? 0 : INT_MAX;maxLen = dict.size() == 0 ? 0 : INT_MIN;memo[0] = true;for (auto w : dict) {maxLen = max(maxLen, (int)w.size());minLen = min(minLen, (int)w.size());}dfs(s, dict, s.size(), memo);return memo[s.size()];}
private:    bool dfs(string &s, unordered_set<string> &dict, int pos, map<int, bool> &memo) {if (pos == 0){return true;}        int upperlimit = min(maxLen, pos);for (int len = minLen; len <= upperlimit; len++){string str = s.substr(pos - len, len);if (dict.find(str) == dict.end() || (memo.find(pos - len) != memo.end() && !memo[pos - len])){continue;}if (memo[pos - len] || dfs(s, dict, pos - len, memo)) {memo[pos] = 1;return true;}}memo[pos] = false;return false;}int maxLen, minLen;
};

上面的思路是pos从尾扫到头，最后看memo[s.size()]。也可以让pos从头扫到尾，最后看memo[0]。两者都是属于dfs里面的分治法。

class Solution {
public:/** @param s: A string* @param dict: A dictionary of words dict* @return: A boolean*/bool wordBreak(string &s, unordered_set<string> &dict) {unordered_map<int, bool> memo; //minLen = dict.size() == 0 ? 0 : INT_MAX;maxLen = dict.size() == 0 ? 0 : INT_MIN;memo[s.size()] = true;for (auto w : dict) {maxLen = max(maxLen, (int)w.size());minLen = min(minLen, (int)w.size());}dfs(s, dict, 0, memo);return memo[0];}
private:    bool dfs(string &s, unordered_set<string> &dict, int pos, unordered_map<int, bool> &memo) {if (pos == s.size()){return true;}        int upperlimit = maxLen;//  |---------pos--------------------|//              ---------->//                len  for (int len = minLen; len <= upperlimit; len++){string str = s.substr(pos, len);if (dict.find(str) == dict.end() || (memo.find(pos + len) != memo.end() && !memo[pos + len])){continue;}if (memo[pos + len] || dfs(s, dict, pos + len, memo)) {memo[pos] = 1;return true;}}memo[pos] = false;return false;}int maxLen, minLen;
};

解法4：DP。j是表示i的某个长度的前缀。

class Solution {
public:bool wordBreak(string s, unordered_set<string>& wordSet) {int n = s.size();vector<bool> dp(n + 1, false);dp[0] = true;for (int i = 0; i <= n; ++i) {for (int j = 0; j < i; ++j) {if (dp[j] && wordSet.find(s.substr(j, i - j)) != wordSet.end()) {dp[i] = true;break;}}}return dp.back();}
};

解法5: 还是DP。但是j是表示可能匹配的字符串的长度，所以加以minSize和maxSize的上限。显然，这个方法更好，因为字符串的长度不会很长，所以j循环次数少而且效率很高，因为一旦匹配上，就可以退出循环。
i从头扫到尾,dp[0]一开始等于true，最后看dp[len].

class Solution {
public:bool wordBreak(string s, unordered_set<string>& wordSet) {int n = s.size();vector<bool> dp(n + 1, false);int minSize = INT_MAX, maxSize = INT_MIN;for (auto w : wordSet) {minSize = min(minSize, (int)w.size());maxSize = max(maxSize, (int)w.size());}dp[0] = true;//  ------------i-->---------//       <--j---| //for (int i = 1; i <= n; ++i) {for (int j = minSize; j <= maxSize; j++) {if (i >= j && dp[i - j] && wordSet.find(s.substr(i - j, j)) != wordSet.end()) {dp[i] = true;break;}}//for (int j = 0; j < i; ++j) {//    if (dp[j] && wordSet.find(s.substr(j, i - j)) != wordSet.end()) {//        dp[i] = true;//        break;//    }//}}return dp[n];}
};

还是DP，不过是pos从尾扫到头，一开始dp[len] = true，最后看dp[0]。

class Solution {
public:/** @param s: A string* @param dict: A dictionary of words dict* @return: A boolean*/bool wordBreak(string &s, unordered_set<string> &dict) {vector<bool> dp(s.size() + 1, false);int len = s.size();dp[len] = true;int minSize = INT_MAX, maxSize = 0;for (auto w : dict) {minSize = min(minSize, (int)w.size());maxSize = max(maxSize, (int)w.size());}//  ------<--pos-----------------------//            |----i-----> for (int pos = len - 1; pos >= 0; pos--) {for (int i = minSize; i <= maxSize && pos + i <= len; i++) {string str = s.substr(pos, i);if (dict.find(str) == dict.end()) continue;if (dp[pos + i]) {dp[pos] = true;break;}}}return dp[0];}
};

本文来自互联网用户投稿，文章观点仅代表作者本人，不代表本站立场，不承担相关法律责任。如若转载，请注明出处。 如若内容造成侵权/违法违规/事实不符，请点击【内容举报】进行投诉反馈！

标签：技术

上一篇 > LintCode-829. Word Pattern II (DFS难题）
下一篇 > 浅谈操作系统-启动过程

Duilib中list控件支持ctrl和shif多行选中的实现

[ICML2015]Batch Normalization:Accelerating Deep Network Training by Reducing Internal Covariate Shif

win10系统微软输入法于eclipse ctrl+shif+f冲突间接处理办法

Codeforces Round #259 (Div. 2) B. Little Pony and Sort by Shif

读LDD3，内存映射与DMA--PAGE_SHIF…

VMware虚拟机安装XP【要先分区，再设置BOOT 启动CD，shif+上移】

更换iBus五笔的左与右Shif

sublime ctrl+shif+f 没用解决办法

idea 对 ctrl + z 的撤销是 ctrl + shif + z

计算机最早的设计师应用于,计算机应用基础选择题doc.doc

win10自带截图神器：Win+Shift+S

Python基础之文件目录操作

python简述目录_Python基础之文件目录操作(示例代码)

tp5 如何做数据采集

任务2-7(服务器字体+阿里巴巴矢量库)

html标签（1)：h1~h6,p,br,pre,hr

TI 电量计介绍与芯片选型指南

几款TI电源芯片简介

TI DSP芯片C2000系列读取FLASH数据

德州仪器(Ti)平台嵌入式开发基础

TI三相电机智能栅极驱动芯片特点分类

省选模拟（12.08） T3 圈圈圈圈圈圈圈圈

Hadoop生态圈技术栈（上）

大数据开发基础入门与项目实战（三）Hadoop核心及生态圈技术栈之6.Impala交互式查询

小猿圈之Linux下Mysql 操作命令

大数据Hadoop生态圈常用面试题

大数据开发基础入门与项目实战（三）Hadoop核心及生态圈技术栈之4.Hive DDL、DQL和数据操作

备战Noip2018模拟赛11（B组）T3 Monogatari 物语

【智能优化算法-圆圈搜索算法】基于圆圈搜索算法Circle Search Algorithm求解单目标优化问题附matlab代码

NYOJ 78 圈水池

递归问题跑道汽车绕圈问题 Python实现

Hadoop生态圈（三）：MapReduce

LintCode 107: Word Break (DFS, DP经典题!)

相关文章