2.2.1. Questions

2.2.1.1. Decode String

Given an encoded string, return its decoded string.

The encoding rule is: k[encoded_string], where the encoded_string inside the square brackets is being repeated exactly k times. Note that k is guaranteed to be a positive integer.

You may assume that the input string is always valid; No extra white spaces, square brackets are well-formed, etc. Furthermore, you may assume that the original data does not contain any digits and that digits are only for those repeat numbers, k. For example, there won’t be input like 3a or 2[4].

Examples:

input: "3[a]2[bc]", output: "aaabcbc".
input: "3[a2[c]]", output: "accaccacc".
input: "2[abc]3[cd]ef", output: "abcabccdcdcdef".

leetcode

The original problem and its subproblem have the same structure, so this problem can be easily done with a recursive function or DFS. It is very important to clearly define the input and output of the recursive function. In this case, the output is the resulting string from square bracket pair […], and the input is the original string and index. We can write code like:

struct Solution {
    /// Expands every `k[...]` group of `s`, e.g. "3[a2[c]]" -> "accaccacc".
    std::string decodeString(std::string s) {
        int pos = 0;
        return rec(s, pos);
    }

    /// Decodes `s` from index `i` up to the first unmatched ']' or the end of input.
    /// On return `i` is the index of that ']' (or is past the end); the caller steps over it.
    std::string rec(std::string& s, int& i) {
        std::string decoded;  // text produced at this nesting level
        int repeat = 0;       // pending repeat count for the next '[' group
        while (i < s.size()) {
            const char c = s[i];
            if (c == ']')
                break;  // end of the group this call is responsible for
            if (isalpha(c)) {
                decoded += c;
            } else if (isdigit(c)) {
                repeat = repeat * 10 + c - '0';
            } else if (c == '[') {
                ++i;  // move to the first character inside the brackets
                const std::string inner = rec(s, i);
                for (; repeat != 0; --repeat)
                    decoded += inner;
            }
            ++i;  // also skips the ']' the nested call stopped on
        }
        return decoded;
    }
};

The input also has a parenthesis structure (see CLRS, page 606). DFS is itself a recursive algorithm.

2.2.1.2. Shortest Length of Folding String

Given a string and folding rule, find the length of its shortest fold.

The folding rule is:

A string can be regarded as its own fold. Denoted as S ~ S
X(S) is a fold of the string formed by concatenating X (X > 1) copies of S. Denoted as X(S) ~ SS...S (X copies of S).
If A ~ A', B ~ B', then AB ~ A'B'.
   For example, because 3(A) = AAA, 2(B) = BB, so 3(A)C2(B) ~ AAACBB, and 2(3(A)C)2(B) ~ AAACAAACBB

For example, the shortest fold of AAAAAAAAAABABABCCCD is: 9(A)3(AB)CCD.

Example:

input: "NEERCYESYESYESNEERCYESYESYES", output: 14.
Explanation: A shortest fold is: 2(NEERC3(YES)) and length of string 2(NEERC3(YES)) is 14.

dp[l][r] to denote the shortest fold length of s[l:r]

There is formula:

dp[l][r] = min(r-l+1, dp[l][k] + dp[k+1][r]) where l<=k<r

However, there is an edge case in which this formula alone fails. If s is abc repeated 10 times, then abc9(abc) or 9(abc)abc would be reported as the solution, which is wrong: 10(abc) is shorter. To fix this, we also need to consider the case where s[k+1..r] can be derived by repeating s[l..k]:

dp[l][r] = min(dp[l][r], dp[l][k] + 2 + IntLen((r-l+1)/(k-l+1))), applied when s[l..r] is s[l..k] repeated (r-l+1)/(k-l+1) times

struct Solution {
  string s;
  vector<vector<int>> results;
  // Returns true when s[l..r] equals s[cl..cr] written out a whole number of
  // times (all bounds inclusive).
  bool is_multipler_string(int l, int r, int cl, int cr) {
    const int unit = cr - cl + 1;  // length of the candidate repeating unit
    const int span = r - l + 1;    // length of the range being checked
    if (span % unit != 0)
      return false;
    for (int offset = 0; offset < span; ++offset) {
      // Compare against the unit, wrapping around every `unit` characters.
      if (s[l + offset] != s[cl + offset % unit])
        return false;
    }
    return true;
  }
  // Counts the decimal digits of x by dividing by 10 until it reaches zero;
  // the result is 0 when x itself is 0.
  int int_length(int x) {
    int digits = 0;
    for (; x != 0; x /= 10)
      ++digits;
    return digits;
  }
  int dp(int l, int r) {
    if (l == r)
      return 1;
    if (results[l][r])
      return results[l][r];
    int t = r - l + 1;
    for (int i = l; i < r; i++) {
      t = min(t, dp(l, i) + dp(i + 1, r));
      if (is_multipler_string(i + 1, r, l, i))
        t = min(t, dp(l, i) + 2 + int_length((r - l + 1) / (i - l + 1)));
    }

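TC: O(N^3) — there are O(N^2) states and each tries O(N) split points (the repetition check can add up to another O(N) per split in the worst case); SC: O(N^2)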

This is a top-down DP.

http://hzwer.com/1905.html Refer to: BZOJ1090, SCOI2003

2.2.1.3. Repeated Substring Pattern

Given a string str, check if it can be constructed by taking a substring of it and appending multiple copies of the substring together.

Examples:

Input: str = "abcabcabc"
Output: true
The given string is 3 times repetition of "abc"

Input: str = "abadabad"
Output: true
The given string is 2 times repetition of "abad"

Input: str = "aabaabaabaab"
Output: true
The given string is 4 times repetition of "aab"

Input: str = "abcdabc"
Output: false

leetcode
G4G

Brute Force

namespace repeated {
class Solution {
  // Returns true when s consists of its first l characters repeated two or
  // more times. TC: O(N).
  bool f(std::string s, int l) {
    const bool divisible = s.size() % l == 0;
    if (!divisible || s.size() <= l) {
      return false;  // length is not a multiple of l, or there is only one copy
    }
    for (int j = l; j < s.size(); ++j) {
      // For j >= l, j % l is the matching position inside the first copy.
      if (s[j] != s[j % l]) {
        return false;
      }
    }
    return true;
  }

public:
  bool repeatedSubstringPattern(string s) { // TC: O(N^2), SC: O(1)
    if (s.size() <= 1)
      return false;
    for (int i = 0; i < s.size() / 2 + 1; i++) {
      if (f(s, i + 1))
        return true;
    }
    return false;

LPPP (longest proper prefix and postfix)

2.2.1.4. Longest Palindromic Prefix

You are given a string s. You can convert s to a palindrome by adding characters in front of it.

Return the shortest palindrome you can find by performing this transformation.

Input: s = "aacecaaa", Output: "aaacecaaa"
Input: s = "abcd", Output: "dcbabcd"

Brute Force (T:O(N^2), SC:O(1))

// Returns true when s[h..t] (both bounds inclusive) reads the same forwards
// and backwards; an empty or single-character range counts as a palindrome.
bool is_pal(std::string s, int h, int t) {
  for (; h < t; ++h, --t) {
    if (s[h] != s[t])
      return false;
  }
  return true;
}
// Finds the longest prefix of s that is a palindrome, then returns s with the
// reverse of the remaining suffix put in front of it.
std::string longest_palindromic_prefix_v1(std::string s) {
  if (s.empty())
    return s;
  // Scan from the longest prefix downwards; s[0..0] always qualifies, so the
  // search stops at index 0 at the latest.
  int last = static_cast<int>(s.size()) - 1;
  while (last > 0 && !is_pal(s, 0, last))
    --last;
  // Reverse of s[last+1..], built straight from the reverse iterators.
  const std::string mirrored_tail(s.rbegin(), s.rend() - (last + 1));
  return mirrored_tail + s;
}

string longest_palindromic_prefix_v2(string s) {

Rolling Hash (T:O(N), SC:O(1))

// Returns the shortest palindrome obtainable by adding characters in front of
// s: the reverse of whatever follows the longest palindromic prefix, then s.
//
// Two polynomial hashes are maintained for every prefix s[0..i]: one of the
// prefix itself and one of the prefix reversed. They are equal whenever the
// prefix is a palindrome. The hashes use unsigned 64-bit arithmetic, so the
// overflow wraps (well defined) instead of being signed-overflow undefined
// behaviour. A hash match alone can be a collision, so the chosen prefix is
// confirmed character by character before it is used.
std::string longest_palindromic_prefix_v2(std::string s) {
  if (s.size() <= 1)
    return s;
  using u64 = unsigned long long;
  const u64 BASE = 37;
  u64 forward_hash = 0;   // hash of s[0..i]
  u64 reversed_hash = 0;  // hash of s[0..i] reversed
  u64 power = 1;          // BASE^i, modulo 2^64
  std::size_t last = 0;   // last index of the longest prefix whose hashes agree
  for (std::size_t i = 0; i < s.size(); ++i) {
    const u64 c = static_cast<unsigned char>(s[i]);
    forward_hash = forward_hash * BASE + c;
    reversed_hash += c * power;
    if (forward_hash == reversed_hash)
      last = i;
    power *= BASE;
  }
  const auto is_palindromic_prefix = [&s](std::size_t end) {
    for (std::size_t lo = 0, hi = end; lo < hi; ++lo, --hi)
      if (s[lo] != s[hi])
        return false;
    return true;
  };
  // Every real palindromic prefix has matching hashes, so none lies beyond
  // `last`. If `last` was a collision, step down to the nearest real one;
  // s[0..0] always qualifies, so the loop terminates.
  while (!is_palindromic_prefix(last))
    --last;
  std::string tail = s.substr(last + 1);
  std::reverse(tail.begin(), tail.end());
  return tail + s;
}

💡

2.2.1.5. Guess Word

给一个target单词，一个guess单词，如果位置完全匹配是G，字母匹配但是位置不匹配是Y，否则是R。如果有多个可以匹配为Y的，则把index最小的匹配成Y，其他的还是R，然后输出结果的string。比如BACD和CAGE，就输出YGRR。

follow up是如果给一个target和a sequence of guess words，每一步要求前一步的guess是G的地方需要retain，前一步如果是Y的corresponding letter must be included in这个单词。输出这sequence of guess words是不是全部valid.

比如说我的target是ABCDE, 我有一个guess word的序列，The first guess word是AGHBD，那么第一步得到的结果就是GRRYY，下一步的话valid的guess就可以是比如ACBDG（G的位置必须index和值都还是原来的，所以第一个位置必须是A，Y的地方必须至少包含，所以必须包含BD），像AGHYU或者BDAHG就不行。给一个guess word的list，判断是不是每次猜测都是基于前一步的guess的valid guess。

Example:
target: ABCDE, guess words: {"AGHBD","ACBDG","AFBDC","ABCDE"}, output: true
target: ABCDE, guess words: {"AGHBD","AGHYU"}, output: false
target: ABCDE, guess words: {"AGHBD","BDAHG"}, output: false

#include <gtest/gtest.h>
#include <sein.hpp>

namespace ns_string_guess {

// Scores `guess` against `secret` and returns one letter per position:
//   'G' - the guess has the same letter as the secret at this position;
//   'Y' - the letter occurs somewhere in the secret and this is the
//         lowest-index non-'G' position of the guess holding that letter;
//   'R' - anything else.
// Throws std::invalid_argument when the two strings differ in length.
std::string guess_result(std::string secret, std::string guess) {
  if (secret.size() != guess.size()) throw std::invalid_argument("length mismatches");
  // One flag per possible byte value. Indexing through unsigned char keeps the
  // index in range for every char, and a plain flag (rather than a first-index
  // value tested with `> 0`) means a letter at secret[0] is not mistaken for
  // an absent one.
  std::vector<char> yellow_available(256, 0);
  for (char c : secret)
    yellow_available[static_cast<unsigned char>(c)] = 1;
  std::string res(secret.size(), 'G');
  for (std::size_t i = 0; i < secret.size(); i++) {
    if (secret[i] == guess[i])
      continue;  // exact hit keeps the initial 'G'
    char &available = yellow_available[static_cast<unsigned char>(guess[i])];
    if (available) {
      res[i] = 'Y';
      available = 0;  // later occurrences of this letter in the guess become 'R'
    } else {
      res[i] = 'R';
    }
  }
  return res;
}

// Checks that every guess respects what the earlier guesses revealed:
//   * a position that matched the secret exactly in an earlier guess must
//     still match;
//   * every secret letter that appeared in an earlier guess must appear
//     somewhere in the current guess.
// Also returns false when any guess differs in length from the secret.
// TC: O(MN)
bool valid_guess_sequence(std::string secret, std::vector<std::string> guess_words) {
  // Membership flag per byte value. Indexing through unsigned char keeps the
  // index in range, and a flag (rather than a first-index value tested with
  // `> 0`) means the letter at secret[0] counts as present.
  std::vector<char> in_secret(256, 0);
  for (char c : secret)
    in_secret[static_cast<unsigned char>(c)] = 1;

  std::unordered_set<int> match_indices;  // positions already guessed exactly
  std::unordered_set<char> contains;      // secret letters seen in guesses so far
  const int n = static_cast<int>(secret.size());
  for (const std::string &g : guess_words) {
    if (secret.size() != g.size()) return false;
    // Snapshot taken before this guess is scanned: the letters it has to show.
    // Letters first seen in this guess only bind the guesses after it.
    auto missing = contains;
    for (int i = 0; i < n; i++) {
      const bool exact = secret[i] == g[i];
      if (!exact && match_indices.count(i)) return false;  // lost an earlier exact hit
      if (exact) match_indices.insert(i);
      missing.erase(g[i]);
      if (in_secret[static_cast<unsigned char>(g[i])])
        contains.insert(g[i]);
    }
    if (!missing.empty()) return false;  // a previously revealed letter was dropped
  }
  return true;
}

}
using namespace ns_string_guess;
// Checks guess_result on a guess with a repeated letter, and
// valid_guess_sequence on one accepted and two rejected guess sequences.
TEST(_string_guess, a) {
  const std::string secret = "ABCDE";
  const std::vector<std::string> accepted = {"AGHBD", "ACBDG", "AFBDC", "ABCDE"};
  const std::vector<std::string> rejected_afbde = {"AGHBD", "ACBDG", "AFBDE"};
  const std::vector<std::string> rejected_abbde = {"AGHBD", "ACBDG", "ABBDE"};

  EXPECT_EQ(guess_result("BACDF", "CAGEC"), "YGRRR");
  EXPECT_TRUE(valid_guess_sequence(secret, accepted));
  EXPECT_FALSE(valid_guess_sequence(secret, rejected_afbde));
  EXPECT_FALSE(valid_guess_sequence(secret, rejected_abbde));
}