From 52f6d7883d37f3c72b76550846074d45db2b238f Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sun, 27 Sep 2020 19:31:05 -0500
Subject: [PATCH 01/30] API: Deprecate regex=True default in Series.str.replace

---
 pandas/core/strings.py | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/pandas/core/strings.py b/pandas/core/strings.py
index 4467c96041dc7..4fabad8278839 100644
--- a/pandas/core/strings.py
+++ b/pandas/core/strings.py
@@ -2837,7 +2837,18 @@ def fullmatch(self, pat, case=True, flags=0, na=np.nan):
 
     @copy(str_replace)
     @forbid_nonstring_types(["bytes"])
-    def replace(self, pat, repl, n=-1, case=None, flags=0, regex=True):
+    def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
+        if regex is None:
+            msg = (
+                "The default value of regex will change from "
+                "True to False in a future version."
+            )
+            warnings.warn(
+                msg,
+                FutureWarning,
+                stacklevel=2,
+            )
+            regex = True
         result = str_replace(
             self._parent, pat, repl, n=n, case=case, flags=flags, regex=regex
         )

From 3b9bcb284dd99beb63699298dc76bc30e039330f Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sun, 27 Sep 2020 19:48:44 -0500
Subject: [PATCH 02/30] Format

---
 pandas/core/strings.py | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/pandas/core/strings.py b/pandas/core/strings.py
index 4fabad8278839..5b1e0107d97f2 100644
--- a/pandas/core/strings.py
+++ b/pandas/core/strings.py
@@ -2843,11 +2843,7 @@ def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
                 "The default value of regex will change from "
                 "True to False in a future version."
             )
-            warnings.warn(
-                msg,
-                FutureWarning,
-                stacklevel=2,
-            )
+            warnings.warn(msg, FutureWarning, stacklevel=2)
             regex = True
         result = str_replace(
             self._parent, pat, repl, n=n, case=case, flags=flags, regex=regex

From c51e83722309cce33e8ec70af0aff1984d9abeb8 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sun, 27 Sep 2020 19:52:09 -0500
Subject: [PATCH 03/30] Stacklevel

---
 pandas/core/strings.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/core/strings.py b/pandas/core/strings.py
index 5b1e0107d97f2..d8912cefdf1e8 100644
--- a/pandas/core/strings.py
+++ b/pandas/core/strings.py
@@ -2843,7 +2843,7 @@ def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
                 "The default value of regex will change from "
                 "True to False in a future version."
             )
-            warnings.warn(msg, FutureWarning, stacklevel=2)
+            warnings.warn(msg, FutureWarning, stacklevel=3)
             regex = True
         result = str_replace(
             self._parent, pat, repl, n=n, case=case, flags=flags, regex=regex

From 376162511c8dc501cd1ae8d249f2e938791b5e5c Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sun, 27 Sep 2020 19:56:56 -0500
Subject: [PATCH 04/30] Test

---
 pandas/tests/series/methods/test_replace.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/pandas/tests/series/methods/test_replace.py b/pandas/tests/series/methods/test_replace.py
index e255d46e81851..ce2d2b72c9c26 100644
--- a/pandas/tests/series/methods/test_replace.py
+++ b/pandas/tests/series/methods/test_replace.py
@@ -449,3 +449,8 @@ def test_replace_with_compiled_regex(self):
         result = s.replace({regex: "z"}, regex=True)
         expected = pd.Series(["z", "b", "c"])
         tm.assert_series_equal(result, expected)
+
+    def test_str_replace_regex_default(self):
+        s = pd.Series(["a", "b", "c"])
+        with tm.assert_produces_warning(FutureWarning, check_stacklevel=False):
+            s.str.replace(".", "")

From 7583b7fa357a764d7be4f4ad6b005a94cd922d20 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sun, 27 Sep 2020 20:00:07 -0500
Subject: [PATCH 05/30] Test name

---
 pandas/tests/series/methods/test_replace.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/tests/series/methods/test_replace.py b/pandas/tests/series/methods/test_replace.py
index ce2d2b72c9c26..72dd05b1568a4 100644
--- a/pandas/tests/series/methods/test_replace.py
+++ b/pandas/tests/series/methods/test_replace.py
@@ -450,7 +450,7 @@ def test_replace_with_compiled_regex(self):
         expected = pd.Series(["z", "b", "c"])
         tm.assert_series_equal(result, expected)
 
-    def test_str_replace_regex_default(self):
+    def test_str_replace_regex_default_raises_warning(self):
         s = pd.Series(["a", "b", "c"])
         with tm.assert_produces_warning(FutureWarning, check_stacklevel=False):
             s.str.replace(".", "")

From 8e0d1a5fa7d22ec8fcb21ec32c0f615604cebe5e Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sun, 27 Sep 2020 20:01:01 -0500
Subject: [PATCH 06/30] Link discussion

---
 pandas/tests/series/methods/test_replace.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/pandas/tests/series/methods/test_replace.py b/pandas/tests/series/methods/test_replace.py
index 72dd05b1568a4..2aeb6ab3153c1 100644
--- a/pandas/tests/series/methods/test_replace.py
+++ b/pandas/tests/series/methods/test_replace.py
@@ -451,6 +451,7 @@ def test_replace_with_compiled_regex(self):
         tm.assert_series_equal(result, expected)
 
     def test_str_replace_regex_default_raises_warning(self):
+        # https://github.com/pandas-dev/pandas/pull/24809
         s = pd.Series(["a", "b", "c"])
         with tm.assert_produces_warning(FutureWarning, check_stacklevel=False):
             s.str.replace(".", "")

From 79e44009e69bc1861c0894f1edb8500cc431837e Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sun, 27 Sep 2020 20:27:59 -0500
Subject: [PATCH 07/30] Set regex

---
 pandas/core/reshape/melt.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/core/reshape/melt.py b/pandas/core/reshape/melt.py
index 83a5f43c2a340..952cb419c1a0d 100644
--- a/pandas/core/reshape/melt.py
+++ b/pandas/core/reshape/melt.py
@@ -483,7 +483,7 @@ def melt_stub(df, stub: str, i, j, value_vars, sep: str):
             var_name=j,
         )
         newdf[j] = Categorical(newdf[j])
-        newdf[j] = newdf[j].str.replace(re.escape(stub + sep), "")
+        newdf[j] = newdf[j].str.replace(re.escape(stub + sep), "", regex=True)
 
         # GH17627 Cast numerics suffixes to int/float
         newdf[j] = to_numeric(newdf[j], errors="ignore")

From ecc578685865b46b21fa75563deee7660321ae6c Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 16:22:45 -0500
Subject: [PATCH 08/30] Update

---
 doc/source/user_guide/text.rst              | 18 ++++++++++--------
 pandas/core/strings.py                      | 12 +++++++-----
 pandas/tests/series/methods/test_replace.py |  2 +-
 3 files changed, 18 insertions(+), 14 deletions(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index dd6ac37d88f08..0828fcef24139 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -264,23 +264,25 @@ i.e., from the end of the string to the beginning of the string:
    s3
    s3.str.replace('^.a|dog', 'XX-XX ', case=False)
 
-Some caution must be taken to keep regular expressions in mind! For example, the
-following code will cause trouble because of the regular expression meaning of
-``$``:
+Some caution must be taken when dealing with regular expressions! The current behavior
+is to treat single character patterns as literal strings, even when ``regex`` is set
+to ``True``. (This behavior is deprecated and will be removed in a future version so
+that the ``regex`` keyword is always respected.) For example, the following code will
+cause trouble because of the regular expression meaning of ``$``:
 
 .. ipython:: python
 
    # Consider the following badly formatted financial data
    dollars = pd.Series(['12', '-$10', '$10,000'], dtype="string")
 
-   # This does what you'd naively expect:
-   dollars.str.replace('$', '')
+   # Here ``$`` is treated as a literal character:
+   dollars.str.replace('$', '', regex=True)
 
-   # But this doesn't:
-   dollars.str.replace('-$', '-')
+   # But here it is not:
+   dollars.str.replace('-$', '-', regex=True)
 
    # We need to escape the special character (for >1 len patterns)
-   dollars.str.replace(r'-\$', '-')
+   dollars.str.replace(r'-\$', '-', regex=True)
 
 If you do want literal replacement of a string (equivalent to
 :meth:`str.replace`), you can set the optional ``regex`` parameter to
diff --git a/pandas/core/strings.py b/pandas/core/strings.py
index d8912cefdf1e8..f0379a3858a6e 100644
--- a/pandas/core/strings.py
+++ b/pandas/core/strings.py
@@ -2839,11 +2839,13 @@ def fullmatch(self, pat, case=True, flags=0, na=np.nan):
     @forbid_nonstring_types(["bytes"])
     def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
         if regex is None:
-            msg = (
-                "The default value of regex will change from "
-                "True to False in a future version."
-            )
-            warnings.warn(msg, FutureWarning, stacklevel=3)
+            if len(pat) > 1 and any(c in pat for c in ".+*|^$&[](){}\\"):
+                # warn only in cases where regex behavior would differ from literal
+                msg = (
+                    "The default value of regex will change from "
+                    "True to False in a future version."
+                )
+                warnings.warn(msg, FutureWarning, stacklevel=3)
             regex = True
         result = str_replace(
             self._parent, pat, repl, n=n, case=case, flags=flags, regex=regex
diff --git a/pandas/tests/series/methods/test_replace.py b/pandas/tests/series/methods/test_replace.py
index 2aeb6ab3153c1..7bc7993b38a22 100644
--- a/pandas/tests/series/methods/test_replace.py
+++ b/pandas/tests/series/methods/test_replace.py
@@ -454,4 +454,4 @@ def test_str_replace_regex_default_raises_warning(self):
         # https://github.com/pandas-dev/pandas/pull/24809
         s = pd.Series(["a", "b", "c"])
         with tm.assert_produces_warning(FutureWarning, check_stacklevel=False):
-            s.str.replace(".", "")
+            s.str.replace("^.$", "")

From 628cfa3f9ea8d5dcb059fd0163690fb9bb7c9b20 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 16:35:18 -0500
Subject: [PATCH 09/30] Update

---
 doc/source/user_guide/text.rst | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 0828fcef24139..17802b7ca6584 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -275,15 +275,18 @@ cause trouble because of the regular expression meaning of ``$``:
    # Consider the following badly formatted financial data
    dollars = pd.Series(['12', '-$10', '$10,000'], dtype="string")
 
-   # Here ``$`` is treated as a literal character:
+   # Here ``$`` is treated as a literal character
    dollars.str.replace('$', '', regex=True)
 
-   # But here it is not:
+   # But here it is not
    dollars.str.replace('-$', '-', regex=True)
 
    # We need to escape the special character (for >1 len patterns)
    dollars.str.replace(r'-\$', '-', regex=True)
 
+   # Or set ``regex`` equal to ``False``
+   dollars.str.replace('-$', '-', regex=False)
+
 If you do want literal replacement of a string (equivalent to
 :meth:`str.replace`), you can set the optional ``regex`` parameter to
 ``False``, rather than escaping each character. In this case both ``pat``

From f2160228fada4e4d081e78ffeedd915ed8e4d5af Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 16:51:22 -0500
Subject: [PATCH 10/30] Fix

---
 pandas/core/strings.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/core/strings.py b/pandas/core/strings.py
index f0379a3858a6e..67ffc2d2138ed 100644
--- a/pandas/core/strings.py
+++ b/pandas/core/strings.py
@@ -2839,7 +2839,7 @@ def fullmatch(self, pat, case=True, flags=0, na=np.nan):
     @forbid_nonstring_types(["bytes"])
     def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
         if regex is None:
-            if len(pat) > 1 and any(c in pat for c in ".+*|^$&[](){}\\"):
+            if len(pat) > 1 and any(c in pat for c in ".+*|^$[](){}\\"):
                 # warn only in cases where regex behavior would differ from literal
                 msg = (
                     "The default value of regex will change from "

From e6b3e0fcd9fa37c215d9129bca95860cd3416112 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 18:05:40 -0500
Subject: [PATCH 11/30] Check for str

---
 pandas/core/strings.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/pandas/core/strings.py b/pandas/core/strings.py
index 67ffc2d2138ed..0483fca7c79e1 100644
--- a/pandas/core/strings.py
+++ b/pandas/core/strings.py
@@ -2839,7 +2839,11 @@ def fullmatch(self, pat, case=True, flags=0, na=np.nan):
     @forbid_nonstring_types(["bytes"])
     def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
         if regex is None:
-            if len(pat) > 1 and any(c in pat for c in ".+*|^$[](){}\\"):
+            if (
+                isinstance(pat, str)
+                and len(pat) > 1
+                and any(c in pat for c in ".+*|^$[](){}\\")
+            ):
                 # warn only in cases where regex behavior would differ from literal
                 msg = (
                     "The default value of regex will change from "

From ee67284d25496b63dd3d5b774f5521e5cf533ddd Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 19:42:29 -0500
Subject: [PATCH 12/30] Doc updates

---
 doc/source/user_guide/text.rst | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 17802b7ca6584..b3ba6d614161e 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -262,7 +262,7 @@ i.e., from the end of the string to the beginning of the string:
                    '', np.nan, 'CABA', 'dog', 'cat'],
                   dtype="string")
    s3
-   s3.str.replace('^.a|dog', 'XX-XX ', case=False)
+   s3.str.replace('^.a|dog', 'XX-XX ', case=False, regex=True)
 
 Some caution must be taken when dealing with regular expressions! The current behavior
 is to treat single character patterns as literal strings, even when ``regex`` is set
@@ -295,7 +295,7 @@ and ``repl`` must be strings:
 .. ipython:: python
 
     # These lines are equivalent
-    dollars.str.replace(r'-\$', '-')
+    dollars.str.replace(r'-\$', '-', regex=True)
     dollars.str.replace('-$', '-', regex=False)
 
 The ``replace`` method can also take a callable as replacement. It is called
@@ -311,7 +311,7 @@ positional argument (a regex object) and return a string.
        return m.group(0)[::-1]
 
    pd.Series(['foo 123', 'bar baz', np.nan],
-             dtype="string").str.replace(pat, repl)
+             dtype="string").str.replace(pat, repl, regex=True)
 
    # Using regex groups
    pat = r"(?P<one>\w+) (?P<two>\w+) (?P<three>\w+)"
@@ -320,7 +320,7 @@ positional argument (a regex object) and return a string.
        return m.group('two').swapcase()
 
    pd.Series(['Foo Bar Baz', np.nan],
-             dtype="string").str.replace(pat, repl)
+             dtype="string").str.replace(pat, repl, regex=True)
 
 The ``replace`` method also accepts a compiled regular expression object
 from :func:`re.compile` as a pattern. All flags should be included in the
@@ -330,7 +330,7 @@ compiled regular expression object.
 
    import re
    regex_pat = re.compile(r'^.a|dog', flags=re.IGNORECASE)
-   s3.str.replace(regex_pat, 'XX-XX ')
+   s3.str.replace(regex_pat, 'XX-XX ', regex=True)
 
 Including a ``flags`` argument when calling ``replace`` with a compiled
 regular expression object will raise a ``ValueError``.

From c832a2148d4da4e7cf4ade5f2eae5e5cc6a84665 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 20:34:40 -0500
Subject: [PATCH 13/30] Nit

---
 doc/source/user_guide/text.rst | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index b3ba6d614161e..7bce895cecac3 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -275,7 +275,7 @@ cause trouble because of the regular expression meaning of ``$``:
    # Consider the following badly formatted financial data
    dollars = pd.Series(['12', '-$10', '$10,000'], dtype="string")
 
-   # Here ``$`` is treated as a literal character
+   # Here $ is treated as a literal character
    dollars.str.replace('$', '', regex=True)
 
    # But here it is not
@@ -284,7 +284,7 @@ cause trouble because of the regular expression meaning of ``$``:
    # We need to escape the special character (for >1 len patterns)
    dollars.str.replace(r'-\$', '-', regex=True)
 
-   # Or set ``regex`` equal to ``False``
+   # Or set regex equal to False
    dollars.str.replace('-$', '-', regex=False)
 
 If you do want literal replacement of a string (equivalent to

From 09b07e68a9a74b68380677ecc71746f24bf2cb4e Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 20:42:34 -0500
Subject: [PATCH 14/30] Silence some warnings

---
 pandas/tests/test_strings.py | 24 +++++++++++++-----------
 1 file changed, 13 insertions(+), 11 deletions(-)

diff --git a/pandas/tests/test_strings.py b/pandas/tests/test_strings.py
index c792a48d3ef08..8df62adfec71b 100644
--- a/pandas/tests/test_strings.py
+++ b/pandas/tests/test_strings.py
@@ -995,11 +995,11 @@ def test_casemethods(self):
     def test_replace(self):
         values = Series(["fooBAD__barBAD", np.nan])
 
-        result = values.str.replace("BAD[_]*", "")
+        result = values.str.replace("BAD[_]*", "", regex=True)
         exp = Series(["foobar", np.nan])
         tm.assert_series_equal(result, exp)
 
-        result = values.str.replace("BAD[_]*", "", n=1)
+        result = values.str.replace("BAD[_]*", "", regex=True, n=1)
         exp = Series(["foobarBAD", np.nan])
         tm.assert_series_equal(result, exp)
 
@@ -1008,7 +1008,7 @@ def test_replace(self):
             ["aBAD", np.nan, "bBAD", True, datetime.today(), "fooBAD", None, 1, 2.0]
         )
 
-        rs = Series(mixed).str.replace("BAD[_]*", "")
+        rs = Series(mixed).str.replace("BAD[_]*", "", regex=True)
         xp = Series(["a", np.nan, "b", np.nan, np.nan, "foo", np.nan, np.nan, np.nan])
         assert isinstance(rs, Series)
         tm.assert_almost_equal(rs, xp)
@@ -1016,7 +1016,9 @@ def test_replace(self):
         # flags + unicode
         values = Series([b"abcd,\xc3\xa0".decode("utf-8")])
         exp = Series([b"abcd, \xc3\xa0".decode("utf-8")])
-        result = values.str.replace(r"(?<=\w),(?=\w)", ", ", flags=re.UNICODE)
+        result = values.str.replace(
+            r"(?<=\w),(?=\w)", ", ", regex=True, flags=re.UNICODE
+        )
         tm.assert_series_equal(result, exp)
 
         # GH 13438
@@ -1034,7 +1036,7 @@ def test_replace_callable(self):
 
         # test with callable
         repl = lambda m: m.group(0).swapcase()
-        result = values.str.replace("[a-z][A-Z]{2}", repl, n=2)
+        result = values.str.replace("[a-z][A-Z]{2}", repl, n=2, regex=True)
         exp = Series(["foObaD__baRbaD", np.nan])
         tm.assert_series_equal(result, exp)
 
@@ -1060,7 +1062,7 @@ def test_replace_callable(self):
         values = Series(["Foo Bar Baz", np.nan])
         pat = r"(?P<first>\w+) (?P<middle>\w+) (?P<last>\w+)"
         repl = lambda m: m.group("middle").swapcase()
-        result = values.str.replace(pat, repl)
+        result = values.str.replace(pat, repl, regex=True)
         exp = Series(["bAR", np.nan])
         tm.assert_series_equal(result, exp)
 
@@ -1070,11 +1072,11 @@ def test_replace_compiled_regex(self):
 
         # test with compiled regex
         pat = re.compile(r"BAD[_]*")
-        result = values.str.replace(pat, "")
+        result = values.str.replace(pat, "", regex=True)
         exp = Series(["foobar", np.nan])
         tm.assert_series_equal(result, exp)
 
-        result = values.str.replace(pat, "", n=1)
+        result = values.str.replace(pat, "", n=1, regex=True)
         exp = Series(["foobarBAD", np.nan])
         tm.assert_series_equal(result, exp)
 
@@ -1083,7 +1085,7 @@ def test_replace_compiled_regex(self):
             ["aBAD", np.nan, "bBAD", True, datetime.today(), "fooBAD", None, 1, 2.0]
         )
 
-        rs = Series(mixed).str.replace(pat, "")
+        rs = Series(mixed).str.replace(pat, "", regex=True)
         xp = Series(["a", np.nan, "b", np.nan, np.nan, "foo", np.nan, np.nan, np.nan])
         assert isinstance(rs, Series)
         tm.assert_almost_equal(rs, xp)
@@ -1121,7 +1123,7 @@ def test_replace_literal(self):
         # GH16808 literal replace (regex=False vs regex=True)
         values = Series(["f.o", "foo", np.nan])
         exp = Series(["bao", "bao", np.nan])
-        result = values.str.replace("f.", "ba")
+        result = values.str.replace("f.", "ba", regex=True)
         tm.assert_series_equal(result, exp)
 
         exp = Series(["bao", "foo", np.nan])
@@ -3331,7 +3333,7 @@ def test_replace_moar(self):
         )
         tm.assert_series_equal(result, expected)
 
-        result = s.str.replace("^.a|dog", "XX-XX ", case=False)
+        result = s.str.replace("^.a|dog", "XX-XX ", case=False, regex=True)
         expected = Series(
             [
                 "A",

From c8541da60584fd457c332f367037db8ca2c2a5dd Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 20:51:58 -0500
Subject: [PATCH 15/30] Edit

---
 pandas/tests/test_strings.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/tests/test_strings.py b/pandas/tests/test_strings.py
index 8df62adfec71b..d21c7f176386b 100644
--- a/pandas/tests/test_strings.py
+++ b/pandas/tests/test_strings.py
@@ -999,7 +999,7 @@ def test_replace(self):
         exp = Series(["foobar", np.nan])
         tm.assert_series_equal(result, exp)
 
-        result = values.str.replace("BAD[_]*", "", regex=True, n=1)
+        result = values.str.replace("BAD[_]*", "", n=1, regex=True)
         exp = Series(["foobarBAD", np.nan])
         tm.assert_series_equal(result, exp)
 

From bd31857c0c2764f38583e8fb26f68c52e30d5c8e Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Mon, 28 Sep 2020 20:53:20 -0500
Subject: [PATCH 16/30] Edit

---
 pandas/tests/test_strings.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/tests/test_strings.py b/pandas/tests/test_strings.py
index d21c7f176386b..5d4f017ac66a2 100644
--- a/pandas/tests/test_strings.py
+++ b/pandas/tests/test_strings.py
@@ -1017,7 +1017,7 @@ def test_replace(self):
         values = Series([b"abcd,\xc3\xa0".decode("utf-8")])
         exp = Series([b"abcd, \xc3\xa0".decode("utf-8")])
         result = values.str.replace(
-            r"(?<=\w),(?=\w)", ", ", regex=True, flags=re.UNICODE
+            r"(?<=\w),(?=\w)", ", ", flags=re.UNICODE, regex=True
         )
         tm.assert_series_equal(result, exp)
 

From 377a2bae43c8fbf4f2dd3ddcb8335d8d8837032f Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Tue, 29 Sep 2020 07:21:31 -0500
Subject: [PATCH 17/30] Question mark

---
 pandas/core/strings.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/core/strings.py b/pandas/core/strings.py
index 0483fca7c79e1..79cba6d29b429 100644
--- a/pandas/core/strings.py
+++ b/pandas/core/strings.py
@@ -2842,7 +2842,7 @@ def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
             if (
                 isinstance(pat, str)
                 and len(pat) > 1
-                and any(c in pat for c in ".+*|^$[](){}\\")
+                and any(c in pat for c in ".+*|^$?[](){}\\")
             ):
                 # warn only in cases where regex behavior would differ from literal
                 msg = (

From d6b4fbeafbb53616f8dddd59a41f7f189159edf9 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Tue, 29 Sep 2020 07:24:19 -0500
Subject: [PATCH 18/30] Update doc

---
 doc/source/user_guide/text.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 7bce895cecac3..e46990688b404 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -253,7 +253,7 @@ i.e., from the end of the string to the beginning of the string:
 
    s2.str.rsplit('_', expand=True, n=1)
 
-``replace`` by default replaces `regular expressions
+``replace`` optionally uses `regular expressions
 <https://docs.python.org/3/library/re.html>`__:
 
 .. ipython:: python

From 1b530510689f6ad876d764688c62cb757ef47096 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Wed, 30 Sep 2020 18:08:32 -0500
Subject: [PATCH 19/30] Add back

---
 pandas/core/strings/accessor.py | 15 ++++++++++++++-
 1 file changed, 14 insertions(+), 1 deletion(-)

diff --git a/pandas/core/strings/accessor.py b/pandas/core/strings/accessor.py
index cae8cc1baf1df..edcaf9416fc7d 100644
--- a/pandas/core/strings/accessor.py
+++ b/pandas/core/strings/accessor.py
@@ -1170,7 +1170,7 @@ def fullmatch(self, pat, case=True, flags=0, na=None):
         return self._wrap_result(result, fill_value=na, returns_string=False)
 
     @forbid_nonstring_types(["bytes"])
-    def replace(self, pat, repl, n=-1, case=None, flags=0, regex=True):
+    def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
         r"""
         Replace each occurrence of pattern/regex in the Series/Index.
 
@@ -1288,6 +1288,19 @@ def replace(self, pat, repl, n=-1, case=None, flags=0, regex=True):
         2    NaN
         dtype: object
         """
+        if regex is None:
+            if (
+                isinstance(pat, str)
+                and len(pat) > 1
+                and any(c in pat for c in ".+*|^$?[](){}\\")
+            ):
+                # warn only in cases where regex behavior would differ from literal
+                msg = (
+                    "The default value of regex will change from "
+                    "True to False in a future version."
+                )
+                warnings.warn(msg, FutureWarning, stacklevel=3)
+            regex = True
         result = self._array._str_replace(
             pat, repl, n=n, case=case, flags=flags, regex=regex
         )

From 1931c314f279b0c5c3f22d6d39a0830fd38aaeec Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Wed, 30 Sep 2020 18:13:35 -0500
Subject: [PATCH 20/30] Oops

---
 pandas/core/strings.py | 3663 ----------------------------------------
 1 file changed, 3663 deletions(-)
 delete mode 100644 pandas/core/strings.py

diff --git a/pandas/core/strings.py b/pandas/core/strings.py
deleted file mode 100644
index 79cba6d29b429..0000000000000
--- a/pandas/core/strings.py
+++ /dev/null
@@ -1,3663 +0,0 @@
-import codecs
-from functools import wraps
-import re
-import textwrap
-from typing import TYPE_CHECKING, Any, Callable, Dict, List, Pattern, Type, Union
-import warnings
-
-import numpy as np
-
-import pandas._libs.lib as lib
-import pandas._libs.missing as libmissing
-import pandas._libs.ops as libops
-from pandas._typing import ArrayLike, Dtype, Scalar
-from pandas.util._decorators import Appender
-
-from pandas.core.dtypes.common import (
-    ensure_object,
-    is_bool_dtype,
-    is_categorical_dtype,
-    is_extension_array_dtype,
-    is_integer,
-    is_integer_dtype,
-    is_list_like,
-    is_object_dtype,
-    is_re,
-    is_scalar,
-    is_string_dtype,
-)
-from pandas.core.dtypes.generic import (
-    ABCDataFrame,
-    ABCIndexClass,
-    ABCMultiIndex,
-    ABCSeries,
-)
-from pandas.core.dtypes.missing import isna
-
-from pandas.core.algorithms import take_1d
-from pandas.core.base import NoNewAttributesMixin
-from pandas.core.construction import extract_array
-
-if TYPE_CHECKING:
-    from pandas.arrays import StringArray
-
-_cpython_optimized_encoders = (
-    "utf-8",
-    "utf8",
-    "latin-1",
-    "latin1",
-    "iso-8859-1",
-    "mbcs",
-    "ascii",
-)
-_cpython_optimized_decoders = _cpython_optimized_encoders + ("utf-16", "utf-32")
-
-_shared_docs: Dict[str, str] = dict()
-
-
-def cat_core(list_of_columns: List, sep: str):
-    """
-    Auxiliary function for :meth:`str.cat`
-
-    Parameters
-    ----------
-    list_of_columns : list of numpy arrays
-        List of arrays to be concatenated with sep;
-        these arrays may not contain NaNs!
-    sep : string
-        The separator string for concatenating the columns.
-
-    Returns
-    -------
-    nd.array
-        The concatenation of list_of_columns with sep.
-    """
-    if sep == "":
-        # no need to interleave sep if it is empty
-        arr_of_cols = np.asarray(list_of_columns, dtype=object)
-        return np.sum(arr_of_cols, axis=0)
-    list_with_sep = [sep] * (2 * len(list_of_columns) - 1)
-    list_with_sep[::2] = list_of_columns
-    arr_with_sep = np.asarray(list_with_sep, dtype=object)
-    return np.sum(arr_with_sep, axis=0)
-
-
-def cat_safe(list_of_columns: List, sep: str):
-    """
-    Auxiliary function for :meth:`str.cat`.
-
-    Same signature as cat_core, but handles TypeErrors in concatenation, which
-    happen if the arrays in list_of columns have the wrong dtypes or content.
-
-    Parameters
-    ----------
-    list_of_columns : list of numpy arrays
-        List of arrays to be concatenated with sep;
-        these arrays may not contain NaNs!
-    sep : string
-        The separator string for concatenating the columns.
-
-    Returns
-    -------
-    nd.array
-        The concatenation of list_of_columns with sep.
-    """
-    try:
-        result = cat_core(list_of_columns, sep)
-    except TypeError:
-        # if there are any non-string values (wrong dtype or hidden behind
-        # object dtype), np.sum will fail; catch and return with better message
-        for column in list_of_columns:
-            dtype = lib.infer_dtype(column, skipna=True)
-            if dtype not in ["string", "empty"]:
-                raise TypeError(
-                    "Concatenation requires list-likes containing only "
-                    "strings (or missing values). Offending values found in "
-                    f"column {dtype}"
-                ) from None
-    return result
-
-
-def _na_map(f, arr, na_result=None, dtype=np.dtype(object)):
-    if is_extension_array_dtype(arr.dtype):
-        if na_result is None:
-            na_result = libmissing.NA
-        # just StringDtype
-        arr = extract_array(arr)
-        return _map_stringarray(f, arr, na_value=na_result, dtype=dtype)
-    if na_result is None:
-        na_result = np.nan
-    return _map_object(f, arr, na_mask=True, na_value=na_result, dtype=dtype)
-
-
-def _map_stringarray(
-    func: Callable[[str], Any], arr: "StringArray", na_value: Any, dtype: Dtype
-) -> ArrayLike:
-    """
-    Map a callable over valid elements of a StringArray.
-
-    Parameters
-    ----------
-    func : Callable[[str], Any]
-        Apply to each valid element.
-    arr : StringArray
-    na_value : Any
-        The value to use for missing values. By default, this is
-        the original value (NA).
-    dtype : Dtype
-        The result dtype to use. Specifying this avoids an intermediate
-        object-dtype allocation.
-
-    Returns
-    -------
-    ArrayLike
-        An ExtensionArray for integer or string dtypes, otherwise
-        an ndarray.
-
-    """
-    from pandas.arrays import BooleanArray, IntegerArray, StringArray
-
-    mask = isna(arr)
-
-    assert isinstance(arr, StringArray)
-    arr = np.asarray(arr)
-
-    if is_integer_dtype(dtype) or is_bool_dtype(dtype):
-        constructor: Union[Type[IntegerArray], Type[BooleanArray]]
-        if is_integer_dtype(dtype):
-            constructor = IntegerArray
-        else:
-            constructor = BooleanArray
-
-        na_value_is_na = isna(na_value)
-        if na_value_is_na:
-            na_value = 1
-        result = lib.map_infer_mask(
-            arr,
-            func,
-            mask.view("uint8"),
-            convert=False,
-            na_value=na_value,
-            dtype=np.dtype(dtype),
-        )
-
-        if not na_value_is_na:
-            mask[:] = False
-
-        return constructor(result, mask)
-
-    elif is_string_dtype(dtype) and not is_object_dtype(dtype):
-        # i.e. StringDtype
-        result = lib.map_infer_mask(
-            arr, func, mask.view("uint8"), convert=False, na_value=na_value
-        )
-        return StringArray(result)
-    else:
-        # This is when the result type is object. We reach this when
-        # -> We know the result type is truly object (e.g. .encode returns bytes
-        #    or .findall returns a list).
-        # -> We don't know the result type. E.g. `.get` can return anything.
-        return lib.map_infer_mask(arr, func, mask.view("uint8"))
-
-
-def _map_object(f, arr, na_mask=False, na_value=np.nan, dtype=np.dtype(object)):
-    if not len(arr):
-        return np.ndarray(0, dtype=dtype)
-
-    if isinstance(arr, ABCSeries):
-        arr = arr._values  # TODO: extract_array?
-    if not isinstance(arr, np.ndarray):
-        arr = np.asarray(arr, dtype=object)
-    if na_mask:
-        mask = isna(arr)
-        convert = not np.all(mask)
-        try:
-            result = lib.map_infer_mask(arr, f, mask.view(np.uint8), convert)
-        except (TypeError, AttributeError) as e:
-            # Reraise the exception if callable `f` got wrong number of args.
-            # The user may want to be warned by this, instead of getting NaN
-            p_err = (
-                r"((takes)|(missing)) (?(2)from \d+ to )?\d+ "
-                r"(?(3)required )positional arguments?"
-            )
-
-            if len(e.args) >= 1 and re.search(p_err, e.args[0]):
-                # FIXME: this should be totally avoidable
-                raise e
-
-            def g(x):
-                try:
-                    return f(x)
-                except (TypeError, AttributeError):
-                    return na_value
-
-            return _map_object(g, arr, dtype=dtype)
-        if na_value is not np.nan:
-            np.putmask(result, mask, na_value)
-            if result.dtype == object:
-                result = lib.maybe_convert_objects(result)
-        return result
-    else:
-        return lib.map_infer(arr, f)
-
-
-def str_count(arr, pat, flags=0):
-    """
-    Count occurrences of pattern in each string of the Series/Index.
-
-    This function is used to count the number of times a particular regex
-    pattern is repeated in each of the string elements of the
-    :class:`~pandas.Series`.
-
-    Parameters
-    ----------
-    pat : str
-        Valid regular expression.
-    flags : int, default 0, meaning no flags
-        Flags for the `re` module. For a complete list, `see here
-        <https://docs.python.org/3/howto/regex.html#compilation-flags>`_.
-    **kwargs
-        For compatibility with other string methods. Not used.
-
-    Returns
-    -------
-    Series or Index
-        Same type as the calling object containing the integer counts.
-
-    See Also
-    --------
-    re : Standard library module for regular expressions.
-    str.count : Standard library version, without regular expression support.
-
-    Notes
-    -----
-    Some characters need to be escaped when passing in `pat`.
-    eg. ``'$'`` has a special meaning in regex and must be escaped when
-    finding this literal character.
-
-    Examples
-    --------
-    >>> s = pd.Series(['A', 'B', 'Aaba', 'Baca', np.nan, 'CABA', 'cat'])
-    >>> s.str.count('a')
-    0    0.0
-    1    0.0
-    2    2.0
-    3    2.0
-    4    NaN
-    5    0.0
-    6    1.0
-    dtype: float64
-
-    Escape ``'$'`` to find the literal dollar sign.
-
-    >>> s = pd.Series(['$', 'B', 'Aab$', '$$ca', 'C$B$', 'cat'])
-    >>> s.str.count('\\$')
-    0    1
-    1    0
-    2    1
-    3    2
-    4    2
-    5    0
-    dtype: int64
-
-    This is also available on Index
-
-    >>> pd.Index(['A', 'A', 'Aaba', 'cat']).str.count('a')
-    Int64Index([0, 0, 2, 1], dtype='int64')
-    """
-    regex = re.compile(pat, flags=flags)
-    f = lambda x: len(regex.findall(x))
-    return _na_map(f, arr, dtype="int64")
-
-
-def str_contains(arr, pat, case=True, flags=0, na=np.nan, regex=True):
-    """
-    Test if pattern or regex is contained within a string of a Series or Index.
-
-    Return boolean Series or Index based on whether a given pattern or regex is
-    contained within a string of a Series or Index.
-
-    Parameters
-    ----------
-    pat : str
-        Character sequence or regular expression.
-    case : bool, default True
-        If True, case sensitive.
-    flags : int, default 0 (no flags)
-        Flags to pass through to the re module, e.g. re.IGNORECASE.
-    na : default NaN
-        Fill value for missing values.
-    regex : bool, default True
-        If True, assumes the pat is a regular expression.
-
-        If False, treats the pat as a literal string.
-
-    Returns
-    -------
-    Series or Index of boolean values
-        A Series or Index of boolean values indicating whether the
-        given pattern is contained within the string of each element
-        of the Series or Index.
-
-    See Also
-    --------
-    match : Analogous, but stricter, relying on re.match instead of re.search.
-    Series.str.startswith : Test if the start of each string element matches a
-        pattern.
-    Series.str.endswith : Same as startswith, but tests the end of string.
-
-    Examples
-    --------
-    Returning a Series of booleans using only a literal pattern.
-
-    >>> s1 = pd.Series(['Mouse', 'dog', 'house and parrot', '23', np.NaN])
-    >>> s1.str.contains('og', regex=False)
-    0    False
-    1     True
-    2    False
-    3    False
-    4      NaN
-    dtype: object
-
-    Returning an Index of booleans using only a literal pattern.
-
-    >>> ind = pd.Index(['Mouse', 'dog', 'house and parrot', '23.0', np.NaN])
-    >>> ind.str.contains('23', regex=False)
-    Index([False, False, False, True, nan], dtype='object')
-
-    Specifying case sensitivity using `case`.
-
-    >>> s1.str.contains('oG', case=True, regex=True)
-    0    False
-    1    False
-    2    False
-    3    False
-    4      NaN
-    dtype: object
-
-    Specifying `na` to be `False` instead of `NaN` replaces NaN values
-    with `False`. If Series or Index does not contain NaN values
-    the resultant dtype will be `bool`, otherwise, an `object` dtype.
-
-    >>> s1.str.contains('og', na=False, regex=True)
-    0    False
-    1     True
-    2    False
-    3    False
-    4    False
-    dtype: bool
-
-    Returning 'house' or 'dog' when either expression occurs in a string.
-
-    >>> s1.str.contains('house|dog', regex=True)
-    0    False
-    1     True
-    2     True
-    3    False
-    4      NaN
-    dtype: object
-
-    Ignoring case sensitivity using `flags` with regex.
-
-    >>> import re
-    >>> s1.str.contains('PARROT', flags=re.IGNORECASE, regex=True)
-    0    False
-    1    False
-    2     True
-    3    False
-    4      NaN
-    dtype: object
-
-    Returning any digit using regular expression.
-
-    >>> s1.str.contains('\\d', regex=True)
-    0    False
-    1    False
-    2    False
-    3     True
-    4      NaN
-    dtype: object
-
-    Ensure `pat` is a not a literal pattern when `regex` is set to True.
-    Note in the following example one might expect only `s2[1]` and `s2[3]` to
-    return `True`. However, '.0' as a regex matches any character
-    followed by a 0.
-
-    >>> s2 = pd.Series(['40', '40.0', '41', '41.0', '35'])
-    >>> s2.str.contains('.0', regex=True)
-    0     True
-    1     True
-    2    False
-    3     True
-    4    False
-    dtype: bool
-    """
-    if regex:
-        if not case:
-            flags |= re.IGNORECASE
-
-        regex = re.compile(pat, flags=flags)
-
-        if regex.groups > 0:
-            warnings.warn(
-                "This pattern has match groups. To actually get the "
-                "groups, use str.extract.",
-                UserWarning,
-                stacklevel=3,
-            )
-
-        f = lambda x: regex.search(x) is not None
-    else:
-        if case:
-            f = lambda x: pat in x
-        else:
-            upper_pat = pat.upper()
-            f = lambda x: upper_pat in x
-            uppered = _na_map(lambda x: x.upper(), arr)
-            return _na_map(f, uppered, na, dtype=np.dtype(bool))
-    return _na_map(f, arr, na, dtype=np.dtype(bool))
-
-
-def str_startswith(arr, pat, na=np.nan):
-    """
-    Test if the start of each string element matches a pattern.
-
-    Equivalent to :meth:`str.startswith`.
-
-    Parameters
-    ----------
-    pat : str
-        Character sequence. Regular expressions are not accepted.
-    na : object, default NaN
-        Object shown if element tested is not a string.
-
-    Returns
-    -------
-    Series or Index of bool
-        A Series of booleans indicating whether the given pattern matches
-        the start of each string element.
-
-    See Also
-    --------
-    str.startswith : Python standard library string method.
-    Series.str.endswith : Same as startswith, but tests the end of string.
-    Series.str.contains : Tests if string element contains a pattern.
-
-    Examples
-    --------
-    >>> s = pd.Series(['bat', 'Bear', 'cat', np.nan])
-    >>> s
-    0     bat
-    1    Bear
-    2     cat
-    3     NaN
-    dtype: object
-
-    >>> s.str.startswith('b')
-    0     True
-    1    False
-    2    False
-    3      NaN
-    dtype: object
-
-    Specifying `na` to be `False` instead of `NaN`.
-
-    >>> s.str.startswith('b', na=False)
-    0     True
-    1    False
-    2    False
-    3    False
-    dtype: bool
-    """
-    f = lambda x: x.startswith(pat)
-    return _na_map(f, arr, na, dtype=np.dtype(bool))
-
-
-def str_endswith(arr, pat, na=np.nan):
-    """
-    Test if the end of each string element matches a pattern.
-
-    Equivalent to :meth:`str.endswith`.
-
-    Parameters
-    ----------
-    pat : str
-        Character sequence. Regular expressions are not accepted.
-    na : object, default NaN
-        Object shown if element tested is not a string.
-
-    Returns
-    -------
-    Series or Index of bool
-        A Series of booleans indicating whether the given pattern matches
-        the end of each string element.
-
-    See Also
-    --------
-    str.endswith : Python standard library string method.
-    Series.str.startswith : Same as endswith, but tests the start of string.
-    Series.str.contains : Tests if string element contains a pattern.
-
-    Examples
-    --------
-    >>> s = pd.Series(['bat', 'bear', 'caT', np.nan])
-    >>> s
-    0     bat
-    1    bear
-    2     caT
-    3     NaN
-    dtype: object
-
-    >>> s.str.endswith('t')
-    0     True
-    1    False
-    2    False
-    3      NaN
-    dtype: object
-
-    Specifying `na` to be `False` instead of `NaN`.
-
-    >>> s.str.endswith('t', na=False)
-    0     True
-    1    False
-    2    False
-    3    False
-    dtype: bool
-    """
-    f = lambda x: x.endswith(pat)
-    return _na_map(f, arr, na, dtype=np.dtype(bool))
-
-
-def str_replace(arr, pat, repl, n=-1, case=None, flags=0, regex=True):
-    r"""
-    Replace each occurrence of pattern/regex in the Series/Index.
-
-    Equivalent to :meth:`str.replace` or :func:`re.sub`, depending on the regex value.
-
-    Parameters
-    ----------
-    pat : str or compiled regex
-        String can be a character sequence or regular expression.
-    repl : str or callable
-        Replacement string or a callable. The callable is passed the regex
-        match object and must return a replacement string to be used.
-        See :func:`re.sub`.
-    n : int, default -1 (all)
-        Number of replacements to make from start.
-    case : bool, default None
-        Determines if replace is case sensitive:
-
-        - If True, case sensitive (the default if `pat` is a string)
-        - Set to False for case insensitive
-        - Cannot be set if `pat` is a compiled regex.
-
-    flags : int, default 0 (no flags)
-        Regex module flags, e.g. re.IGNORECASE. Cannot be set if `pat` is a compiled
-        regex.
-    regex : bool, default True
-        Determines if assumes the passed-in pattern is a regular expression:
-
-        - If True, assumes the passed-in pattern is a regular expression.
-        - If False, treats the pattern as a literal string
-        - Cannot be set to False if `pat` is a compiled regex or `repl` is
-          a callable.
-
-    Returns
-    -------
-    Series or Index of object
-        A copy of the object with all matching occurrences of `pat` replaced by
-        `repl`.
-
-    Raises
-    ------
-    ValueError
-        * if `regex` is False and `repl` is a callable or `pat` is a compiled
-          regex
-        * if `pat` is a compiled regex and `case` or `flags` is set
-
-    Notes
-    -----
-    When `pat` is a compiled regex, all flags should be included in the
-    compiled regex. Use of `case`, `flags`, or `regex=False` with a compiled
-    regex will raise an error.
-
-    Examples
-    --------
-    When `pat` is a string and `regex` is True (the default), the given `pat`
-    is compiled as a regex. When `repl` is a string, it replaces matching
-    regex patterns as with :meth:`re.sub`. NaN value(s) in the Series are
-    left as is:
-
-    >>> pd.Series(['foo', 'fuz', np.nan]).str.replace('f.', 'ba', regex=True)
-    0    bao
-    1    baz
-    2    NaN
-    dtype: object
-
-    When `pat` is a string and `regex` is False, every `pat` is replaced with
-    `repl` as with :meth:`str.replace`:
-
-    >>> pd.Series(['f.o', 'fuz', np.nan]).str.replace('f.', 'ba', regex=False)
-    0    bao
-    1    fuz
-    2    NaN
-    dtype: object
-
-    When `repl` is a callable, it is called on every `pat` using
-    :func:`re.sub`. The callable should expect one positional argument
-    (a regex object) and return a string.
-
-    To get the idea:
-
-    >>> pd.Series(['foo', 'fuz', np.nan]).str.replace('f', repr)
-    0    <re.Match object; span=(0, 1), match='f'>oo
-    1    <re.Match object; span=(0, 1), match='f'>uz
-    2                                            NaN
-    dtype: object
-
-    Reverse every lowercase alphabetic word:
-
-    >>> repl = lambda m: m.group(0)[::-1]
-    >>> pd.Series(['foo 123', 'bar baz', np.nan]).str.replace(r'[a-z]+', repl)
-    0    oof 123
-    1    rab zab
-    2        NaN
-    dtype: object
-
-    Using regex groups (extract second group and swap case):
-
-    >>> pat = r"(?P<one>\w+) (?P<two>\w+) (?P<three>\w+)"
-    >>> repl = lambda m: m.group('two').swapcase()
-    >>> pd.Series(['One Two Three', 'Foo Bar Baz']).str.replace(pat, repl)
-    0    tWO
-    1    bAR
-    dtype: object
-
-    Using a compiled regex with flags
-
-    >>> import re
-    >>> regex_pat = re.compile(r'FUZ', flags=re.IGNORECASE)
-    >>> pd.Series(['foo', 'fuz', np.nan]).str.replace(regex_pat, 'bar')
-    0    foo
-    1    bar
-    2    NaN
-    dtype: object
-    """
-    # Check whether repl is valid (GH 13438, GH 15055)
-    if not (isinstance(repl, str) or callable(repl)):
-        raise TypeError("repl must be a string or callable")
-
-    is_compiled_re = is_re(pat)
-    if regex:
-        if is_compiled_re:
-            if (case is not None) or (flags != 0):
-                raise ValueError(
-                    "case and flags cannot be set when pat is a compiled regex"
-                )
-        else:
-            # not a compiled regex
-            # set default case
-            if case is None:
-                case = True
-
-            # add case flag, if provided
-            if case is False:
-                flags |= re.IGNORECASE
-        if is_compiled_re or len(pat) > 1 or flags or callable(repl):
-            n = n if n >= 0 else 0
-            compiled = re.compile(pat, flags=flags)
-            f = lambda x: compiled.sub(repl=repl, string=x, count=n)
-        else:
-            f = lambda x: x.replace(pat, repl, n)
-    else:
-        if is_compiled_re:
-            raise ValueError(
-                "Cannot use a compiled regex as replacement pattern with regex=False"
-            )
-        if callable(repl):
-            raise ValueError("Cannot use a callable replacement when regex=False")
-        f = lambda x: x.replace(pat, repl, n)
-
-    return _na_map(f, arr, dtype=str)
-
-
-def str_repeat(arr, repeats):
-    """
-    Duplicate each string in the Series or Index.
-
-    Parameters
-    ----------
-    repeats : int or sequence of int
-        Same value for all (int) or different value per (sequence).
-
-    Returns
-    -------
-    Series or Index of object
-        Series or Index of repeated string objects specified by
-        input parameter repeats.
-
-    Examples
-    --------
-    >>> s = pd.Series(['a', 'b', 'c'])
-    >>> s
-    0    a
-    1    b
-    2    c
-    dtype: object
-
-    Single int repeats string in Series
-
-    >>> s.str.repeat(repeats=2)
-    0    aa
-    1    bb
-    2    cc
-    dtype: object
-
-    Sequence of int repeats corresponding string in Series
-
-    >>> s.str.repeat(repeats=[1, 2, 3])
-    0      a
-    1     bb
-    2    ccc
-    dtype: object
-    """
-    if is_scalar(repeats):
-
-        def scalar_rep(x):
-            try:
-                return bytes.__mul__(x, repeats)
-            except TypeError:
-                return str.__mul__(x, repeats)
-
-        return _na_map(scalar_rep, arr, dtype=str)
-    else:
-
-        def rep(x, r):
-            if x is libmissing.NA:
-                return x
-            try:
-                return bytes.__mul__(x, r)
-            except TypeError:
-                return str.__mul__(x, r)
-
-        repeats = np.asarray(repeats, dtype=object)
-        result = libops.vec_binop(np.asarray(arr), repeats, rep)
-        return result
-
-
-def str_match(
-    arr: ArrayLike,
-    pat: Union[str, Pattern],
-    case: bool = True,
-    flags: int = 0,
-    na: Scalar = np.nan,
-):
-    """
-    Determine if each string starts with a match of a regular expression.
-
-    Parameters
-    ----------
-    pat : str
-        Character sequence or regular expression.
-    case : bool, default True
-        If True, case sensitive.
-    flags : int, default 0 (no flags)
-        Regex module flags, e.g. re.IGNORECASE.
-    na : default NaN
-        Fill value for missing values.
-
-    Returns
-    -------
-    Series/array of boolean values
-
-    See Also
-    --------
-    fullmatch : Stricter matching that requires the entire string to match.
-    contains : Analogous, but less strict, relying on re.search instead of
-        re.match.
-    extract : Extract matched groups.
-    """
-    if not case:
-        flags |= re.IGNORECASE
-
-    regex = re.compile(pat, flags=flags)
-
-    f = lambda x: regex.match(x) is not None
-
-    return _na_map(f, arr, na, dtype=np.dtype(bool))
-
-
-def str_fullmatch(
-    arr: ArrayLike,
-    pat: Union[str, Pattern],
-    case: bool = True,
-    flags: int = 0,
-    na: Scalar = np.nan,
-):
-    """
-    Determine if each string entirely matches a regular expression.
-
-    .. versionadded:: 1.1.0
-
-    Parameters
-    ----------
-    pat : str
-        Character sequence or regular expression.
-    case : bool, default True
-        If True, case sensitive.
-    flags : int, default 0 (no flags)
-        Regex module flags, e.g. re.IGNORECASE.
-    na : default NaN
-        Fill value for missing values.
-
-    Returns
-    -------
-    Series/array of boolean values
-
-    See Also
-    --------
-    match : Similar, but also returns `True` when only a *prefix* of the string
-        matches the regular expression.
-    extract : Extract matched groups.
-    """
-    if not case:
-        flags |= re.IGNORECASE
-
-    regex = re.compile(pat, flags=flags)
-
-    f = lambda x: regex.fullmatch(x) is not None
-
-    return _na_map(f, arr, na, dtype=np.dtype(bool))
-
-
-def _get_single_group_name(rx):
-    try:
-        return list(rx.groupindex.keys()).pop()
-    except IndexError:
-        return None
-
-
-def _groups_or_na_fun(regex):
-    """Used in both extract_noexpand and extract_frame"""
-    if regex.groups == 0:
-        raise ValueError("pattern contains no capture groups")
-    empty_row = [np.nan] * regex.groups
-
-    def f(x):
-        if not isinstance(x, str):
-            return empty_row
-        m = regex.search(x)
-        if m:
-            return [np.nan if item is None else item for item in m.groups()]
-        else:
-            return empty_row
-
-    return f
-
-
-def _result_dtype(arr):
-    # workaround #27953
-    # ideally we just pass `dtype=arr.dtype` unconditionally, but this fails
-    # when the list of values is empty.
-    if arr.dtype.name == "string":
-        return "string"
-    else:
-        return object
-
-
-def _str_extract_noexpand(arr, pat, flags=0):
-    """
-    Find groups in each string in the Series using passed regular
-    expression. This function is called from
-    str_extract(expand=False), and can return Series, DataFrame, or
-    Index.
-
-    """
-    from pandas import DataFrame
-
-    regex = re.compile(pat, flags=flags)
-    groups_or_na = _groups_or_na_fun(regex)
-
-    if regex.groups == 1:
-        result = np.array([groups_or_na(val)[0] for val in arr], dtype=object)
-        name = _get_single_group_name(regex)
-    else:
-        if isinstance(arr, ABCIndexClass):
-            raise ValueError("only one regex group is supported with Index")
-        name = None
-        names = dict(zip(regex.groupindex.values(), regex.groupindex.keys()))
-        columns = [names.get(1 + i, i) for i in range(regex.groups)]
-        if arr.empty:
-            result = DataFrame(columns=columns, dtype=object)
-        else:
-            dtype = _result_dtype(arr)
-            result = DataFrame(
-                [groups_or_na(val) for val in arr],
-                columns=columns,
-                index=arr.index,
-                dtype=dtype,
-            )
-    return result, name
-
-
-def _str_extract_frame(arr, pat, flags=0):
-    """
-    For each subject string in the Series, extract groups from the
-    first match of regular expression pat. This function is called from
-    str_extract(expand=True), and always returns a DataFrame.
-
-    """
-    from pandas import DataFrame
-
-    regex = re.compile(pat, flags=flags)
-    groups_or_na = _groups_or_na_fun(regex)
-    names = dict(zip(regex.groupindex.values(), regex.groupindex.keys()))
-    columns = [names.get(1 + i, i) for i in range(regex.groups)]
-
-    if len(arr) == 0:
-        return DataFrame(columns=columns, dtype=object)
-    try:
-        result_index = arr.index
-    except AttributeError:
-        result_index = None
-    dtype = _result_dtype(arr)
-    return DataFrame(
-        [groups_or_na(val) for val in arr],
-        columns=columns,
-        index=result_index,
-        dtype=dtype,
-    )
-
-
-def str_extract(arr, pat, flags=0, expand=True):
-    r"""
-    Extract capture groups in the regex `pat` as columns in a DataFrame.
-
-    For each subject string in the Series, extract groups from the
-    first match of regular expression `pat`.
-
-    Parameters
-    ----------
-    pat : str
-        Regular expression pattern with capturing groups.
-    flags : int, default 0 (no flags)
-        Flags from the ``re`` module, e.g. ``re.IGNORECASE``, that
-        modify regular expression matching for things like case,
-        spaces, etc. For more details, see :mod:`re`.
-    expand : bool, default True
-        If True, return DataFrame with one column per capture group.
-        If False, return a Series/Index if there is one capture group
-        or DataFrame if there are multiple capture groups.
-
-    Returns
-    -------
-    DataFrame or Series or Index
-        A DataFrame with one row for each subject string, and one
-        column for each group. Any capture group names in regular
-        expression pat will be used for column names; otherwise
-        capture group numbers will be used. The dtype of each result
-        column is always object, even when no match is found. If
-        ``expand=False`` and pat has only one capture group, then
-        return a Series (if subject is a Series) or Index (if subject
-        is an Index).
-
-    See Also
-    --------
-    extractall : Returns all matches (not just the first match).
-
-    Examples
-    --------
-    A pattern with two groups will return a DataFrame with two columns.
-    Non-matches will be NaN.
-
-    >>> s = pd.Series(['a1', 'b2', 'c3'])
-    >>> s.str.extract(r'([ab])(\d)')
-         0    1
-    0    a    1
-    1    b    2
-    2  NaN  NaN
-
-    A pattern may contain optional groups.
-
-    >>> s.str.extract(r'([ab])?(\d)')
-         0  1
-    0    a  1
-    1    b  2
-    2  NaN  3
-
-    Named groups will become column names in the result.
-
-    >>> s.str.extract(r'(?P<letter>[ab])(?P<digit>\d)')
-      letter digit
-    0      a     1
-    1      b     2
-    2    NaN   NaN
-
-    A pattern with one group will return a DataFrame with one column
-    if expand=True.
-
-    >>> s.str.extract(r'[ab](\d)', expand=True)
-         0
-    0    1
-    1    2
-    2  NaN
-
-    A pattern with one group will return a Series if expand=False.
-
-    >>> s.str.extract(r'[ab](\d)', expand=False)
-    0      1
-    1      2
-    2    NaN
-    dtype: object
-    """
-    if not isinstance(expand, bool):
-        raise ValueError("expand must be True or False")
-    if expand:
-        return _str_extract_frame(arr._orig, pat, flags=flags)
-    else:
-        result, name = _str_extract_noexpand(arr._parent, pat, flags=flags)
-        return arr._wrap_result(result, name=name, expand=expand)
-
-
-def str_extractall(arr, pat, flags=0):
-    r"""
-    Extract capture groups in the regex `pat` as columns in DataFrame.
-
-    For each subject string in the Series, extract groups from all
-    matches of regular expression pat. When each subject string in the
-    Series has exactly one match, extractall(pat).xs(0, level='match')
-    is the same as extract(pat).
-
-    Parameters
-    ----------
-    pat : str
-        Regular expression pattern with capturing groups.
-    flags : int, default 0 (no flags)
-        A ``re`` module flag, for example ``re.IGNORECASE``. These allow
-        to modify regular expression matching for things like case, spaces,
-        etc. Multiple flags can be combined with the bitwise OR operator,
-        for example ``re.IGNORECASE | re.MULTILINE``.
-
-    Returns
-    -------
-    DataFrame
-        A ``DataFrame`` with one row for each match, and one column for each
-        group. Its rows have a ``MultiIndex`` with first levels that come from
-        the subject ``Series``. The last level is named 'match' and indexes the
-        matches in each item of the ``Series``. Any capture group names in
-        regular expression pat will be used for column names; otherwise capture
-        group numbers will be used.
-
-    See Also
-    --------
-    extract : Returns first match only (not all matches).
-
-    Examples
-    --------
-    A pattern with one group will return a DataFrame with one column.
-    Indices with no matches will not appear in the result.
-
-    >>> s = pd.Series(["a1a2", "b1", "c1"], index=["A", "B", "C"])
-    >>> s.str.extractall(r"[ab](\d)")
-             0
-      match
-    A 0      1
-      1      2
-    B 0      1
-
-    Capture group names are used for column names of the result.
-
-    >>> s.str.extractall(r"[ab](?P<digit>\d)")
-            digit
-      match
-    A 0         1
-      1         2
-    B 0         1
-
-    A pattern with two groups will return a DataFrame with two columns.
-
-    >>> s.str.extractall(r"(?P<letter>[ab])(?P<digit>\d)")
-            letter digit
-      match
-    A 0          a     1
-      1          a     2
-    B 0          b     1
-
-    Optional groups that do not match are NaN in the result.
-
-    >>> s.str.extractall(r"(?P<letter>[ab])?(?P<digit>\d)")
-            letter digit
-      match
-    A 0          a     1
-      1          a     2
-    B 0          b     1
-    C 0        NaN     1
-    """
-    regex = re.compile(pat, flags=flags)
-    # the regex must contain capture groups.
-    if regex.groups == 0:
-        raise ValueError("pattern contains no capture groups")
-
-    if isinstance(arr, ABCIndexClass):
-        arr = arr.to_series().reset_index(drop=True)
-
-    names = dict(zip(regex.groupindex.values(), regex.groupindex.keys()))
-    columns = [names.get(1 + i, i) for i in range(regex.groups)]
-    match_list = []
-    index_list = []
-    is_mi = arr.index.nlevels > 1
-
-    for subject_key, subject in arr.items():
-        if isinstance(subject, str):
-
-            if not is_mi:
-                subject_key = (subject_key,)
-
-            for match_i, match_tuple in enumerate(regex.findall(subject)):
-                if isinstance(match_tuple, str):
-                    match_tuple = (match_tuple,)
-                na_tuple = [np.NaN if group == "" else group for group in match_tuple]
-                match_list.append(na_tuple)
-                result_key = tuple(subject_key + (match_i,))
-                index_list.append(result_key)
-
-    from pandas import MultiIndex
-
-    index = MultiIndex.from_tuples(index_list, names=arr.index.names + ["match"])
-    dtype = _result_dtype(arr)
-
-    result = arr._constructor_expanddim(
-        match_list, index=index, columns=columns, dtype=dtype
-    )
-    return result
-
-
-def str_get_dummies(arr, sep="|"):
-    """
-    Return DataFrame of dummy/indicator variables for Series.
-
-    Each string in Series is split by sep and returned as a DataFrame
-    of dummy/indicator variables.
-
-    Parameters
-    ----------
-    sep : str, default "|"
-        String to split on.
-
-    Returns
-    -------
-    DataFrame
-        Dummy variables corresponding to values of the Series.
-
-    See Also
-    --------
-    get_dummies : Convert categorical variable into dummy/indicator
-        variables.
-
-    Examples
-    --------
-    >>> pd.Series(['a|b', 'a', 'a|c']).str.get_dummies()
-       a  b  c
-    0  1  1  0
-    1  1  0  0
-    2  1  0  1
-
-    >>> pd.Series(['a|b', np.nan, 'a|c']).str.get_dummies()
-       a  b  c
-    0  1  1  0
-    1  0  0  0
-    2  1  0  1
-    """
-    arr = arr.fillna("")
-    try:
-        arr = sep + arr + sep
-    except TypeError:
-        arr = sep + arr.astype(str) + sep
-
-    tags = set()
-    for ts in arr.str.split(sep):
-        tags.update(ts)
-    tags = sorted(tags - {""})
-
-    dummies = np.empty((len(arr), len(tags)), dtype=np.int64)
-
-    for i, t in enumerate(tags):
-        pat = sep + t + sep
-        dummies[:, i] = lib.map_infer(arr.to_numpy(), lambda x: pat in x)
-    return dummies, tags
-
-
-def str_join(arr, sep):
-    """
-    Join lists contained as elements in the Series/Index with passed delimiter.
-
-    If the elements of a Series are lists themselves, join the content of these
-    lists using the delimiter passed to the function.
-    This function is an equivalent to :meth:`str.join`.
-
-    Parameters
-    ----------
-    sep : str
-        Delimiter to use between list entries.
-
-    Returns
-    -------
-    Series/Index: object
-        The list entries concatenated by intervening occurrences of the
-        delimiter.
-
-    Raises
-    ------
-    AttributeError
-        If the supplied Series contains neither strings nor lists.
-
-    See Also
-    --------
-    str.join : Standard library version of this method.
-    Series.str.split : Split strings around given separator/delimiter.
-
-    Notes
-    -----
-    If any of the list items is not a string object, the result of the join
-    will be `NaN`.
-
-    Examples
-    --------
-    Example with a list that contains non-string elements.
-
-    >>> s = pd.Series([['lion', 'elephant', 'zebra'],
-    ...                [1.1, 2.2, 3.3],
-    ...                ['cat', np.nan, 'dog'],
-    ...                ['cow', 4.5, 'goat'],
-    ...                ['duck', ['swan', 'fish'], 'guppy']])
-    >>> s
-    0        [lion, elephant, zebra]
-    1                [1.1, 2.2, 3.3]
-    2                [cat, nan, dog]
-    3               [cow, 4.5, goat]
-    4    [duck, [swan, fish], guppy]
-    dtype: object
-
-    Join all lists using a '-'. The lists containing object(s) of types other
-    than str will produce a NaN.
-
-    >>> s.str.join('-')
-    0    lion-elephant-zebra
-    1                    NaN
-    2                    NaN
-    3                    NaN
-    4                    NaN
-    dtype: object
-    """
-    return _na_map(sep.join, arr, dtype=str)
-
-
-def str_findall(arr, pat, flags=0):
-    """
-    Find all occurrences of pattern or regular expression in the Series/Index.
-
-    Equivalent to applying :func:`re.findall` to all the elements in the
-    Series/Index.
-
-    Parameters
-    ----------
-    pat : str
-        Pattern or regular expression.
-    flags : int, default 0
-        Flags from ``re`` module, e.g. `re.IGNORECASE` (default is 0, which
-        means no flags).
-
-    Returns
-    -------
-    Series/Index of lists of strings
-        All non-overlapping matches of pattern or regular expression in each
-        string of this Series/Index.
-
-    See Also
-    --------
-    count : Count occurrences of pattern or regular expression in each string
-        of the Series/Index.
-    extractall : For each string in the Series, extract groups from all matches
-        of regular expression and return a DataFrame with one row for each
-        match and one column for each group.
-    re.findall : The equivalent ``re`` function to all non-overlapping matches
-        of pattern or regular expression in string, as a list of strings.
-
-    Examples
-    --------
-    >>> s = pd.Series(['Lion', 'Monkey', 'Rabbit'])
-
-    The search for the pattern 'Monkey' returns one match:
-
-    >>> s.str.findall('Monkey')
-    0          []
-    1    [Monkey]
-    2          []
-    dtype: object
-
-    On the other hand, the search for the pattern 'MONKEY' doesn't return any
-    match:
-
-    >>> s.str.findall('MONKEY')
-    0    []
-    1    []
-    2    []
-    dtype: object
-
-    Flags can be added to the pattern or regular expression. For instance,
-    to find the pattern 'MONKEY' ignoring the case:
-
-    >>> import re
-    >>> s.str.findall('MONKEY', flags=re.IGNORECASE)
-    0          []
-    1    [Monkey]
-    2          []
-    dtype: object
-
-    When the pattern matches more than one string in the Series, all matches
-    are returned:
-
-    >>> s.str.findall('on')
-    0    [on]
-    1    [on]
-    2      []
-    dtype: object
-
-    Regular expressions are supported too. For instance, the search for all the
-    strings ending with the word 'on' is shown next:
-
-    >>> s.str.findall('on$')
-    0    [on]
-    1      []
-    2      []
-    dtype: object
-
-    If the pattern is found more than once in the same string, then a list of
-    multiple strings is returned:
-
-    >>> s.str.findall('b')
-    0        []
-    1        []
-    2    [b, b]
-    dtype: object
-    """
-    regex = re.compile(pat, flags=flags)
-    return _na_map(regex.findall, arr)
-
-
-def str_find(arr, sub, start=0, end=None, side="left"):
-    """
-    Return indexes in each strings in the Series/Index where the
-    substring is fully contained between [start:end]. Return -1 on failure.
-
-    Parameters
-    ----------
-    sub : str
-        Substring being searched.
-    start : int
-        Left edge index.
-    end : int
-        Right edge index.
-    side : {'left', 'right'}, default 'left'
-        Specifies a starting side, equivalent to ``find`` or ``rfind``.
-
-    Returns
-    -------
-    Series or Index
-        Indexes where substring is found.
-    """
-    if not isinstance(sub, str):
-        msg = f"expected a string object, not {type(sub).__name__}"
-        raise TypeError(msg)
-
-    if side == "left":
-        method = "find"
-    elif side == "right":
-        method = "rfind"
-    else:  # pragma: no cover
-        raise ValueError("Invalid side")
-
-    if end is None:
-        f = lambda x: getattr(x, method)(sub, start)
-    else:
-        f = lambda x: getattr(x, method)(sub, start, end)
-
-    return _na_map(f, arr, dtype=np.dtype("int64"))
-
-
-def str_index(arr, sub, start=0, end=None, side="left"):
-    if not isinstance(sub, str):
-        msg = f"expected a string object, not {type(sub).__name__}"
-        raise TypeError(msg)
-
-    if side == "left":
-        method = "index"
-    elif side == "right":
-        method = "rindex"
-    else:  # pragma: no cover
-        raise ValueError("Invalid side")
-
-    if end is None:
-        f = lambda x: getattr(x, method)(sub, start)
-    else:
-        f = lambda x: getattr(x, method)(sub, start, end)
-
-    return _na_map(f, arr, dtype=np.dtype("int64"))
-
-
-def str_pad(arr, width, side="left", fillchar=" "):
-    """
-    Pad strings in the Series/Index up to width.
-
-    Parameters
-    ----------
-    width : int
-        Minimum width of resulting string; additional characters will be filled
-        with character defined in `fillchar`.
-    side : {'left', 'right', 'both'}, default 'left'
-        Side from which to fill resulting string.
-    fillchar : str, default ' '
-        Additional character for filling, default is whitespace.
-
-    Returns
-    -------
-    Series or Index of object
-        Returns Series or Index with minimum number of char in object.
-
-    See Also
-    --------
-    Series.str.rjust : Fills the left side of strings with an arbitrary
-        character. Equivalent to ``Series.str.pad(side='left')``.
-    Series.str.ljust : Fills the right side of strings with an arbitrary
-        character. Equivalent to ``Series.str.pad(side='right')``.
-    Series.str.center : Fills both sides of strings with an arbitrary
-        character. Equivalent to ``Series.str.pad(side='both')``.
-    Series.str.zfill : Pad strings in the Series/Index by prepending '0'
-        character. Equivalent to ``Series.str.pad(side='left', fillchar='0')``.
-
-    Examples
-    --------
-    >>> s = pd.Series(["caribou", "tiger"])
-    >>> s
-    0    caribou
-    1      tiger
-    dtype: object
-
-    >>> s.str.pad(width=10)
-    0       caribou
-    1         tiger
-    dtype: object
-
-    >>> s.str.pad(width=10, side='right', fillchar='-')
-    0    caribou---
-    1    tiger-----
-    dtype: object
-
-    >>> s.str.pad(width=10, side='both', fillchar='-')
-    0    -caribou--
-    1    --tiger---
-    dtype: object
-    """
-    if not isinstance(fillchar, str):
-        msg = f"fillchar must be a character, not {type(fillchar).__name__}"
-        raise TypeError(msg)
-
-    if len(fillchar) != 1:
-        raise TypeError("fillchar must be a character, not str")
-
-    if not is_integer(width):
-        msg = f"width must be of integer type, not {type(width).__name__}"
-        raise TypeError(msg)
-
-    if side == "left":
-        f = lambda x: x.rjust(width, fillchar)
-    elif side == "right":
-        f = lambda x: x.ljust(width, fillchar)
-    elif side == "both":
-        f = lambda x: x.center(width, fillchar)
-    else:  # pragma: no cover
-        raise ValueError("Invalid side")
-
-    return _na_map(f, arr, dtype=str)
-
-
-def str_split(arr, pat=None, n=None):
-
-    if pat is None:
-        if n is None or n == 0:
-            n = -1
-        f = lambda x: x.split(pat, n)
-    else:
-        if len(pat) == 1:
-            if n is None or n == 0:
-                n = -1
-            f = lambda x: x.split(pat, n)
-        else:
-            if n is None or n == -1:
-                n = 0
-            regex = re.compile(pat)
-            f = lambda x: regex.split(x, maxsplit=n)
-    res = _na_map(f, arr)
-    return res
-
-
-def str_rsplit(arr, pat=None, n=None):
-
-    if n is None or n == 0:
-        n = -1
-    f = lambda x: x.rsplit(pat, n)
-    res = _na_map(f, arr)
-    return res
-
-
-def str_slice(arr, start=None, stop=None, step=None):
-    """
-    Slice substrings from each element in the Series or Index.
-
-    Parameters
-    ----------
-    start : int, optional
-        Start position for slice operation.
-    stop : int, optional
-        Stop position for slice operation.
-    step : int, optional
-        Step size for slice operation.
-
-    Returns
-    -------
-    Series or Index of object
-        Series or Index from sliced substring from original string object.
-
-    See Also
-    --------
-    Series.str.slice_replace : Replace a slice with a string.
-    Series.str.get : Return element at position.
-        Equivalent to `Series.str.slice(start=i, stop=i+1)` with `i`
-        being the position.
-
-    Examples
-    --------
-    >>> s = pd.Series(["koala", "fox", "chameleon"])
-    >>> s
-    0        koala
-    1          fox
-    2    chameleon
-    dtype: object
-
-    >>> s.str.slice(start=1)
-    0        oala
-    1          ox
-    2    hameleon
-    dtype: object
-
-    >>> s.str.slice(start=-1)
-    0           a
-    1           x
-    2           n
-    dtype: object
-
-    >>> s.str.slice(stop=2)
-    0    ko
-    1    fo
-    2    ch
-    dtype: object
-
-    >>> s.str.slice(step=2)
-    0      kaa
-    1       fx
-    2    caeen
-    dtype: object
-
-    >>> s.str.slice(start=0, stop=5, step=3)
-    0    kl
-    1     f
-    2    cm
-    dtype: object
-
-    Equivalent behaviour to:
-
-    >>> s.str[0:5:3]
-    0    kl
-    1     f
-    2    cm
-    dtype: object
-    """
-    obj = slice(start, stop, step)
-    f = lambda x: x[obj]
-    return _na_map(f, arr, dtype=str)
-
-
-def str_slice_replace(arr, start=None, stop=None, repl=None):
-    """
-    Replace a positional slice of a string with another value.
-
-    Parameters
-    ----------
-    start : int, optional
-        Left index position to use for the slice. If not specified (None),
-        the slice is unbounded on the left, i.e. slice from the start
-        of the string.
-    stop : int, optional
-        Right index position to use for the slice. If not specified (None),
-        the slice is unbounded on the right, i.e. slice until the
-        end of the string.
-    repl : str, optional
-        String for replacement. If not specified (None), the sliced region
-        is replaced with an empty string.
-
-    Returns
-    -------
-    Series or Index
-        Same type as the original object.
-
-    See Also
-    --------
-    Series.str.slice : Just slicing without replacement.
-
-    Examples
-    --------
-    >>> s = pd.Series(['a', 'ab', 'abc', 'abdc', 'abcde'])
-    >>> s
-    0        a
-    1       ab
-    2      abc
-    3     abdc
-    4    abcde
-    dtype: object
-
-    Specify just `start`, meaning replace `start` until the end of the
-    string with `repl`.
-
-    >>> s.str.slice_replace(1, repl='X')
-    0    aX
-    1    aX
-    2    aX
-    3    aX
-    4    aX
-    dtype: object
-
-    Specify just `stop`, meaning the start of the string to `stop` is replaced
-    with `repl`, and the rest of the string is included.
-
-    >>> s.str.slice_replace(stop=2, repl='X')
-    0       X
-    1       X
-    2      Xc
-    3     Xdc
-    4    Xcde
-    dtype: object
-
-    Specify `start` and `stop`, meaning the slice from `start` to `stop` is
-    replaced with `repl`. Everything before or after `start` and `stop` is
-    included as is.
-
-    >>> s.str.slice_replace(start=1, stop=3, repl='X')
-    0      aX
-    1      aX
-    2      aX
-    3     aXc
-    4    aXde
-    dtype: object
-    """
-    if repl is None:
-        repl = ""
-
-    def f(x):
-        if x[start:stop] == "":
-            local_stop = start
-        else:
-            local_stop = stop
-        y = ""
-        if start is not None:
-            y += x[:start]
-        y += repl
-        if stop is not None:
-            y += x[local_stop:]
-        return y
-
-    return _na_map(f, arr, dtype=str)
-
-
-def str_strip(arr, to_strip=None, side="both"):
-    """
-    Strip whitespace (including newlines) from each string in the
-    Series/Index.
-
-    Parameters
-    ----------
-    to_strip : str or unicode
-    side : {'left', 'right', 'both'}, default 'both'
-
-    Returns
-    -------
-    Series or Index
-    """
-    if side == "both":
-        f = lambda x: x.strip(to_strip)
-    elif side == "left":
-        f = lambda x: x.lstrip(to_strip)
-    elif side == "right":
-        f = lambda x: x.rstrip(to_strip)
-    else:  # pragma: no cover
-        raise ValueError("Invalid side")
-    return _na_map(f, arr, dtype=str)
-
-
-def str_wrap(arr, width, **kwargs):
-    r"""
-    Wrap strings in Series/Index at specified line width.
-
-    This method has the same keyword parameters and defaults as
-    :class:`textwrap.TextWrapper`.
-
-    Parameters
-    ----------
-    width : int
-        Maximum line width.
-    expand_tabs : bool, optional
-        If True, tab characters will be expanded to spaces (default: True).
-    replace_whitespace : bool, optional
-        If True, each whitespace character (as defined by string.whitespace)
-        remaining after tab expansion will be replaced by a single space
-        (default: True).
-    drop_whitespace : bool, optional
-        If True, whitespace that, after wrapping, happens to end up at the
-        beginning or end of a line is dropped (default: True).
-    break_long_words : bool, optional
-        If True, then words longer than width will be broken in order to ensure
-        that no lines are longer than width. If it is false, long words will
-        not be broken, and some lines may be longer than width (default: True).
-    break_on_hyphens : bool, optional
-        If True, wrapping will occur preferably on whitespace and right after
-        hyphens in compound words, as it is customary in English. If false,
-        only whitespaces will be considered as potentially good places for line
-        breaks, but you need to set break_long_words to false if you want truly
-        insecable words (default: True).
-
-    Returns
-    -------
-    Series or Index
-
-    Notes
-    -----
-    Internally, this method uses a :class:`textwrap.TextWrapper` instance with
-    default settings. To achieve behavior matching R's stringr library str_wrap
-    function, use the arguments:
-
-    - expand_tabs = False
-    - replace_whitespace = True
-    - drop_whitespace = True
-    - break_long_words = False
-    - break_on_hyphens = False
-
-    Examples
-    --------
-    >>> s = pd.Series(['line to be wrapped', 'another line to be wrapped'])
-    >>> s.str.wrap(12)
-    0             line to be\nwrapped
-    1    another line\nto be\nwrapped
-    dtype: object
-    """
-    kwargs["width"] = width
-
-    tw = textwrap.TextWrapper(**kwargs)
-
-    return _na_map(lambda s: "\n".join(tw.wrap(s)), arr, dtype=str)
-
-
-def str_translate(arr, table):
-    """
-    Map all characters in the string through the given mapping table.
-
-    Equivalent to standard :meth:`str.translate`.
-
-    Parameters
-    ----------
-    table : dict
-        Table is a mapping of Unicode ordinals to Unicode ordinals, strings, or
-        None. Unmapped characters are left untouched.
-        Characters mapped to None are deleted. :meth:`str.maketrans` is a
-        helper function for making translation tables.
-
-    Returns
-    -------
-    Series or Index
-    """
-    return _na_map(lambda x: x.translate(table), arr, dtype=str)
-
-
-def str_get(arr, i):
-    """
-    Extract element from each component at specified position.
-
-    Extract element from lists, tuples, or strings in each element in the
-    Series/Index.
-
-    Parameters
-    ----------
-    i : int
-        Position of element to extract.
-
-    Returns
-    -------
-    Series or Index
-
-    Examples
-    --------
-    >>> s = pd.Series(["String",
-    ...               (1, 2, 3),
-    ...               ["a", "b", "c"],
-    ...               123,
-    ...               -456,
-    ...               {1: "Hello", "2": "World"}])
-    >>> s
-    0                        String
-    1                     (1, 2, 3)
-    2                     [a, b, c]
-    3                           123
-    4                          -456
-    5    {1: 'Hello', '2': 'World'}
-    dtype: object
-
-    >>> s.str.get(1)
-    0        t
-    1        2
-    2        b
-    3      NaN
-    4      NaN
-    5    Hello
-    dtype: object
-
-    >>> s.str.get(-1)
-    0      g
-    1      3
-    2      c
-    3    NaN
-    4    NaN
-    5    None
-    dtype: object
-    """
-
-    def f(x):
-        if isinstance(x, dict):
-            return x.get(i)
-        elif len(x) > i >= -len(x):
-            return x[i]
-        return np.nan
-
-    return _na_map(f, arr)
-
-
-def str_decode(arr, encoding, errors="strict"):
-    """
-    Decode character string in the Series/Index using indicated encoding.
-
-    Equivalent to :meth:`str.decode` in python2 and :meth:`bytes.decode` in
-    python3.
-
-    Parameters
-    ----------
-    encoding : str
-    errors : str, optional
-
-    Returns
-    -------
-    Series or Index
-    """
-    if encoding in _cpython_optimized_decoders:
-        # CPython optimized implementation
-        f = lambda x: x.decode(encoding, errors)
-    else:
-        decoder = codecs.getdecoder(encoding)
-        f = lambda x: decoder(x, errors)[0]
-    return _na_map(f, arr)
-
-
-def str_encode(arr, encoding, errors="strict"):
-    """
-    Encode character string in the Series/Index using indicated encoding.
-
-    Equivalent to :meth:`str.encode`.
-
-    Parameters
-    ----------
-    encoding : str
-    errors : str, optional
-
-    Returns
-    -------
-    encoded : Series/Index of objects
-    """
-    if encoding in _cpython_optimized_encoders:
-        # CPython optimized implementation
-        f = lambda x: x.encode(encoding, errors)
-    else:
-        encoder = codecs.getencoder(encoding)
-        f = lambda x: encoder(x, errors)[0]
-    return _na_map(f, arr)
-
-
-def forbid_nonstring_types(forbidden, name=None):
-    """
-    Decorator to forbid specific types for a method of StringMethods.
-
-    For calling `.str.{method}` on a Series or Index, it is necessary to first
-    initialize the :class:`StringMethods` object, and then call the method.
-    However, different methods allow different input types, and so this can not
-    be checked during :meth:`StringMethods.__init__`, but must be done on a
-    per-method basis. This decorator exists to facilitate this process, and
-    make it explicit which (inferred) types are disallowed by the method.
-
-    :meth:`StringMethods.__init__` allows the *union* of types its different
-    methods allow (after skipping NaNs; see :meth:`StringMethods._validate`),
-    namely: ['string', 'empty', 'bytes', 'mixed', 'mixed-integer'].
-
-    The default string types ['string', 'empty'] are allowed for all methods.
-    For the additional types ['bytes', 'mixed', 'mixed-integer'], each method
-    then needs to forbid the types it is not intended for.
-
-    Parameters
-    ----------
-    forbidden : list-of-str or None
-        List of forbidden non-string types, may be one or more of
-        `['bytes', 'mixed', 'mixed-integer']`.
-    name : str, default None
-        Name of the method to use in the error message. By default, this is
-        None, in which case the name from the method being wrapped will be
-        copied. However, for working with further wrappers (like _pat_wrapper
-        and _noarg_wrapper), it is necessary to specify the name.
-
-    Returns
-    -------
-    func : wrapper
-        The method to which the decorator is applied, with an added check that
-        enforces the inferred type to not be in the list of forbidden types.
-
-    Raises
-    ------
-    TypeError
-        If the inferred type of the underlying data is in `forbidden`.
-    """
-    # deal with None
-    forbidden = [] if forbidden is None else forbidden
-
-    allowed_types = {"string", "empty", "bytes", "mixed", "mixed-integer"} - set(
-        forbidden
-    )
-
-    def _forbid_nonstring_types(func):
-        func_name = func.__name__ if name is None else name
-
-        @wraps(func)
-        def wrapper(self, *args, **kwargs):
-            if self._inferred_dtype not in allowed_types:
-                msg = (
-                    f"Cannot use .str.{func_name} with values of "
-                    f"inferred dtype '{self._inferred_dtype}'."
-                )
-                raise TypeError(msg)
-            return func(self, *args, **kwargs)
-
-        wrapper.__name__ = func_name
-        return wrapper
-
-    return _forbid_nonstring_types
-
-
-def _noarg_wrapper(
-    f,
-    name=None,
-    docstring=None,
-    forbidden_types=["bytes"],
-    returns_string=True,
-    **kwargs,
-):
-    @forbid_nonstring_types(forbidden_types, name=name)
-    def wrapper(self):
-        result = _na_map(f, self._parent, **kwargs)
-        return self._wrap_result(result, returns_string=returns_string)
-
-    wrapper.__name__ = f.__name__ if name is None else name
-    if docstring is not None:
-        wrapper.__doc__ = docstring
-    else:
-        raise ValueError("Provide docstring")
-
-    return wrapper
-
-
-def _pat_wrapper(
-    f,
-    flags=False,
-    na=False,
-    name=None,
-    forbidden_types=["bytes"],
-    returns_string=True,
-    **kwargs,
-):
-    @forbid_nonstring_types(forbidden_types, name=name)
-    def wrapper1(self, pat):
-        result = f(self._parent, pat)
-        return self._wrap_result(result, returns_string=returns_string)
-
-    @forbid_nonstring_types(forbidden_types, name=name)
-    def wrapper2(self, pat, flags=0, **kwargs):
-        result = f(self._parent, pat, flags=flags, **kwargs)
-        return self._wrap_result(result, returns_string=returns_string)
-
-    @forbid_nonstring_types(forbidden_types, name=name)
-    def wrapper3(self, pat, na=np.nan):
-        result = f(self._parent, pat, na=na)
-        return self._wrap_result(result, returns_string=returns_string, fill_value=na)
-
-    wrapper = wrapper3 if na else wrapper2 if flags else wrapper1
-
-    wrapper.__name__ = f.__name__ if name is None else name
-    if f.__doc__:
-        wrapper.__doc__ = f.__doc__
-
-    return wrapper
-
-
-def copy(source):
-    """Copy a docstring from another source function (if present)"""
-
-    def do_copy(target):
-        if source.__doc__:
-            target.__doc__ = source.__doc__
-        return target
-
-    return do_copy
-
-
-class StringMethods(NoNewAttributesMixin):
-    """
-    Vectorized string functions for Series and Index.
-
-    NAs stay NA unless handled otherwise by a particular method.
-    Patterned after Python's string methods, with some inspiration from
-    R's stringr package.
-
-    Examples
-    --------
-    >>> s = pd.Series(["A_Str_Series"])
-    >>> s
-    0    A_Str_Series
-    dtype: object
-
-    >>> s.str.split("_")
-    0    [A, Str, Series]
-    dtype: object
-
-    >>> s.str.replace("_", "")
-    0    AStrSeries
-    dtype: object
-    """
-
-    def __init__(self, data):
-        self._inferred_dtype = self._validate(data)
-        self._is_categorical = is_categorical_dtype(data.dtype)
-        self._is_string = data.dtype.name == "string"
-
-        # ._values.categories works for both Series/Index
-        self._parent = data._values.categories if self._is_categorical else data
-        # save orig to blow up categoricals to the right type
-        self._orig = data
-        self._freeze()
-
-    @staticmethod
-    def _validate(data):
-        """
-        Auxiliary function for StringMethods, infers and checks dtype of data.
-
-        This is a "first line of defence" at the creation of the StringMethods-
-        object (see _make_accessor), and just checks that the dtype is in the
-        *union* of the allowed types over all string methods below; this
-        restriction is then refined on a per-method basis using the decorator
-        @forbid_nonstring_types (more info in the corresponding docstring).
-
-        This really should exclude all series/index with any non-string values,
-        but that isn't practical for performance reasons until we have a str
-        dtype (GH 9343 / 13877)
-
-        Parameters
-        ----------
-        data : The content of the Series
-
-        Returns
-        -------
-        dtype : inferred dtype of data
-        """
-        from pandas import StringDtype
-
-        if isinstance(data, ABCMultiIndex):
-            raise AttributeError(
-                "Can only use .str accessor with Index, not MultiIndex"
-            )
-
-        # see _libs/lib.pyx for list of inferred types
-        allowed_types = ["string", "empty", "bytes", "mixed", "mixed-integer"]
-
-        values = getattr(data, "values", data)  # Series / Index
-        values = getattr(values, "categories", values)  # categorical / normal
-
-        # explicitly allow StringDtype
-        if isinstance(values.dtype, StringDtype):
-            return "string"
-
-        try:
-            inferred_dtype = lib.infer_dtype(values, skipna=True)
-        except ValueError:
-            # GH#27571 mostly occurs with ExtensionArray
-            inferred_dtype = None
-
-        if inferred_dtype not in allowed_types:
-            raise AttributeError("Can only use .str accessor with string values!")
-        return inferred_dtype
-
-    def __getitem__(self, key):
-        if isinstance(key, slice):
-            return self.slice(start=key.start, stop=key.stop, step=key.step)
-        else:
-            return self.get(key)
-
-    def __iter__(self):
-        warnings.warn(
-            "Columnar iteration over characters will be deprecated in future releases.",
-            FutureWarning,
-            stacklevel=2,
-        )
-        i = 0
-        g = self.get(i)
-        while g.notna().any():
-            yield g
-            i += 1
-            g = self.get(i)
-
-    def _wrap_result(
-        self,
-        result,
-        use_codes=True,
-        name=None,
-        expand=None,
-        fill_value=np.nan,
-        returns_string=True,
-    ):
-
-        from pandas import Index, MultiIndex, Series
-
-        # for category, we do the stuff on the categories, so blow it up
-        # to the full series again
-        # But for some operations, we have to do the stuff on the full values,
-        # so make it possible to skip this step as the method already did this
-        # before the transformation...
-        if use_codes and self._is_categorical:
-            # if self._orig is a CategoricalIndex, there is no .cat-accessor
-            result = take_1d(
-                result, Series(self._orig, copy=False).cat.codes, fill_value=fill_value
-            )
-
-        if not hasattr(result, "ndim") or not hasattr(result, "dtype"):
-            return result
-        assert result.ndim < 3
-
-        # We can be wrapping a string / object / categorical result, in which
-        # case we'll want to return the same dtype as the input.
-        # Or we can be wrapping a numeric output, in which case we don't want
-        # to return a StringArray.
-        if self._is_string and returns_string:
-            dtype = "string"
-        else:
-            dtype = None
-
-        if expand is None:
-            # infer from ndim if expand is not specified
-            expand = result.ndim != 1
-
-        elif expand is True and not isinstance(self._orig, ABCIndexClass):
-            # required when expand=True is explicitly specified
-            # not needed when inferred
-
-            def cons_row(x):
-                if is_list_like(x):
-                    return x
-                else:
-                    return [x]
-
-            result = [cons_row(x) for x in result]
-            if result:
-                # propagate nan values to match longest sequence (GH 18450)
-                max_len = max(len(x) for x in result)
-                result = [
-                    x * max_len if len(x) == 0 or x[0] is np.nan else x for x in result
-                ]
-
-        if not isinstance(expand, bool):
-            raise ValueError("expand must be True or False")
-
-        if expand is False:
-            # if expand is False, result should have the same name
-            # as the original otherwise specified
-            if name is None:
-                name = getattr(result, "name", None)
-            if name is None:
-                # do not use logical or, _orig may be a DataFrame
-                # which has "name" column
-                name = self._orig.name
-
-        # Wait until we are sure result is a Series or Index before
-        # checking attributes (GH 12180)
-        if isinstance(self._orig, ABCIndexClass):
-            # if result is a boolean np.array, return the np.array
-            # instead of wrapping it into a boolean Index (GH 8875)
-            if is_bool_dtype(result):
-                return result
-
-            if expand:
-                result = list(result)
-                out = MultiIndex.from_tuples(result, names=name)
-                if out.nlevels == 1:
-                    # We had all tuples of length-one, which are
-                    # better represented as a regular Index.
-                    out = out.get_level_values(0)
-                return out
-            else:
-                return Index(result, name=name)
-        else:
-            index = self._orig.index
-            if expand:
-                cons = self._orig._constructor_expanddim
-                result = cons(result, columns=name, index=index, dtype=dtype)
-            else:
-                # Must be a Series
-                cons = self._orig._constructor
-                result = cons(result, name=name, index=index, dtype=dtype)
-            return result
-
-    def _get_series_list(self, others):
-        """
-        Auxiliary function for :meth:`str.cat`. Turn potentially mixed input
-        into a list of Series (elements without an index must match the length
-        of the calling Series/Index).
-
-        Parameters
-        ----------
-        others : Series, DataFrame, np.ndarray, list-like or list-like of
-            Objects that are either Series, Index or np.ndarray (1-dim).
-
-        Returns
-        -------
-        list of Series
-            Others transformed into list of Series.
-        """
-        from pandas import DataFrame, Series
-
-        # self._orig is either Series or Index
-        idx = self._orig if isinstance(self._orig, ABCIndexClass) else self._orig.index
-
-        # Generally speaking, all objects without an index inherit the index
-        # `idx` of the calling Series/Index - i.e. must have matching length.
-        # Objects with an index (i.e. Series/Index/DataFrame) keep their own.
-        if isinstance(others, ABCSeries):
-            return [others]
-        elif isinstance(others, ABCIndexClass):
-            return [Series(others._values, index=idx)]
-        elif isinstance(others, ABCDataFrame):
-            return [others[x] for x in others]
-        elif isinstance(others, np.ndarray) and others.ndim == 2:
-            others = DataFrame(others, index=idx)
-            return [others[x] for x in others]
-        elif is_list_like(others, allow_sets=False):
-            others = list(others)  # ensure iterators do not get read twice etc
-
-            # in case of list-like `others`, all elements must be
-            # either Series/Index/np.ndarray (1-dim)...
-            if all(
-                isinstance(x, (ABCSeries, ABCIndexClass))
-                or (isinstance(x, np.ndarray) and x.ndim == 1)
-                for x in others
-            ):
-                los = []
-                while others:  # iterate through list and append each element
-                    los = los + self._get_series_list(others.pop(0))
-                return los
-            # ... or just strings
-            elif all(not is_list_like(x) for x in others):
-                return [Series(others, index=idx)]
-        raise TypeError(
-            "others must be Series, Index, DataFrame, np.ndarray "
-            "or list-like (either containing only strings or "
-            "containing only objects of type Series/Index/"
-            "np.ndarray[1-dim])"
-        )
-
-    @forbid_nonstring_types(["bytes", "mixed", "mixed-integer"])
-    def cat(self, others=None, sep=None, na_rep=None, join="left"):
-        """
-        Concatenate strings in the Series/Index with given separator.
-
-        If `others` is specified, this function concatenates the Series/Index
-        and elements of `others` element-wise.
-        If `others` is not passed, then all values in the Series/Index are
-        concatenated into a single string with a given `sep`.
-
-        Parameters
-        ----------
-        others : Series, Index, DataFrame, np.ndarray or list-like
-            Series, Index, DataFrame, np.ndarray (one- or two-dimensional) and
-            other list-likes of strings must have the same length as the
-            calling Series/Index, with the exception of indexed objects (i.e.
-            Series/Index/DataFrame) if `join` is not None.
-
-            If others is a list-like that contains a combination of Series,
-            Index or np.ndarray (1-dim), then all elements will be unpacked and
-            must satisfy the above criteria individually.
-
-            If others is None, the method returns the concatenation of all
-            strings in the calling Series/Index.
-        sep : str, default ''
-            The separator between the different elements/columns. By default
-            the empty string `''` is used.
-        na_rep : str or None, default None
-            Representation that is inserted for all missing values:
-
-            - If `na_rep` is None, and `others` is None, missing values in the
-              Series/Index are omitted from the result.
-            - If `na_rep` is None, and `others` is not None, a row containing a
-              missing value in any of the columns (before concatenation) will
-              have a missing value in the result.
-        join : {'left', 'right', 'outer', 'inner'}, default 'left'
-            Determines the join-style between the calling Series/Index and any
-            Series/Index/DataFrame in `others` (objects without an index need
-            to match the length of the calling Series/Index). To disable
-            alignment, use `.values` on any Series/Index/DataFrame in `others`.
-
-            .. versionchanged:: 1.0.0
-                Changed default of `join` from None to `'left'`.
-
-        Returns
-        -------
-        str, Series or Index
-            If `others` is None, `str` is returned, otherwise a `Series/Index`
-            (same type as caller) of objects is returned.
-
-        See Also
-        --------
-        split : Split each string in the Series/Index.
-        join : Join lists contained as elements in the Series/Index.
-
-        Examples
-        --------
-        When not passing `others`, all values are concatenated into a single
-        string:
-
-        >>> s = pd.Series(['a', 'b', np.nan, 'd'])
-        >>> s.str.cat(sep=' ')
-        'a b d'
-
-        By default, NA values in the Series are ignored. Using `na_rep`, they
-        can be given a representation:
-
-        >>> s.str.cat(sep=' ', na_rep='?')
-        'a b ? d'
-
-        If `others` is specified, corresponding values are concatenated with
-        the separator. Result will be a Series of strings.
-
-        >>> s.str.cat(['A', 'B', 'C', 'D'], sep=',')
-        0    a,A
-        1    b,B
-        2    NaN
-        3    d,D
-        dtype: object
-
-        Missing values will remain missing in the result, but can again be
-        represented using `na_rep`
-
-        >>> s.str.cat(['A', 'B', 'C', 'D'], sep=',', na_rep='-')
-        0    a,A
-        1    b,B
-        2    -,C
-        3    d,D
-        dtype: object
-
-        If `sep` is not specified, the values are concatenated without
-        separation.
-
-        >>> s.str.cat(['A', 'B', 'C', 'D'], na_rep='-')
-        0    aA
-        1    bB
-        2    -C
-        3    dD
-        dtype: object
-
-        Series with different indexes can be aligned before concatenation. The
-        `join`-keyword works as in other methods.
-
-        >>> t = pd.Series(['d', 'a', 'e', 'c'], index=[3, 0, 4, 2])
-        >>> s.str.cat(t, join='left', na_rep='-')
-        0    aa
-        1    b-
-        2    -c
-        3    dd
-        dtype: object
-        >>>
-        >>> s.str.cat(t, join='outer', na_rep='-')
-        0    aa
-        1    b-
-        2    -c
-        3    dd
-        4    -e
-        dtype: object
-        >>>
-        >>> s.str.cat(t, join='inner', na_rep='-')
-        0    aa
-        2    -c
-        3    dd
-        dtype: object
-        >>>
-        >>> s.str.cat(t, join='right', na_rep='-')
-        3    dd
-        0    aa
-        4    -e
-        2    -c
-        dtype: object
-
-        For more examples, see :ref:`here <text.concatenate>`.
-        """
-        from pandas import Index, Series, concat
-
-        if isinstance(others, str):
-            raise ValueError("Did you mean to supply a `sep` keyword?")
-        if sep is None:
-            sep = ""
-
-        if isinstance(self._orig, ABCIndexClass):
-            data = Series(self._orig, index=self._orig)
-        else:  # Series
-            data = self._orig
-
-        # concatenate Series/Index with itself if no "others"
-        if others is None:
-            data = ensure_object(data)
-            na_mask = isna(data)
-            if na_rep is None and na_mask.any():
-                data = data[~na_mask]
-            elif na_rep is not None and na_mask.any():
-                data = np.where(na_mask, na_rep, data)
-            return sep.join(data)
-
-        try:
-            # turn anything in "others" into lists of Series
-            others = self._get_series_list(others)
-        except ValueError as err:  # do not catch TypeError raised by _get_series_list
-            raise ValueError(
-                "If `others` contains arrays or lists (or other "
-                "list-likes without an index), these must all be "
-                "of the same length as the calling Series/Index."
-            ) from err
-
-        # align if required
-        if any(not data.index.equals(x.index) for x in others):
-            # Need to add keys for uniqueness in case of duplicate columns
-            others = concat(
-                others,
-                axis=1,
-                join=(join if join == "inner" else "outer"),
-                keys=range(len(others)),
-                sort=False,
-                copy=False,
-            )
-            data, others = data.align(others, join=join)
-            others = [others[x] for x in others]  # again list of Series
-
-        all_cols = [ensure_object(x) for x in [data] + others]
-        na_masks = np.array([isna(x) for x in all_cols])
-        union_mask = np.logical_or.reduce(na_masks, axis=0)
-
-        if na_rep is None and union_mask.any():
-            # no na_rep means NaNs for all rows where any column has a NaN
-            # only necessary if there are actually any NaNs
-            result = np.empty(len(data), dtype=object)
-            np.putmask(result, union_mask, np.nan)
-
-            not_masked = ~union_mask
-            result[not_masked] = cat_safe([x[not_masked] for x in all_cols], sep)
-        elif na_rep is not None and union_mask.any():
-            # fill NaNs with na_rep in case there are actually any NaNs
-            all_cols = [
-                np.where(nm, na_rep, col) for nm, col in zip(na_masks, all_cols)
-            ]
-            result = cat_safe(all_cols, sep)
-        else:
-            # no NaNs - can just concatenate
-            result = cat_safe(all_cols, sep)
-
-        if isinstance(self._orig, ABCIndexClass):
-            # add dtype for case that result is all-NA
-            result = Index(result, dtype=object, name=self._orig.name)
-        else:  # Series
-            if is_categorical_dtype(self._orig.dtype):
-                # We need to infer the new categories.
-                dtype = None
-            else:
-                dtype = self._orig.dtype
-            result = Series(result, dtype=dtype, index=data.index, name=self._orig.name)
-        return result
-
-    _shared_docs[
-        "str_split"
-    ] = r"""
-    Split strings around given separator/delimiter.
-
-    Splits the string in the Series/Index from the %(side)s,
-    at the specified delimiter string. Equivalent to :meth:`str.%(method)s`.
-
-    Parameters
-    ----------
-    pat : str, optional
-        String or regular expression to split on.
-        If not specified, split on whitespace.
-    n : int, default -1 (all)
-        Limit number of splits in output.
-        ``None``, 0 and -1 will be interpreted as return all splits.
-    expand : bool, default False
-        Expand the split strings into separate columns.
-
-        * If ``True``, return DataFrame/MultiIndex expanding dimensionality.
-        * If ``False``, return Series/Index, containing lists of strings.
-
-    Returns
-    -------
-    Series, Index, DataFrame or MultiIndex
-        Type matches caller unless ``expand=True`` (see Notes).
-
-    See Also
-    --------
-    Series.str.split : Split strings around given separator/delimiter.
-    Series.str.rsplit : Splits string around given separator/delimiter,
-        starting from the right.
-    Series.str.join : Join lists contained as elements in the Series/Index
-        with passed delimiter.
-    str.split : Standard library version for split.
-    str.rsplit : Standard library version for rsplit.
-
-    Notes
-    -----
-    The handling of the `n` keyword depends on the number of found splits:
-
-    - If found splits > `n`,  make first `n` splits only
-    - If found splits <= `n`, make all splits
-    - If for a certain row the number of found splits < `n`,
-      append `None` for padding up to `n` if ``expand=True``
-
-    If using ``expand=True``, Series and Index callers return DataFrame and
-    MultiIndex objects, respectively.
-
-    Examples
-    --------
-    >>> s = pd.Series(
-    ...     [
-    ...         "this is a regular sentence",
-    ...         "https://docs.python.org/3/tutorial/index.html",
-    ...         np.nan
-    ...     ]
-    ... )
-    >>> s
-    0                       this is a regular sentence
-    1    https://docs.python.org/3/tutorial/index.html
-    2                                              NaN
-    dtype: object
-
-    In the default setting, the string is split by whitespace.
-
-    >>> s.str.split()
-    0                   [this, is, a, regular, sentence]
-    1    [https://docs.python.org/3/tutorial/index.html]
-    2                                                NaN
-    dtype: object
-
-    Without the `n` parameter, the outputs of `rsplit` and `split`
-    are identical.
-
-    >>> s.str.rsplit()
-    0                   [this, is, a, regular, sentence]
-    1    [https://docs.python.org/3/tutorial/index.html]
-    2                                                NaN
-    dtype: object
-
-    The `n` parameter can be used to limit the number of splits on the
-    delimiter. The outputs of `split` and `rsplit` are different.
-
-    >>> s.str.split(n=2)
-    0                     [this, is, a regular sentence]
-    1    [https://docs.python.org/3/tutorial/index.html]
-    2                                                NaN
-    dtype: object
-
-    >>> s.str.rsplit(n=2)
-    0                     [this is a, regular, sentence]
-    1    [https://docs.python.org/3/tutorial/index.html]
-    2                                                NaN
-    dtype: object
-
-    The `pat` parameter can be used to split by other characters.
-
-    >>> s.str.split(pat="/")
-    0                         [this is a regular sentence]
-    1    [https:, , docs.python.org, 3, tutorial, index...
-    2                                                  NaN
-    dtype: object
-
-    When using ``expand=True``, the split elements will expand out into
-    separate columns. If NaN is present, it is propagated throughout
-    the columns during the split.
-
-    >>> s.str.split(expand=True)
-                                                   0     1     2        3         4
-    0                                           this    is     a  regular  sentence
-    1  https://docs.python.org/3/tutorial/index.html  None  None     None      None
-    2                                            NaN   NaN   NaN      NaN       NaN
-
-    For slightly more complex use cases like splitting the html document name
-    from a url, a combination of parameter settings can be used.
-
-    >>> s.str.rsplit("/", n=1, expand=True)
-                                        0           1
-    0          this is a regular sentence        None
-    1  https://docs.python.org/3/tutorial  index.html
-    2                                 NaN         NaN
-
-    Remember to escape special characters when explicitly using regular
-    expressions.
-
-    >>> s = pd.Series(["1+1=2"])
-    >>> s
-    0    1+1=2
-    dtype: object
-    >>> s.str.split(r"\+|=", expand=True)
-         0    1    2
-    0    1    1    2
-    """
-
-    @Appender(_shared_docs["str_split"] % {"side": "beginning", "method": "split"})
-    @forbid_nonstring_types(["bytes"])
-    def split(self, pat=None, n=-1, expand=False):
-        result = str_split(self._parent, pat, n=n)
-        return self._wrap_result(result, expand=expand, returns_string=expand)
-
-    @Appender(_shared_docs["str_split"] % {"side": "end", "method": "rsplit"})
-    @forbid_nonstring_types(["bytes"])
-    def rsplit(self, pat=None, n=-1, expand=False):
-        result = str_rsplit(self._parent, pat, n=n)
-        return self._wrap_result(result, expand=expand, returns_string=expand)
-
-    _shared_docs[
-        "str_partition"
-    ] = """
-    Split the string at the %(side)s occurrence of `sep`.
-
-    This method splits the string at the %(side)s occurrence of `sep`,
-    and returns 3 elements containing the part before the separator,
-    the separator itself, and the part after the separator.
-    If the separator is not found, return %(return)s.
-
-    Parameters
-    ----------
-    sep : str, default whitespace
-        String to split on.
-    expand : bool, default True
-        If True, return DataFrame/MultiIndex expanding dimensionality.
-        If False, return Series/Index.
-
-    Returns
-    -------
-    DataFrame/MultiIndex or Series/Index of objects
-
-    See Also
-    --------
-    %(also)s
-    Series.str.split : Split strings around given separators.
-    str.partition : Standard library version.
-
-    Examples
-    --------
-
-    >>> s = pd.Series(['Linda van der Berg', 'George Pitt-Rivers'])
-    >>> s
-    0    Linda van der Berg
-    1    George Pitt-Rivers
-    dtype: object
-
-    >>> s.str.partition()
-            0  1             2
-    0   Linda     van der Berg
-    1  George      Pitt-Rivers
-
-    To partition by the last space instead of the first one:
-
-    >>> s.str.rpartition()
-                   0  1            2
-    0  Linda van der            Berg
-    1         George     Pitt-Rivers
-
-    To partition by something different than a space:
-
-    >>> s.str.partition('-')
-                        0  1       2
-    0  Linda van der Berg
-    1         George Pitt  -  Rivers
-
-    To return a Series containing tuples instead of a DataFrame:
-
-    >>> s.str.partition('-', expand=False)
-    0    (Linda van der Berg, , )
-    1    (George Pitt, -, Rivers)
-    dtype: object
-
-    Also available on indices:
-
-    >>> idx = pd.Index(['X 123', 'Y 999'])
-    >>> idx
-    Index(['X 123', 'Y 999'], dtype='object')
-
-    Which will create a MultiIndex:
-
-    >>> idx.str.partition()
-    MultiIndex([('X', ' ', '123'),
-                ('Y', ' ', '999')],
-               )
-
-    Or an index with tuples with ``expand=False``:
-
-    >>> idx.str.partition(expand=False)
-    Index([('X', ' ', '123'), ('Y', ' ', '999')], dtype='object')
-    """
-
-    @Appender(
-        _shared_docs["str_partition"]
-        % {
-            "side": "first",
-            "return": "3 elements containing the string itself, followed by two "
-            "empty strings",
-            "also": "rpartition : Split the string at the last occurrence of `sep`.",
-        }
-    )
-    @forbid_nonstring_types(["bytes"])
-    def partition(self, sep=" ", expand=True):
-        f = lambda x: x.partition(sep)
-        result = _na_map(f, self._parent)
-        return self._wrap_result(result, expand=expand, returns_string=expand)
-
-    @Appender(
-        _shared_docs["str_partition"]
-        % {
-            "side": "last",
-            "return": "3 elements containing two empty strings, followed by the "
-            "string itself",
-            "also": "partition : Split the string at the first occurrence of `sep`.",
-        }
-    )
-    @forbid_nonstring_types(["bytes"])
-    def rpartition(self, sep=" ", expand=True):
-        f = lambda x: x.rpartition(sep)
-        result = _na_map(f, self._parent)
-        return self._wrap_result(result, expand=expand, returns_string=expand)
-
-    @copy(str_get)
-    def get(self, i):
-        result = str_get(self._parent, i)
-        return self._wrap_result(result)
-
-    @copy(str_join)
-    @forbid_nonstring_types(["bytes"])
-    def join(self, sep):
-        result = str_join(self._parent, sep)
-        return self._wrap_result(result)
-
-    @copy(str_contains)
-    @forbid_nonstring_types(["bytes"])
-    def contains(self, pat, case=True, flags=0, na=np.nan, regex=True):
-        result = str_contains(
-            self._parent, pat, case=case, flags=flags, na=na, regex=regex
-        )
-        return self._wrap_result(result, fill_value=na, returns_string=False)
-
-    @copy(str_match)
-    @forbid_nonstring_types(["bytes"])
-    def match(self, pat, case=True, flags=0, na=np.nan):
-        result = str_match(self._parent, pat, case=case, flags=flags, na=na)
-        return self._wrap_result(result, fill_value=na, returns_string=False)
-
-    @copy(str_fullmatch)
-    @forbid_nonstring_types(["bytes"])
-    def fullmatch(self, pat, case=True, flags=0, na=np.nan):
-        result = str_fullmatch(self._parent, pat, case=case, flags=flags, na=na)
-        return self._wrap_result(result, fill_value=na, returns_string=False)
-
-    @copy(str_replace)
-    @forbid_nonstring_types(["bytes"])
-    def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
-        if regex is None:
-            if (
-                isinstance(pat, str)
-                and len(pat) > 1
-                and any(c in pat for c in ".+*|^$?[](){}\\")
-            ):
-                # warn only in cases where regex behavior would differ from literal
-                msg = (
-                    "The default value of regex will change from "
-                    "True to False in a future version."
-                )
-                warnings.warn(msg, FutureWarning, stacklevel=3)
-            regex = True
-        result = str_replace(
-            self._parent, pat, repl, n=n, case=case, flags=flags, regex=regex
-        )
-        return self._wrap_result(result)
-
-    @copy(str_repeat)
-    @forbid_nonstring_types(["bytes"])
-    def repeat(self, repeats):
-        result = str_repeat(self._parent, repeats)
-        return self._wrap_result(result)
-
-    @copy(str_pad)
-    @forbid_nonstring_types(["bytes"])
-    def pad(self, width, side="left", fillchar=" "):
-        result = str_pad(self._parent, width, side=side, fillchar=fillchar)
-        return self._wrap_result(result)
-
-    _shared_docs[
-        "str_pad"
-    ] = """
-    Pad %(side)s side of strings in the Series/Index.
-
-    Equivalent to :meth:`str.%(method)s`.
-
-    Parameters
-    ----------
-    width : int
-        Minimum width of resulting string; additional characters will be filled
-        with ``fillchar``.
-    fillchar : str
-        Additional character for filling, default is whitespace.
-
-    Returns
-    -------
-    filled : Series/Index of objects.
-    """
-
-    @Appender(_shared_docs["str_pad"] % dict(side="left and right", method="center"))
-    @forbid_nonstring_types(["bytes"])
-    def center(self, width, fillchar=" "):
-        return self.pad(width, side="both", fillchar=fillchar)
-
-    @Appender(_shared_docs["str_pad"] % dict(side="right", method="ljust"))
-    @forbid_nonstring_types(["bytes"])
-    def ljust(self, width, fillchar=" "):
-        return self.pad(width, side="right", fillchar=fillchar)
-
-    @Appender(_shared_docs["str_pad"] % dict(side="left", method="rjust"))
-    @forbid_nonstring_types(["bytes"])
-    def rjust(self, width, fillchar=" "):
-        return self.pad(width, side="left", fillchar=fillchar)
-
-    @forbid_nonstring_types(["bytes"])
-    def zfill(self, width):
-        """
-        Pad strings in the Series/Index by prepending '0' characters.
-
-        Strings in the Series/Index are padded with '0' characters on the
-        left of the string to reach a total string length  `width`. Strings
-        in the Series/Index with length greater or equal to `width` are
-        unchanged.
-
-        Parameters
-        ----------
-        width : int
-            Minimum length of resulting string; strings with length less
-            than `width` be prepended with '0' characters.
-
-        Returns
-        -------
-        Series/Index of objects.
-
-        See Also
-        --------
-        Series.str.rjust : Fills the left side of strings with an arbitrary
-            character.
-        Series.str.ljust : Fills the right side of strings with an arbitrary
-            character.
-        Series.str.pad : Fills the specified sides of strings with an arbitrary
-            character.
-        Series.str.center : Fills both sides of strings with an arbitrary
-            character.
-
-        Notes
-        -----
-        Differs from :meth:`str.zfill` which has special handling
-        for '+'/'-' in the string.
-
-        Examples
-        --------
-        >>> s = pd.Series(['-1', '1', '1000', 10, np.nan])
-        >>> s
-        0      -1
-        1       1
-        2    1000
-        3      10
-        4     NaN
-        dtype: object
-
-        Note that ``10`` and ``NaN`` are not strings, therefore they are
-        converted to ``NaN``. The minus sign in ``'-1'`` is treated as a
-        regular character and the zero is added to the left of it
-        (:meth:`str.zfill` would have moved it to the left). ``1000``
-        remains unchanged as it is longer than `width`.
-
-        >>> s.str.zfill(3)
-        0     0-1
-        1     001
-        2    1000
-        3     NaN
-        4     NaN
-        dtype: object
-        """
-        result = str_pad(self._parent, width, side="left", fillchar="0")
-        return self._wrap_result(result)
-
-    @copy(str_slice)
-    def slice(self, start=None, stop=None, step=None):
-        result = str_slice(self._parent, start, stop, step)
-        return self._wrap_result(result)
-
-    @copy(str_slice_replace)
-    @forbid_nonstring_types(["bytes"])
-    def slice_replace(self, start=None, stop=None, repl=None):
-        result = str_slice_replace(self._parent, start, stop, repl)
-        return self._wrap_result(result)
-
-    @copy(str_decode)
-    def decode(self, encoding, errors="strict"):
-        # need to allow bytes here
-        result = str_decode(self._parent, encoding, errors)
-        # TODO: Not sure how to handle this.
-        return self._wrap_result(result, returns_string=False)
-
-    @copy(str_encode)
-    @forbid_nonstring_types(["bytes"])
-    def encode(self, encoding, errors="strict"):
-        result = str_encode(self._parent, encoding, errors)
-        return self._wrap_result(result, returns_string=False)
-
-    _shared_docs[
-        "str_strip"
-    ] = r"""
-    Remove %(position)s characters.
-
-    Strip whitespaces (including newlines) or a set of specified characters
-    from each string in the Series/Index from %(side)s.
-    Equivalent to :meth:`str.%(method)s`.
-
-    Parameters
-    ----------
-    to_strip : str or None, default None
-        Specifying the set of characters to be removed.
-        All combinations of this set of characters will be stripped.
-        If None then whitespaces are removed.
-
-    Returns
-    -------
-    Series or Index of object
-
-    See Also
-    --------
-    Series.str.strip : Remove leading and trailing characters in Series/Index.
-    Series.str.lstrip : Remove leading characters in Series/Index.
-    Series.str.rstrip : Remove trailing characters in Series/Index.
-
-    Examples
-    --------
-    >>> s = pd.Series(['1. Ant.  ', '2. Bee!\n', '3. Cat?\t', np.nan])
-    >>> s
-    0    1. Ant.
-    1    2. Bee!\n
-    2    3. Cat?\t
-    3          NaN
-    dtype: object
-
-    >>> s.str.strip()
-    0    1. Ant.
-    1    2. Bee!
-    2    3. Cat?
-    3        NaN
-    dtype: object
-
-    >>> s.str.lstrip('123.')
-    0    Ant.
-    1    Bee!\n
-    2    Cat?\t
-    3       NaN
-    dtype: object
-
-    >>> s.str.rstrip('.!? \n\t')
-    0    1. Ant
-    1    2. Bee
-    2    3. Cat
-    3       NaN
-    dtype: object
-
-    >>> s.str.strip('123.!? \n\t')
-    0    Ant
-    1    Bee
-    2    Cat
-    3    NaN
-    dtype: object
-    """
-
-    @Appender(
-        _shared_docs["str_strip"]
-        % dict(
-            side="left and right sides", method="strip", position="leading and trailing"
-        )
-    )
-    @forbid_nonstring_types(["bytes"])
-    def strip(self, to_strip=None):
-        result = str_strip(self._parent, to_strip, side="both")
-        return self._wrap_result(result)
-
-    @Appender(
-        _shared_docs["str_strip"]
-        % dict(side="left side", method="lstrip", position="leading")
-    )
-    @forbid_nonstring_types(["bytes"])
-    def lstrip(self, to_strip=None):
-        result = str_strip(self._parent, to_strip, side="left")
-        return self._wrap_result(result)
-
-    @Appender(
-        _shared_docs["str_strip"]
-        % dict(side="right side", method="rstrip", position="trailing")
-    )
-    @forbid_nonstring_types(["bytes"])
-    def rstrip(self, to_strip=None):
-        result = str_strip(self._parent, to_strip, side="right")
-        return self._wrap_result(result)
-
-    @copy(str_wrap)
-    @forbid_nonstring_types(["bytes"])
-    def wrap(self, width, **kwargs):
-        result = str_wrap(self._parent, width, **kwargs)
-        return self._wrap_result(result)
-
-    @copy(str_get_dummies)
-    @forbid_nonstring_types(["bytes"])
-    def get_dummies(self, sep="|"):
-        # we need to cast to Series of strings as only that has all
-        # methods available for making the dummies...
-        data = self._orig.astype(str) if self._is_categorical else self._parent
-        result, name = str_get_dummies(data, sep)
-        return self._wrap_result(
-            result,
-            use_codes=(not self._is_categorical),
-            name=name,
-            expand=True,
-            returns_string=False,
-        )
-
-    @copy(str_translate)
-    @forbid_nonstring_types(["bytes"])
-    def translate(self, table):
-        result = str_translate(self._parent, table)
-        return self._wrap_result(result)
-
-    count = _pat_wrapper(str_count, flags=True, name="count", returns_string=False)
-    startswith = _pat_wrapper(
-        str_startswith, na=True, name="startswith", returns_string=False
-    )
-    endswith = _pat_wrapper(
-        str_endswith, na=True, name="endswith", returns_string=False
-    )
-    findall = _pat_wrapper(
-        str_findall, flags=True, name="findall", returns_string=False
-    )
-
-    @copy(str_extract)
-    @forbid_nonstring_types(["bytes"])
-    def extract(self, pat, flags=0, expand=True):
-        return str_extract(self, pat, flags=flags, expand=expand)
-
-    @copy(str_extractall)
-    @forbid_nonstring_types(["bytes"])
-    def extractall(self, pat, flags=0):
-        return str_extractall(self._orig, pat, flags=flags)
-
-    _shared_docs[
-        "find"
-    ] = """
-    Return %(side)s indexes in each strings in the Series/Index.
-
-    Each of returned indexes corresponds to the position where the
-    substring is fully contained between [start:end]. Return -1 on
-    failure. Equivalent to standard :meth:`str.%(method)s`.
-
-    Parameters
-    ----------
-    sub : str
-        Substring being searched.
-    start : int
-        Left edge index.
-    end : int
-        Right edge index.
-
-    Returns
-    -------
-    Series or Index of int.
-
-    See Also
-    --------
-    %(also)s
-    """
-
-    @Appender(
-        _shared_docs["find"]
-        % dict(
-            side="lowest",
-            method="find",
-            also="rfind : Return highest indexes in each strings.",
-        )
-    )
-    @forbid_nonstring_types(["bytes"])
-    def find(self, sub, start=0, end=None):
-        result = str_find(self._parent, sub, start=start, end=end, side="left")
-        return self._wrap_result(result, returns_string=False)
-
-    @Appender(
-        _shared_docs["find"]
-        % dict(
-            side="highest",
-            method="rfind",
-            also="find : Return lowest indexes in each strings.",
-        )
-    )
-    @forbid_nonstring_types(["bytes"])
-    def rfind(self, sub, start=0, end=None):
-        result = str_find(self._parent, sub, start=start, end=end, side="right")
-        return self._wrap_result(result, returns_string=False)
-
-    @forbid_nonstring_types(["bytes"])
-    def normalize(self, form):
-        """
-        Return the Unicode normal form for the strings in the Series/Index.
-
-        For more information on the forms, see the
-        :func:`unicodedata.normalize`.
-
-        Parameters
-        ----------
-        form : {'NFC', 'NFKC', 'NFD', 'NFKD'}
-            Unicode form.
-
-        Returns
-        -------
-        normalized : Series/Index of objects
-        """
-        import unicodedata
-
-        f = lambda x: unicodedata.normalize(form, x)
-        result = _na_map(f, self._parent, dtype=str)
-        return self._wrap_result(result)
-
-    _shared_docs[
-        "index"
-    ] = """
-    Return %(side)s indexes in each string in Series/Index.
-
-    Each of the returned indexes corresponds to the position where the
-    substring is fully contained between [start:end]. This is the same
-    as ``str.%(similar)s`` except instead of returning -1, it raises a
-    ValueError when the substring is not found. Equivalent to standard
-    ``str.%(method)s``.
-
-    Parameters
-    ----------
-    sub : str
-        Substring being searched.
-    start : int
-        Left edge index.
-    end : int
-        Right edge index.
-
-    Returns
-    -------
-    Series or Index of object
-
-    See Also
-    --------
-    %(also)s
-    """
-
-    @Appender(
-        _shared_docs["index"]
-        % dict(
-            side="lowest",
-            similar="find",
-            method="index",
-            also="rindex : Return highest indexes in each strings.",
-        )
-    )
-    @forbid_nonstring_types(["bytes"])
-    def index(self, sub, start=0, end=None):
-        result = str_index(self._parent, sub, start=start, end=end, side="left")
-        return self._wrap_result(result, returns_string=False)
-
-    @Appender(
-        _shared_docs["index"]
-        % dict(
-            side="highest",
-            similar="rfind",
-            method="rindex",
-            also="index : Return lowest indexes in each strings.",
-        )
-    )
-    @forbid_nonstring_types(["bytes"])
-    def rindex(self, sub, start=0, end=None):
-        result = str_index(self._parent, sub, start=start, end=end, side="right")
-        return self._wrap_result(result, returns_string=False)
-
-    _shared_docs[
-        "len"
-    ] = """
-    Compute the length of each element in the Series/Index.
-
-    The element may be a sequence (such as a string, tuple or list) or a collection
-    (such as a dictionary).
-
-    Returns
-    -------
-    Series or Index of int
-        A Series or Index of integer values indicating the length of each
-        element in the Series or Index.
-
-    See Also
-    --------
-    str.len : Python built-in function returning the length of an object.
-    Series.size : Returns the length of the Series.
-
-    Examples
-    --------
-    Returns the length (number of characters) in a string. Returns the
-    number of entries for dictionaries, lists or tuples.
-
-    >>> s = pd.Series(['dog',
-    ...                 '',
-    ...                 5,
-    ...                 {'foo' : 'bar'},
-    ...                 [2, 3, 5, 7],
-    ...                 ('one', 'two', 'three')])
-    >>> s
-    0                  dog
-    1
-    2                    5
-    3       {'foo': 'bar'}
-    4         [2, 3, 5, 7]
-    5    (one, two, three)
-    dtype: object
-    >>> s.str.len()
-    0    3.0
-    1    0.0
-    2    NaN
-    3    1.0
-    4    4.0
-    5    3.0
-    dtype: float64
-    """
-    len = _noarg_wrapper(
-        len,
-        docstring=_shared_docs["len"],
-        forbidden_types=None,
-        dtype=np.dtype("int64"),
-        returns_string=False,
-    )
-
-    _shared_docs[
-        "casemethods"
-    ] = """
-    Convert strings in the Series/Index to %(type)s.
-    %(version)s
-    Equivalent to :meth:`str.%(method)s`.
-
-    Returns
-    -------
-    Series or Index of object
-
-    See Also
-    --------
-    Series.str.lower : Converts all characters to lowercase.
-    Series.str.upper : Converts all characters to uppercase.
-    Series.str.title : Converts first character of each word to uppercase and
-        remaining to lowercase.
-    Series.str.capitalize : Converts first character to uppercase and
-        remaining to lowercase.
-    Series.str.swapcase : Converts uppercase to lowercase and lowercase to
-        uppercase.
-    Series.str.casefold: Removes all case distinctions in the string.
-
-    Examples
-    --------
-    >>> s = pd.Series(['lower', 'CAPITALS', 'this is a sentence', 'SwApCaSe'])
-    >>> s
-    0                 lower
-    1              CAPITALS
-    2    this is a sentence
-    3              SwApCaSe
-    dtype: object
-
-    >>> s.str.lower()
-    0                 lower
-    1              capitals
-    2    this is a sentence
-    3              swapcase
-    dtype: object
-
-    >>> s.str.upper()
-    0                 LOWER
-    1              CAPITALS
-    2    THIS IS A SENTENCE
-    3              SWAPCASE
-    dtype: object
-
-    >>> s.str.title()
-    0                 Lower
-    1              Capitals
-    2    This Is A Sentence
-    3              Swapcase
-    dtype: object
-
-    >>> s.str.capitalize()
-    0                 Lower
-    1              Capitals
-    2    This is a sentence
-    3              Swapcase
-    dtype: object
-
-    >>> s.str.swapcase()
-    0                 LOWER
-    1              capitals
-    2    THIS IS A SENTENCE
-    3              sWaPcAsE
-    dtype: object
-    """
-
-    # _doc_args holds dict of strings to use in substituting casemethod docs
-    _doc_args: Dict[str, Dict[str, str]] = {}
-    _doc_args["lower"] = dict(type="lowercase", method="lower", version="")
-    _doc_args["upper"] = dict(type="uppercase", method="upper", version="")
-    _doc_args["title"] = dict(type="titlecase", method="title", version="")
-    _doc_args["capitalize"] = dict(
-        type="be capitalized", method="capitalize", version=""
-    )
-    _doc_args["swapcase"] = dict(type="be swapcased", method="swapcase", version="")
-    _doc_args["casefold"] = dict(
-        type="be casefolded",
-        method="casefold",
-        version="\n    .. versionadded:: 0.25.0\n",
-    )
-    lower = _noarg_wrapper(
-        lambda x: x.lower(),
-        name="lower",
-        docstring=_shared_docs["casemethods"] % _doc_args["lower"],
-        dtype=str,
-    )
-    upper = _noarg_wrapper(
-        lambda x: x.upper(),
-        name="upper",
-        docstring=_shared_docs["casemethods"] % _doc_args["upper"],
-        dtype=str,
-    )
-    title = _noarg_wrapper(
-        lambda x: x.title(),
-        name="title",
-        docstring=_shared_docs["casemethods"] % _doc_args["title"],
-        dtype=str,
-    )
-    capitalize = _noarg_wrapper(
-        lambda x: x.capitalize(),
-        name="capitalize",
-        docstring=_shared_docs["casemethods"] % _doc_args["capitalize"],
-        dtype=str,
-    )
-    swapcase = _noarg_wrapper(
-        lambda x: x.swapcase(),
-        name="swapcase",
-        docstring=_shared_docs["casemethods"] % _doc_args["swapcase"],
-        dtype=str,
-    )
-    casefold = _noarg_wrapper(
-        lambda x: x.casefold(),
-        name="casefold",
-        docstring=_shared_docs["casemethods"] % _doc_args["casefold"],
-        dtype=str,
-    )
-
-    _shared_docs[
-        "ismethods"
-    ] = """
-    Check whether all characters in each string are %(type)s.
-
-    This is equivalent to running the Python string method
-    :meth:`str.%(method)s` for each element of the Series/Index. If a string
-    has zero characters, ``False`` is returned for that check.
-
-    Returns
-    -------
-    Series or Index of bool
-        Series or Index of boolean values with the same length as the original
-        Series/Index.
-
-    See Also
-    --------
-    Series.str.isalpha : Check whether all characters are alphabetic.
-    Series.str.isnumeric : Check whether all characters are numeric.
-    Series.str.isalnum : Check whether all characters are alphanumeric.
-    Series.str.isdigit : Check whether all characters are digits.
-    Series.str.isdecimal : Check whether all characters are decimal.
-    Series.str.isspace : Check whether all characters are whitespace.
-    Series.str.islower : Check whether all characters are lowercase.
-    Series.str.isupper : Check whether all characters are uppercase.
-    Series.str.istitle : Check whether all characters are titlecase.
-
-    Examples
-    --------
-    **Checks for Alphabetic and Numeric Characters**
-
-    >>> s1 = pd.Series(['one', 'one1', '1', ''])
-
-    >>> s1.str.isalpha()
-    0     True
-    1    False
-    2    False
-    3    False
-    dtype: bool
-
-    >>> s1.str.isnumeric()
-    0    False
-    1    False
-    2     True
-    3    False
-    dtype: bool
-
-    >>> s1.str.isalnum()
-    0     True
-    1     True
-    2     True
-    3    False
-    dtype: bool
-
-    Note that checks against characters mixed with any additional punctuation
-    or whitespace will evaluate to false for an alphanumeric check.
-
-    >>> s2 = pd.Series(['A B', '1.5', '3,000'])
-    >>> s2.str.isalnum()
-    0    False
-    1    False
-    2    False
-    dtype: bool
-
-    **More Detailed Checks for Numeric Characters**
-
-    There are several different but overlapping sets of numeric characters that
-    can be checked for.
-
-    >>> s3 = pd.Series(['23', '³', '⅕', ''])
-
-    The ``s3.str.isdecimal`` method checks for characters used to form numbers
-    in base 10.
-
-    >>> s3.str.isdecimal()
-    0     True
-    1    False
-    2    False
-    3    False
-    dtype: bool
-
-    The ``s.str.isdigit`` method is the same as ``s3.str.isdecimal`` but also
-    includes special digits, like superscripted and subscripted digits in
-    unicode.
-
-    >>> s3.str.isdigit()
-    0     True
-    1     True
-    2    False
-    3    False
-    dtype: bool
-
-    The ``s.str.isnumeric`` method is the same as ``s3.str.isdigit`` but also
-    includes other characters that can represent quantities such as unicode
-    fractions.
-
-    >>> s3.str.isnumeric()
-    0     True
-    1     True
-    2     True
-    3    False
-    dtype: bool
-
-    **Checks for Whitespace**
-
-    >>> s4 = pd.Series([' ', '\\t\\r\\n ', ''])
-    >>> s4.str.isspace()
-    0     True
-    1     True
-    2    False
-    dtype: bool
-
-    **Checks for Character Case**
-
-    >>> s5 = pd.Series(['leopard', 'Golden Eagle', 'SNAKE', ''])
-
-    >>> s5.str.islower()
-    0     True
-    1    False
-    2    False
-    3    False
-    dtype: bool
-
-    >>> s5.str.isupper()
-    0    False
-    1    False
-    2     True
-    3    False
-    dtype: bool
-
-    The ``s5.str.istitle`` method checks for whether all words are in title
-    case (whether only the first letter of each word is capitalized). Words are
-    assumed to be as any sequence of non-numeric characters separated by
-    whitespace characters.
-
-    >>> s5.str.istitle()
-    0    False
-    1     True
-    2    False
-    3    False
-    dtype: bool
-    """
-    _doc_args["isalnum"] = dict(type="alphanumeric", method="isalnum")
-    _doc_args["isalpha"] = dict(type="alphabetic", method="isalpha")
-    _doc_args["isdigit"] = dict(type="digits", method="isdigit")
-    _doc_args["isspace"] = dict(type="whitespace", method="isspace")
-    _doc_args["islower"] = dict(type="lowercase", method="islower")
-    _doc_args["isupper"] = dict(type="uppercase", method="isupper")
-    _doc_args["istitle"] = dict(type="titlecase", method="istitle")
-    _doc_args["isnumeric"] = dict(type="numeric", method="isnumeric")
-    _doc_args["isdecimal"] = dict(type="decimal", method="isdecimal")
-    # force _noarg_wrapper return type with dtype=np.dtype(bool) (GH 29624)
-    isalnum = _noarg_wrapper(
-        lambda x: x.isalnum(),
-        name="isalnum",
-        docstring=_shared_docs["ismethods"] % _doc_args["isalnum"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    isalpha = _noarg_wrapper(
-        lambda x: x.isalpha(),
-        name="isalpha",
-        docstring=_shared_docs["ismethods"] % _doc_args["isalpha"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    isdigit = _noarg_wrapper(
-        lambda x: x.isdigit(),
-        name="isdigit",
-        docstring=_shared_docs["ismethods"] % _doc_args["isdigit"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    isspace = _noarg_wrapper(
-        lambda x: x.isspace(),
-        name="isspace",
-        docstring=_shared_docs["ismethods"] % _doc_args["isspace"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    islower = _noarg_wrapper(
-        lambda x: x.islower(),
-        name="islower",
-        docstring=_shared_docs["ismethods"] % _doc_args["islower"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    isupper = _noarg_wrapper(
-        lambda x: x.isupper(),
-        name="isupper",
-        docstring=_shared_docs["ismethods"] % _doc_args["isupper"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    istitle = _noarg_wrapper(
-        lambda x: x.istitle(),
-        name="istitle",
-        docstring=_shared_docs["ismethods"] % _doc_args["istitle"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    isnumeric = _noarg_wrapper(
-        lambda x: x.isnumeric(),
-        name="isnumeric",
-        docstring=_shared_docs["ismethods"] % _doc_args["isnumeric"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-    isdecimal = _noarg_wrapper(
-        lambda x: x.isdecimal(),
-        name="isdecimal",
-        docstring=_shared_docs["ismethods"] % _doc_args["isdecimal"],
-        returns_string=False,
-        dtype=np.dtype(bool),
-    )
-
-    @classmethod
-    def _make_accessor(cls, data):
-        cls._validate(data)
-        return cls(data)

From 20bfe1615e718963133ed5c55c4d3b371c17261d Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Wed, 30 Sep 2020 18:20:18 -0500
Subject: [PATCH 21/30] Note

---
 doc/source/whatsnew/v1.2.0.rst | 1 +
 1 file changed, 1 insertion(+)

diff --git a/doc/source/whatsnew/v1.2.0.rst b/doc/source/whatsnew/v1.2.0.rst
index ddee06aeab779..c74065c9dbab9 100644
--- a/doc/source/whatsnew/v1.2.0.rst
+++ b/doc/source/whatsnew/v1.2.0.rst
@@ -264,6 +264,7 @@ Deprecations
 - Deprecated indexing :class:`DataFrame` rows with datetime-like strings ``df[string]``, use ``df.loc[string]`` instead (:issue:`36179`)
 - Deprecated casting an object-dtype index of ``datetime`` objects to :class:`DatetimeIndex` in the :class:`Series` constructor (:issue:`23598`)
 - Deprecated :meth:`Index.is_all_dates` (:issue:`27744`)
+- The default value of ``regex`` for :meth:`Series.str.replace` will change from ``True`` to ``False`` in a future release (:issue:`24804`)
 
 .. ---------------------------------------------------------------------------
 

From cea44a77b5d49bf066ffcaa9f9c78f767bbd61a5 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Thu, 1 Oct 2020 08:29:38 -0500
Subject: [PATCH 22/30] Fix

---
 doc/source/user_guide/text.rst | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 6907864bf4317..ba4f2407afbc1 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -314,7 +314,10 @@ positional argument (a regex object) and return a string.
        return m.group(0)[::-1]
 
 
-   pd.Series(["foo 123", "bar baz", np.nan], dtype="string").str.replace(pat, repl, regex=True)
+   pd.Series(
+       ["foo 123", "bar baz", np.nan],
+       dtype="string"
+   ).str.replace(pat, repl, regex=True)
 
    # Using regex groups
    pat = r"(?P<one>\w+) (?P<two>\w+) (?P<three>\w+)"

From f87201123c250864cdd20d5f793965315b554d00 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Wed, 7 Oct 2020 10:06:01 -0500
Subject: [PATCH 23/30] Update warning

---
 doc/source/whatsnew/v1.2.0.rst  |  2 +-
 pandas/core/strings/accessor.py | 15 ++++++++-------
 2 files changed, 9 insertions(+), 8 deletions(-)

diff --git a/doc/source/whatsnew/v1.2.0.rst b/doc/source/whatsnew/v1.2.0.rst
index 2e9c7d9aef216..fc2e3f9ad5072 100644
--- a/doc/source/whatsnew/v1.2.0.rst
+++ b/doc/source/whatsnew/v1.2.0.rst
@@ -287,7 +287,7 @@ Deprecations
 - Deprecated indexing :class:`DataFrame` rows with datetime-like strings ``df[string]``, use ``df.loc[string]`` instead (:issue:`36179`)
 - Deprecated casting an object-dtype index of ``datetime`` objects to :class:`DatetimeIndex` in the :class:`Series` constructor (:issue:`23598`)
 - Deprecated :meth:`Index.is_all_dates` (:issue:`27744`)
-- The default value of ``regex`` for :meth:`Series.str.replace` will change from ``True`` to ``False`` in a future release (:issue:`24804`)
+- The default value of ``regex`` for :meth:`Series.str.replace` will change from ``True`` to ``False`` in a future release. In addition, single character regexes will not be treated as literal strings when ``regex=True`` is set. (:issue:`24804`)
 - Deprecated automatic alignment on comparison operations between :class:`DataFrame` and :class:`Series`, do ``frame, ser = frame.align(ser, axis=1, copy=False)`` before e.g. ``frame == ser`` (:issue:`28759`)
 - :meth:`Rolling.count` with ``min_periods=None`` will default to the size of the window in a future version (:issue:`31302`)
 - :meth:`Index.ravel` returning a ``np.ndarray`` is deprecated, in the future this will return a view on the same index (:issue:`19956`)
diff --git a/pandas/core/strings/accessor.py b/pandas/core/strings/accessor.py
index edcaf9416fc7d..f0824a84f13bb 100644
--- a/pandas/core/strings/accessor.py
+++ b/pandas/core/strings/accessor.py
@@ -1289,16 +1289,17 @@ def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
         dtype: object
         """
         if regex is None:
-            if (
-                isinstance(pat, str)
-                and len(pat) > 1
-                and any(c in pat for c in ".+*|^$?[](){}\\")
-            ):
+            if isinstance(pat, str) and any(c in pat for c in ".+*|^$?[](){}\\"):
                 # warn only in cases where regex behavior would differ from literal
                 msg = (
-                    "The default value of regex will change from "
-                    "True to False in a future version."
+                    "The default value of regex will change from True to False "
+                    "in a future version."
                 )
+                if len(pat) == 1:
+                    msg += (
+                        " In addition, single character regexes will not be "
+                        "treated as literal strings when regex=True."
+                    )
                 warnings.warn(msg, FutureWarning, stacklevel=3)
             regex = True
         result = self._array._str_replace(

From c0a473efaf77e405839a2f025053cbcb2f29c578 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Wed, 7 Oct 2020 10:56:53 -0500
Subject: [PATCH 24/30] rst lint

---
 doc/source/user_guide/text.rst | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 61a841645f323..895f2857355e5 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -328,7 +328,9 @@ positional argument (a regex object) and return a string.
        return m.group("two").swapcase()
 
 
-   pd.Series(["Foo Bar Baz", np.nan], dtype="string").str.replace(pat, repl, regex=True)
+   pd.Series(["Foo Bar Baz", np.nan], dtype="string").str.replace(
+       pat, repl, regex=True
+   )
 
 The ``replace`` method also accepts a compiled regular expression object
 from :func:`re.compile` as a pattern. All flags should be included in the

From 89013db528cc1de15d171af4d0253a7dec9aa9db Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Fri, 9 Oct 2020 15:52:36 -0500
Subject: [PATCH 25/30] Nit + emphasis

---
 doc/source/whatsnew/v1.2.0.rst  | 2 +-
 pandas/core/strings/accessor.py | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/doc/source/whatsnew/v1.2.0.rst b/doc/source/whatsnew/v1.2.0.rst
index 38f6debb1ee56..c56e754c6abdf 100644
--- a/doc/source/whatsnew/v1.2.0.rst
+++ b/doc/source/whatsnew/v1.2.0.rst
@@ -287,7 +287,7 @@ Deprecations
 - Deprecated indexing :class:`DataFrame` rows with datetime-like strings ``df[string]``, use ``df.loc[string]`` instead (:issue:`36179`)
 - Deprecated casting an object-dtype index of ``datetime`` objects to :class:`DatetimeIndex` in the :class:`Series` constructor (:issue:`23598`)
 - Deprecated :meth:`Index.is_all_dates` (:issue:`27744`)
-- The default value of ``regex`` for :meth:`Series.str.replace` will change from ``True`` to ``False`` in a future release. In addition, single character regexes will not be treated as literal strings when ``regex=True`` is set. (:issue:`24804`)
+- The default value of ``regex`` for :meth:`Series.str.replace` will change from ``True`` to ``False`` in a future release. In addition, single character regular expressions will *not* be treated as literal strings when ``regex=True`` is set. (:issue:`24804`)
 - Deprecated automatic alignment on comparison operations between :class:`DataFrame` and :class:`Series`, do ``frame, ser = frame.align(ser, axis=1, copy=False)`` before e.g. ``frame == ser`` (:issue:`28759`)
 - :meth:`Rolling.count` with ``min_periods=None`` will default to the size of the window in a future version (:issue:`31302`)
 - Deprecated slice-indexing on timezone-aware :class:`DatetimeIndex` with naive ``datetime`` objects, to match scalar indexing behavior (:issue:`36148`)
diff --git a/pandas/core/strings/accessor.py b/pandas/core/strings/accessor.py
index f0824a84f13bb..df37cd47a9e7c 100644
--- a/pandas/core/strings/accessor.py
+++ b/pandas/core/strings/accessor.py
@@ -1297,8 +1297,8 @@ def replace(self, pat, repl, n=-1, case=None, flags=0, regex=None):
                 )
                 if len(pat) == 1:
                     msg += (
-                        " In addition, single character regexes will not be "
-                        "treated as literal strings when regex=True."
+                        " In addition, single character regular expressions will"
+                        "*not* be treated as literal strings when regex=True."
                     )
                 warnings.warn(msg, FutureWarning, stacklevel=3)
             regex = True

From e78017c7a924742cb459f2b20e9df71e80c927db Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Fri, 9 Oct 2020 17:13:48 -0500
Subject: [PATCH 26/30] regex=False

---
 pandas/tests/test_strings.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/tests/test_strings.py b/pandas/tests/test_strings.py
index 96cedab4ac91b..61df5d4d5fdd6 100644
--- a/pandas/tests/test_strings.py
+++ b/pandas/tests/test_strings.py
@@ -3046,7 +3046,7 @@ def test_pipe_failures(self):
 
         tm.assert_series_equal(result, exp)
 
-        result = s.str.replace("|", " ")
+        result = s.str.replace("|", " ", regex=False)
         exp = Series(["A B C"])
 
         tm.assert_series_equal(result, exp)

From e396ce592686247eb557108a5a08d0f9b918f435 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sat, 10 Oct 2020 11:10:43 -0500
Subject: [PATCH 27/30] Update

---
 doc/source/user_guide/text.rst              | 29 +++++----------------
 pandas/tests/series/methods/test_replace.py | 11 +++++---
 2 files changed, 14 insertions(+), 26 deletions(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 895f2857355e5..7792805a30c16 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -269,31 +269,14 @@ i.e., from the end of the string to the beginning of the string:
 
 Some caution must be taken when dealing with regular expressions! The current behavior
 is to treat single character patterns as literal strings, even when ``regex`` is set
-to ``True``. (This behavior is deprecated and will be removed in a future version so
-that the ``regex`` keyword is always respected.) For example, the following code will
-cause trouble because of the regular expression meaning of ``$``:
+to ``True``. This behavior is deprecated and will be removed in a future version so
+that the ``regex`` keyword is always respected.
 
-.. ipython:: python
-
-   # Consider the following badly formatted financial data
-   dollars = pd.Series(["12", "-$10", "$10,000"], dtype="string")
-
-   # Here $ is treated as a literal character
-   dollars.str.replace("$", "", regex=True)
-
-   # But here it is not
-   dollars.str.replace("-$", "-", regex=True)
-
-   # We need to escape the special character (for >1 len patterns)
-   dollars.str.replace(r"-\$", "-", regex=True)
-
-   # Or set regex equal to False
-   dollars.str.replace("-$", "-", regex=False)
+.. versionchanged:: 1.2.0
 
-If you do want literal replacement of a string (equivalent to
-:meth:`str.replace`), you can set the optional ``regex`` parameter to
-``False``, rather than escaping each character. In this case both ``pat``
-and ``repl`` must be strings:
+If you want literal replacement of a string (equivalent to :meth:`str.replace`), you
+can set the optional ``regex`` parameter to ``False``, rather than escaping each
+character. In this case both ``pat`` and ``repl`` must be strings:
 
 .. ipython:: python
 
diff --git a/pandas/tests/series/methods/test_replace.py b/pandas/tests/series/methods/test_replace.py
index 7bc7993b38a22..a52cb7e46f434 100644
--- a/pandas/tests/series/methods/test_replace.py
+++ b/pandas/tests/series/methods/test_replace.py
@@ -450,8 +450,13 @@ def test_replace_with_compiled_regex(self):
         expected = pd.Series(["z", "b", "c"])
         tm.assert_series_equal(result, expected)
 
-    def test_str_replace_regex_default_raises_warning(self):
+    @pytest.mark.parametrize("pattern", ["^.$", "."])
+    def test_str_replace_regex_default_raises_warning(self, pattern):
         # https://github.com/pandas-dev/pandas/pull/24809
         s = pd.Series(["a", "b", "c"])
-        with tm.assert_produces_warning(FutureWarning, check_stacklevel=False):
-            s.str.replace("^.$", "")
+        msg = r"The default value of regex will change from True to False.*"
+        if len(pattern) == 1:
+            msg += r".*single character regular expressions.*not.*literal strings"
+        with tm.assert_produces_warning(FutureWarning, check_stacklevel=False) as w:
+            s.str.replace(pattern, "")
+            assert re.match(msg, str(w[0].message))

From e799b12fc1aaaf8a8575d6ec3b7eb790cb352056 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sat, 10 Oct 2020 11:20:49 -0500
Subject: [PATCH 28/30] fix

---
 pandas/tests/series/methods/test_replace.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pandas/tests/series/methods/test_replace.py b/pandas/tests/series/methods/test_replace.py
index a52cb7e46f434..79d6fc22aba97 100644
--- a/pandas/tests/series/methods/test_replace.py
+++ b/pandas/tests/series/methods/test_replace.py
@@ -454,7 +454,7 @@ def test_replace_with_compiled_regex(self):
     def test_str_replace_regex_default_raises_warning(self, pattern):
         # https://github.com/pandas-dev/pandas/pull/24809
         s = pd.Series(["a", "b", "c"])
-        msg = r"The default value of regex will change from True to False.*"
+        msg = r"The default value of regex will change from True to False"
         if len(pattern) == 1:
             msg += r".*single character regular expressions.*not.*literal strings"
         with tm.assert_produces_warning(FutureWarning, check_stacklevel=False) as w:

From 9f7545f1af471baf73aec99023240db4dbfbc4c2 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sat, 10 Oct 2020 15:45:08 -0500
Subject: [PATCH 29/30] rst fix

---
 doc/source/user_guide/text.rst | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 7792805a30c16..0b1ff69079d6d 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -280,6 +280,8 @@ character. In this case both ``pat`` and ``repl`` must be strings:
 
 .. ipython:: python
 
+    dollars = pd.Series(["12", "-$10", "$10,000"], dtype="string")
+
     # These lines are equivalent
     dollars.str.replace(r"-\$", "-", regex=True)
     dollars.str.replace("-$", "-", regex=False)

From 8a4a83358c86b005d3f0d2c189cff83d5cb695c4 Mon Sep 17 00:00:00 2001
From: Daniel Saxton <dsaxton@pm.me>
Date: Sat, 10 Oct 2020 15:49:43 -0500
Subject: [PATCH 30/30] Make a warning

---
 doc/source/user_guide/text.rst | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/doc/source/user_guide/text.rst b/doc/source/user_guide/text.rst
index 0b1ff69079d6d..9dd4fb68ae26a 100644
--- a/doc/source/user_guide/text.rst
+++ b/doc/source/user_guide/text.rst
@@ -267,10 +267,12 @@ i.e., from the end of the string to the beginning of the string:
    s3
    s3.str.replace("^.a|dog", "XX-XX ", case=False, regex=True)
 
-Some caution must be taken when dealing with regular expressions! The current behavior
-is to treat single character patterns as literal strings, even when ``regex`` is set
-to ``True``. This behavior is deprecated and will be removed in a future version so
-that the ``regex`` keyword is always respected.
+.. warning::
+
+    Some caution must be taken when dealing with regular expressions! The current behavior
+    is to treat single character patterns as literal strings, even when ``regex`` is set
+    to ``True``. This behavior is deprecated and will be removed in a future version so
+    that the ``regex`` keyword is always respected.
 
 .. versionchanged:: 1.2.0