From 9fe8f5b4454bc5dd2c8a0a0daa09452077cfa9a2 Mon Sep 17 00:00:00 2001
From: amunger <aamunger@microsoft.com>
Date: Tue, 10 Sep 2024 10:00:10 -0700
Subject: [PATCH 1/3] use pydevd safeRepr

---
 .../vscodeGetVariablesForProvider.py          | 416 +++++++++++++++++-
 1 file changed, 398 insertions(+), 18 deletions(-)

diff --git a/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py b/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
index f83fe015638..57540f935ff 100644
--- a/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
+++ b/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
@@ -1,21 +1,401 @@
-# Query Jupyter server for the info about a dataframe
+# Copyright (c) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License. See LICENSE in the project root
+# for license information.
+
+# Taken from ptvsd to support the format expected there.
+import sys
+import locale
 from collections import namedtuple
 from importlib.util import find_spec
 import json
 
-maxStringLength = 1000
-collectionTypes = ["list", "tuple", "set"]
-arrayPageSize = 50
+# The pydevd SafeRepr class used in ptvsd/debugpy
+class SafeRepr(object):
+    # Can be used to override the encoding from locale.getpreferredencoding()
+    locale_preferred_encoding = None
+
+    # Can be used to override the encoding used for sys.stdout.encoding
+    sys_stdout_encoding = None
+
+    # String types are truncated to maxstring_outer when at the outer-
+    # most level, and truncated to maxstring_inner characters inside
+    # collections.
+    maxstring_outer = 2 ** 16
+    maxstring_inner = 128
+    string_types = (str, bytes)
+    bytes = bytes
+    set_info = (set, '{', '}', False)
+    frozenset_info = (frozenset, 'frozenset({', '})', False)
+    int_types = (int,)
+    long_iter_types = (list, tuple, bytearray, range,
+                       dict, set, frozenset)
+
+    # Collection types are recursively iterated for each limit in
+    # maxcollection.
+    maxcollection = (60, 20)
+
+    # Specifies type, prefix string, suffix string, and whether to include a
+    # comma if there is only one element. (Using a sequence rather than a
+    # mapping because we use isinstance() to determine the matching type.)
+    collection_types = [
+        (tuple, '(', ')', True),
+        (list, '[', ']', False),
+        frozenset_info,
+        set_info,
+    ]
+    try:
+        from collections import deque
+        collection_types.append((deque, 'deque([', '])', False))
+    except Exception:
+        pass
+
+    # type, prefix string, suffix string, item prefix string,
+    # item key/value separator, item suffix string
+    dict_types = [(dict, '{', '}', '', ': ', '')]
+    try:
+        from collections import OrderedDict
+        dict_types.append((OrderedDict, 'OrderedDict([', '])', '(', ', ', ')'))
+    except Exception:
+        pass
+
+    # All other types are treated identically to strings, but using
+    # different limits.
+    maxother_outer = 2 ** 16
+    maxother_inner = 128
+
+    convert_to_hex = False
+    raw_value = False
+
+    def __call__(self, obj):
+        '''
+        :param object obj:
+            The object for which we want a representation.
+
+        :return str:
+            Returns bytes encoded as utf-8 on py2 and str on py3.
+        '''
+        try:
+            return ''.join(self._repr(obj, 0))
+        except Exception:
+            try:
+                return 'An exception was raised: %r' % sys.exc_info()[1]
+            except Exception:
+                return 'An exception was raised'
 
+    def _repr(self, obj, level):
+        '''Returns an iterable of the parts in the final repr string.'''
 
-def truncateString(variable):
-    string = repr(variable)
-    if len(string) > maxStringLength:
-        sizeInfo = "\n\nLength: " + str(len(variable)) if type(variable) == str else ""
-        return string[: maxStringLength - 1] + "..." + sizeInfo
-    else:
-        return string
+        try:
+            obj_repr = type(obj).__repr__
+        except Exception:
+            obj_repr = None
+
+        def has_obj_repr(t):
+            r = t.__repr__
+            try:
+                return obj_repr == r
+            except Exception:
+                return obj_repr is r
+
+        for t, prefix, suffix, comma in self.collection_types:
+            if isinstance(obj, t) and has_obj_repr(t):
+                return self._repr_iter(obj, level, prefix, suffix, comma)
+
+        for t, prefix, suffix, item_prefix, item_sep, item_suffix in self.dict_types:  # noqa
+            if isinstance(obj, t) and has_obj_repr(t):
+                return self._repr_dict(obj, level, prefix, suffix,
+                                       item_prefix, item_sep, item_suffix)
+
+        for t in self.string_types:
+            if isinstance(obj, t) and has_obj_repr(t):
+                return self._repr_str(obj, level)
+
+        if self._is_long_iter(obj):
+            return self._repr_long_iter(obj)
+
+        return self._repr_other(obj, level)
+
+    # Determines whether an iterable exceeds the limits set in
+    # maxcollection, and is therefore unsafe to repr().
+    def _is_long_iter(self, obj, level=0):
+        try:
+            # Strings have their own limits (and do not nest). Because
+            # they don't have __iter__ in 2.x, this check goes before
+            # the next one.
+            if isinstance(obj, self.string_types):
+                return len(obj) > self.maxstring_inner
+
+            # If it's not an iterable (and not a string), it's fine.
+            if not hasattr(obj, '__iter__'):
+                return False
+
+            # If it's not an instance of these collection types then it
+            # is fine. Note: this is a fix for
+            # https://github.com/Microsoft/ptvsd/issues/406
+            if not isinstance(obj, self.long_iter_types):
+                return False
+
+            # Iterable is its own iterator - this is a one-off iterable
+            # like generator or enumerate(). We can't really count that,
+            # but repr() for these should not include any elements anyway,
+            # so we can treat it the same as non-iterables.
+            if obj is iter(obj):
+                return False
+
+            # range reprs fine regardless of length.
+            if isinstance(obj, range):
+                return False
+
+            # numpy and scipy collections (ndarray etc) have
+            # self-truncating repr, so they're always safe.
+            try:
+                module = type(obj).__module__.partition('.')[0]
+                if module in ('numpy', 'scipy'):
+                    return False
+            except Exception:
+                pass
+
+            # Iterables that nest too deep are considered long.
+            if level >= len(self.maxcollection):
+                return True
+
+            # It is too long if the length exceeds the limit, or any
+            # of its elements are long iterables.
+            if hasattr(obj, '__len__'):
+                try:
+                    size = len(obj)
+                except Exception:
+                    size = None
+                if size is not None and size > self.maxcollection[level]:
+                    return True
+                return any((self._is_long_iter(item, level + 1) for item in obj))  # noqa
+            return any(i > self.maxcollection[level] or self._is_long_iter(item, level + 1) for i, item in enumerate(obj))  # noqa
+
+        except Exception:
+            # If anything breaks, assume the worst case.
+            return True
+
+    def _repr_iter(self, obj, level, prefix, suffix,
+                   comma_after_single_element=False):
+        yield prefix
+
+        if level >= len(self.maxcollection):
+            yield '...'
+        else:
+            count = self.maxcollection[level]
+            yield_comma = False
+            for item in obj:
+                if yield_comma:
+                    yield ', '
+                yield_comma = True
+
+                count -= 1
+                if count <= 0:
+                    yield '...'
+                    break
+
+                for p in self._repr(item, 100 if item is obj else level + 1):
+                    yield p
+            else:
+                if comma_after_single_element:
+                    if count == self.maxcollection[level] - 1:
+                        yield ','
+        yield suffix
+
+    def _repr_long_iter(self, obj):
+        try:
+            length = hex(len(obj)) if self.convert_to_hex else len(obj)
+            obj_repr = '<%s, len() = %s>' % (type(obj).__name__, length)
+        except Exception:
+            try:
+                obj_repr = '<' + type(obj).__name__ + '>'
+            except Exception:
+                obj_repr = '<no repr available for object>'
+        yield obj_repr
+
+    def _repr_dict(self, obj, level, prefix, suffix,
+                   item_prefix, item_sep, item_suffix):
+        if not obj:
+            yield prefix + suffix
+            return
+        if level >= len(self.maxcollection):
+            yield prefix + '...' + suffix
+            return
+
+        yield prefix
+
+        count = self.maxcollection[level]
+        yield_comma = False
+
+
+        obj_keys = list(obj)
+
+        for key in obj_keys:
+            if yield_comma:
+                yield ', '
+            yield_comma = True
+
+            count -= 1
+            if count <= 0:
+                yield '...'
+                break
+
+            yield item_prefix
+            for p in self._repr(key, level + 1):
+                yield p
+
+            yield item_sep
+
+            try:
+                item = obj[key]
+            except Exception:
+                yield '<?>'
+            else:
+                for p in self._repr(item, 100 if item is obj else level + 1):
+                    yield p
+            yield item_suffix
 
+        yield suffix
+
+    def _repr_str(self, obj, level):
+        try:
+            if self.raw_value:
+                # For raw value retrieval, ignore all limits.
+                if isinstance(obj, bytes):
+                    yield obj.decode('latin-1')
+                else:
+                    yield obj
+                return
+
+            limit_inner = self.maxother_inner
+            limit_outer = self.maxother_outer
+            limit = limit_inner if level > 0 else limit_outer
+            if len(obj) <= limit:
+                # Note that we check the limit before doing the repr (so, the final string
+                # may actually be considerably bigger on some cases, as besides
+                # the additional u, b, ' chars, some chars may be escaped in repr, so
+                # even a single char such as \U0010ffff may end up adding more
+                # chars than expected).
+                yield self._convert_to_unicode_or_bytes_repr(repr(obj))
+                return
+
+            # Slightly imprecise calculations - we may end up with a string that is
+            # up to 6 characters longer than limit. If you need precise formatting,
+            # you are using the wrong class.
+            left_count, right_count = max(1, int(2 * limit / 3)), max(1, int(limit / 3))  # noqa
+
+            # Important: only do repr after slicing to avoid duplicating a byte array that could be
+            # huge.
+
+            # Note: we don't deal with high surrogates here because we're not dealing with the
+            # repr() of a random object.
+            # i.e.: A high surrogate unicode char may be split on Py2, but as we do a `repr`
+            # afterwards, that's ok.
+
+            # Also, we just show the unicode/string/bytes repr() directly to make clear what the
+            # input type was (so, on py2 a unicode would start with u' and on py3 a bytes would
+            # start with b').
+
+            part1 = obj[:left_count]
+            part1 = repr(part1)
+            part1 = part1[:part1.rindex("'")]  # Remove the last '
+
+            part2 = obj[-right_count:]
+            part2 = repr(part2)
+            part2 = part2[part2.index("'") + 1:]  # Remove the first ' (and possibly u or b).
+
+            yield part1
+            yield '...'
+            yield part2
+        except:
+            # This shouldn't really happen, but let's play it safe.
+            #exception('Error getting string representation to show.')
+            for part in self._repr_obj(obj, level,
+                                  self.maxother_inner, self.maxother_outer):
+                yield part
+
+    def _repr_other(self, obj, level):
+        return self._repr_obj(obj, level,
+                              self.maxother_inner, self.maxother_outer)
+
+    def _repr_obj(self, obj, level, limit_inner, limit_outer):
+        try:
+            if self.raw_value:
+                # For raw value retrieval, ignore all limits.
+                if isinstance(obj, bytes):
+                    yield obj.decode('latin-1')
+                    return
+
+                try:
+                    mv = memoryview(obj)
+                except Exception:
+                    yield self._convert_to_unicode_or_bytes_repr(repr(obj))
+                    return
+                else:
+                    # Map bytes to Unicode codepoints with same values.
+                    yield mv.tobytes().decode('latin-1')
+                    return
+            elif self.convert_to_hex and isinstance(obj, self.int_types):
+                obj_repr = hex(obj)
+            else:
+                obj_repr = repr(obj)
+        except Exception:
+            try:
+                obj_repr = object.__repr__(obj)
+            except Exception:
+                try:
+                    obj_repr = '<no repr available for ' + type(obj).__name__ + '>'  # noqa
+                except Exception:
+                    obj_repr = '<no repr available for object>'
+
+        limit = limit_inner if level > 0 else limit_outer
+
+        if limit >= len(obj_repr):
+            yield self._convert_to_unicode_or_bytes_repr(obj_repr)
+            return
+
+        # Slightly imprecise calculations - we may end up with a string that is
+        # up to 3 characters longer than limit. If you need precise formatting,
+        # you are using the wrong class.
+        left_count, right_count = max(1, int(2 * limit / 3)), max(1, int(limit / 3))  # noqa
+
+        yield obj_repr[:left_count]
+        yield '...'
+        yield obj_repr[-right_count:]
+
+    def _convert_to_unicode_or_bytes_repr(self, obj_repr):
+        return obj_repr
+
+    def _bytes_as_unicode_if_possible(self, obj_repr):
+        # We try to decode with 3 possible encoding (sys.stdout.encoding,
+        # locale.getpreferredencoding() and 'utf-8). If no encoding can decode
+        # the input, we return the original bytes.
+        try_encodings = []
+        encoding = self.sys_stdout_encoding or getattr(sys.stdout, 'encoding', '')
+        if encoding:
+            try_encodings.append(encoding.lower())
+
+        preferred_encoding = self.locale_preferred_encoding or locale.getpreferredencoding()
+        if preferred_encoding:
+            preferred_encoding = preferred_encoding.lower()
+            if preferred_encoding not in try_encodings:
+                try_encodings.append(preferred_encoding)
+
+        if 'utf-8' not in try_encodings:
+            try_encodings.append('utf-8')
+
+        for encoding in try_encodings:
+            try:
+                return obj_repr.decode(encoding)
+            except UnicodeDecodeError:
+                pass
+
+        return obj_repr  # Return the original version (in bytes)
+
+safeRepr = SafeRepr()
+maxStringLength = 1000
+collectionTypes = ["list", "tuple", "set"]
+arrayPageSize = 50
 
 DisplayOptions = namedtuple("DisplayOptions", ["width", "max_columns"])
 
@@ -23,7 +403,7 @@ def truncateString(variable):
 def set_pandas_display_options(display_options=None):
     if find_spec("pandas") is not None:
         try:
-            import pandas as _VSCODE_PD
+            import pandas as _VSCODE_PD # type: ignore
 
             original_display = DisplayOptions(
                 width=_VSCODE_PD.options.display.width,
@@ -50,7 +430,7 @@ def getValue(variable):
         original_display = set_pandas_display_options()
 
     try:
-        return truncateString(variable=variable)
+        return safeRepr(variable)
     finally:
         if original_display:
             set_pandas_display_options(original_display)
@@ -91,7 +471,7 @@ def getVariableDescription(variable):
     if hasattr(variable, "__len__") and result["type"] in collectionTypes:
         result["count"] = len(variable)
 
-    result["hasNamedChildren"] = hasattr(variable, "__dict__") or type(variable) == dict
+    result["hasNamedChildren"] = hasattr(variable, "__dict__") or isinstance(variable, dict)
 
     result["value"] = getValue(variable)
     return result
@@ -101,16 +481,16 @@ def getChildProperty(root, propertyChain):
     try:
         variable = root
         for property in propertyChain:
-            if type(property) == int:
+            if isinstance(property,int):
                 if hasattr(variable, "__getitem__"):
                     variable = variable[property]
-                elif type(variable) == set:
+                elif isinstance(variable, set):
                     variable = list(variable)[property]
                 else:
                     return None
             elif hasattr(variable, property):
                 variable = getattr(variable, property)
-            elif type(variable) == dict and property in variable:
+            elif isinstance(variable, dict) and property in variable:
                 variable = variable[property]
             else:
                 return None
@@ -168,7 +548,7 @@ def _VSCODE_getAllChildrenDescriptions(rootVarName, propertyChain, startIndex):
         childrenNames = []
         if hasattr(parent, "__dict__"):
             childrenNames = getPropertyNames(parent)
-        elif type(parent) == dict:
+        elif isinstance(parent, dict):
             childrenNames = list(parent.keys())
 
         children = []

From 1cfda9e6c5935b377e5989f1d557a2903eb28e6b Mon Sep 17 00:00:00 2001
From: amunger <aamunger@microsoft.com>
Date: Tue, 10 Sep 2024 10:11:08 -0700
Subject: [PATCH 2/3] lint fix

---
 .../vscodeGetVariablesForProvider.py          | 134 ++++++++++--------
 1 file changed, 73 insertions(+), 61 deletions(-)

diff --git a/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py b/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
index 57540f935ff..6ea7a0b75b2 100644
--- a/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
+++ b/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
@@ -9,6 +9,7 @@
 from importlib.util import find_spec
 import json
 
+
 # The pydevd SafeRepr class used in ptvsd/debugpy
 class SafeRepr(object):
     # Can be used to override the encoding from locale.getpreferredencoding()
@@ -20,15 +21,14 @@ class SafeRepr(object):
     # String types are truncated to maxstring_outer when at the outer-
     # most level, and truncated to maxstring_inner characters inside
     # collections.
-    maxstring_outer = 2 ** 16
+    maxstring_outer = 2**16
     maxstring_inner = 128
     string_types = (str, bytes)
     bytes = bytes
-    set_info = (set, '{', '}', False)
-    frozenset_info = (frozenset, 'frozenset({', '})', False)
+    set_info = (set, "{", "}", False)
+    frozenset_info = (frozenset, "frozenset({", "})", False)
     int_types = (int,)
-    long_iter_types = (list, tuple, bytearray, range,
-                       dict, set, frozenset)
+    long_iter_types = (list, tuple, bytearray, range, dict, set, frozenset)
 
     # Collection types are recursively iterated for each limit in
     # maxcollection.
@@ -38,52 +38,54 @@ class SafeRepr(object):
     # comma if there is only one element. (Using a sequence rather than a
     # mapping because we use isinstance() to determine the matching type.)
     collection_types = [
-        (tuple, '(', ')', True),
-        (list, '[', ']', False),
+        (tuple, "(", ")", True),
+        (list, "[", "]", False),
         frozenset_info,
         set_info,
     ]
     try:
         from collections import deque
-        collection_types.append((deque, 'deque([', '])', False))
+
+        collection_types.append((deque, "deque([", "])", False))
     except Exception:
         pass
 
     # type, prefix string, suffix string, item prefix string,
     # item key/value separator, item suffix string
-    dict_types = [(dict, '{', '}', '', ': ', '')]
+    dict_types = [(dict, "{", "}", "", ": ", "")]
     try:
         from collections import OrderedDict
-        dict_types.append((OrderedDict, 'OrderedDict([', '])', '(', ', ', ')'))
+
+        dict_types.append((OrderedDict, "OrderedDict([", "])", "(", ", ", ")"))
     except Exception:
         pass
 
     # All other types are treated identically to strings, but using
     # different limits.
-    maxother_outer = 2 ** 16
+    maxother_outer = 2**16
     maxother_inner = 128
 
     convert_to_hex = False
     raw_value = False
 
     def __call__(self, obj):
-        '''
+        """
         :param object obj:
             The object for which we want a representation.
 
         :return str:
             Returns bytes encoded as utf-8 on py2 and str on py3.
-        '''
+        """
         try:
-            return ''.join(self._repr(obj, 0))
+            return "".join(self._repr(obj, 0))
         except Exception:
             try:
-                return 'An exception was raised: %r' % sys.exc_info()[1]
+                return "An exception was raised: %r" % sys.exc_info()[1]
             except Exception:
-                return 'An exception was raised'
+                return "An exception was raised"
 
     def _repr(self, obj, level):
-        '''Returns an iterable of the parts in the final repr string.'''
+        """Returns an iterable of the parts in the final repr string."""
 
         try:
             obj_repr = type(obj).__repr__
@@ -103,8 +105,9 @@ def has_obj_repr(t):
 
         for t, prefix, suffix, item_prefix, item_sep, item_suffix in self.dict_types:  # noqa
             if isinstance(obj, t) and has_obj_repr(t):
-                return self._repr_dict(obj, level, prefix, suffix,
-                                       item_prefix, item_sep, item_suffix)
+                return self._repr_dict(
+                    obj, level, prefix, suffix, item_prefix, item_sep, item_suffix
+                )
 
         for t in self.string_types:
             if isinstance(obj, t) and has_obj_repr(t):
@@ -126,7 +129,7 @@ def _is_long_iter(self, obj, level=0):
                 return len(obj) > self.maxstring_inner
 
             # If it's not an iterable (and not a string), it's fine.
-            if not hasattr(obj, '__iter__'):
+            if not hasattr(obj, "__iter__"):
                 return False
 
             # If it's not an instance of these collection types then it
@@ -149,8 +152,8 @@ def _is_long_iter(self, obj, level=0):
             # numpy and scipy collections (ndarray etc) have
             # self-truncating repr, so they're always safe.
             try:
-                module = type(obj).__module__.partition('.')[0]
-                if module in ('numpy', 'scipy'):
+                module = type(obj).__module__.partition(".")[0]
+                if module in ("numpy", "scipy"):
                     return False
             except Exception:
                 pass
@@ -161,7 +164,7 @@ def _is_long_iter(self, obj, level=0):
 
             # It is too long if the length exceeds the limit, or any
             # of its elements are long iterables.
-            if hasattr(obj, '__len__'):
+            if hasattr(obj, "__len__"):
                 try:
                     size = len(obj)
                 except Exception:
@@ -169,29 +172,31 @@ def _is_long_iter(self, obj, level=0):
                 if size is not None and size > self.maxcollection[level]:
                     return True
                 return any((self._is_long_iter(item, level + 1) for item in obj))  # noqa
-            return any(i > self.maxcollection[level] or self._is_long_iter(item, level + 1) for i, item in enumerate(obj))  # noqa
+            return any(
+                i > self.maxcollection[level] or self._is_long_iter(item, level + 1)
+                for i, item in enumerate(obj)
+            )  # noqa
 
         except Exception:
             # If anything breaks, assume the worst case.
             return True
 
-    def _repr_iter(self, obj, level, prefix, suffix,
-                   comma_after_single_element=False):
+    def _repr_iter(self, obj, level, prefix, suffix, comma_after_single_element=False):
         yield prefix
 
         if level >= len(self.maxcollection):
-            yield '...'
+            yield "..."
         else:
             count = self.maxcollection[level]
             yield_comma = False
             for item in obj:
                 if yield_comma:
-                    yield ', '
+                    yield ", "
                 yield_comma = True
 
                 count -= 1
                 if count <= 0:
-                    yield '...'
+                    yield "..."
                     break
 
                 for p in self._repr(item, 100 if item is obj else level + 1):
@@ -199,27 +204,28 @@ def _repr_iter(self, obj, level, prefix, suffix,
             else:
                 if comma_after_single_element:
                     if count == self.maxcollection[level] - 1:
-                        yield ','
+                        yield ","
         yield suffix
 
     def _repr_long_iter(self, obj):
         try:
             length = hex(len(obj)) if self.convert_to_hex else len(obj)
-            obj_repr = '<%s, len() = %s>' % (type(obj).__name__, length)
+            obj_repr = "<%s, len() = %s>" % (type(obj).__name__, length)
         except Exception:
             try:
-                obj_repr = '<' + type(obj).__name__ + '>'
+                obj_repr = "<" + type(obj).__name__ + ">"
             except Exception:
-                obj_repr = '<no repr available for object>'
+                obj_repr = "<no repr available for object>"
         yield obj_repr
 
-    def _repr_dict(self, obj, level, prefix, suffix,
-                   item_prefix, item_sep, item_suffix):
+    def _repr_dict(
+        self, obj, level, prefix, suffix, item_prefix, item_sep, item_suffix
+    ):
         if not obj:
             yield prefix + suffix
             return
         if level >= len(self.maxcollection):
-            yield prefix + '...' + suffix
+            yield prefix + "..." + suffix
             return
 
         yield prefix
@@ -227,17 +233,16 @@ def _repr_dict(self, obj, level, prefix, suffix,
         count = self.maxcollection[level]
         yield_comma = False
 
-
         obj_keys = list(obj)
 
         for key in obj_keys:
             if yield_comma:
-                yield ', '
+                yield ", "
             yield_comma = True
 
             count -= 1
             if count <= 0:
-                yield '...'
+                yield "..."
                 break
 
             yield item_prefix
@@ -249,7 +254,7 @@ def _repr_dict(self, obj, level, prefix, suffix,
             try:
                 item = obj[key]
             except Exception:
-                yield '<?>'
+                yield "<?>"
             else:
                 for p in self._repr(item, 100 if item is obj else level + 1):
                     yield p
@@ -262,7 +267,7 @@ def _repr_str(self, obj, level):
             if self.raw_value:
                 # For raw value retrieval, ignore all limits.
                 if isinstance(obj, bytes):
-                    yield obj.decode('latin-1')
+                    yield obj.decode("latin-1")
                 else:
                     yield obj
                 return
@@ -298,32 +303,34 @@ def _repr_str(self, obj, level):
 
             part1 = obj[:left_count]
             part1 = repr(part1)
-            part1 = part1[:part1.rindex("'")]  # Remove the last '
+            part1 = part1[: part1.rindex("'")]  # Remove the last '
 
             part2 = obj[-right_count:]
             part2 = repr(part2)
-            part2 = part2[part2.index("'") + 1:]  # Remove the first ' (and possibly u or b).
+            part2 = part2[
+                part2.index("'") + 1 :
+            ]  # Remove the first ' (and possibly u or b).
 
             yield part1
-            yield '...'
+            yield "..."
             yield part2
         except:
             # This shouldn't really happen, but let's play it safe.
-            #exception('Error getting string representation to show.')
-            for part in self._repr_obj(obj, level,
-                                  self.maxother_inner, self.maxother_outer):
+            # exception('Error getting string representation to show.')
+            for part in self._repr_obj(
+                obj, level, self.maxother_inner, self.maxother_outer
+            ):
                 yield part
 
     def _repr_other(self, obj, level):
-        return self._repr_obj(obj, level,
-                              self.maxother_inner, self.maxother_outer)
+        return self._repr_obj(obj, level, self.maxother_inner, self.maxother_outer)
 
     def _repr_obj(self, obj, level, limit_inner, limit_outer):
         try:
             if self.raw_value:
                 # For raw value retrieval, ignore all limits.
                 if isinstance(obj, bytes):
-                    yield obj.decode('latin-1')
+                    yield obj.decode("latin-1")
                     return
 
                 try:
@@ -333,7 +340,7 @@ def _repr_obj(self, obj, level, limit_inner, limit_outer):
                     return
                 else:
                     # Map bytes to Unicode codepoints with same values.
-                    yield mv.tobytes().decode('latin-1')
+                    yield mv.tobytes().decode("latin-1")
                     return
             elif self.convert_to_hex and isinstance(obj, self.int_types):
                 obj_repr = hex(obj)
@@ -344,9 +351,9 @@ def _repr_obj(self, obj, level, limit_inner, limit_outer):
                 obj_repr = object.__repr__(obj)
             except Exception:
                 try:
-                    obj_repr = '<no repr available for ' + type(obj).__name__ + '>'  # noqa
+                    obj_repr = "<no repr available for " + type(obj).__name__ + ">"  # noqa
                 except Exception:
-                    obj_repr = '<no repr available for object>'
+                    obj_repr = "<no repr available for object>"
 
         limit = limit_inner if level > 0 else limit_outer
 
@@ -360,7 +367,7 @@ def _repr_obj(self, obj, level, limit_inner, limit_outer):
         left_count, right_count = max(1, int(2 * limit / 3)), max(1, int(limit / 3))  # noqa
 
         yield obj_repr[:left_count]
-        yield '...'
+        yield "..."
         yield obj_repr[-right_count:]
 
     def _convert_to_unicode_or_bytes_repr(self, obj_repr):
@@ -371,18 +378,20 @@ def _bytes_as_unicode_if_possible(self, obj_repr):
         # locale.getpreferredencoding() and 'utf-8). If no encoding can decode
         # the input, we return the original bytes.
         try_encodings = []
-        encoding = self.sys_stdout_encoding or getattr(sys.stdout, 'encoding', '')
+        encoding = self.sys_stdout_encoding or getattr(sys.stdout, "encoding", "")
         if encoding:
             try_encodings.append(encoding.lower())
 
-        preferred_encoding = self.locale_preferred_encoding or locale.getpreferredencoding()
+        preferred_encoding = (
+            self.locale_preferred_encoding or locale.getpreferredencoding()
+        )
         if preferred_encoding:
             preferred_encoding = preferred_encoding.lower()
             if preferred_encoding not in try_encodings:
                 try_encodings.append(preferred_encoding)
 
-        if 'utf-8' not in try_encodings:
-            try_encodings.append('utf-8')
+        if "utf-8" not in try_encodings:
+            try_encodings.append("utf-8")
 
         for encoding in try_encodings:
             try:
@@ -392,6 +401,7 @@ def _bytes_as_unicode_if_possible(self, obj_repr):
 
         return obj_repr  # Return the original version (in bytes)
 
+
 safeRepr = SafeRepr()
 maxStringLength = 1000
 collectionTypes = ["list", "tuple", "set"]
@@ -403,7 +413,7 @@ def _bytes_as_unicode_if_possible(self, obj_repr):
 def set_pandas_display_options(display_options=None):
     if find_spec("pandas") is not None:
         try:
-            import pandas as _VSCODE_PD # type: ignore
+            import pandas as _VSCODE_PD  # type: ignore
 
             original_display = DisplayOptions(
                 width=_VSCODE_PD.options.display.width,
@@ -471,7 +481,9 @@ def getVariableDescription(variable):
     if hasattr(variable, "__len__") and result["type"] in collectionTypes:
         result["count"] = len(variable)
 
-    result["hasNamedChildren"] = hasattr(variable, "__dict__") or isinstance(variable, dict)
+    result["hasNamedChildren"] = hasattr(variable, "__dict__") or isinstance(
+        variable, dict
+    )
 
     result["value"] = getValue(variable)
     return result
@@ -481,7 +493,7 @@ def getChildProperty(root, propertyChain):
     try:
         variable = root
         for property in propertyChain:
-            if isinstance(property,int):
+            if isinstance(property, int):
                 if hasattr(variable, "__getitem__"):
                     variable = variable[property]
                 elif isinstance(variable, set):

From d27e073e23ed472834b338b33c308430acb2ced7 Mon Sep 17 00:00:00 2001
From: amunger <aamunger@microsoft.com>
Date: Tue, 10 Sep 2024 10:29:03 -0700
Subject: [PATCH 3/3] formatted with black

---
 .../vscodeGetVariablesForProvider.py          | 25 +++++++++++++++----
 1 file changed, 20 insertions(+), 5 deletions(-)

diff --git a/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py b/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
index 6ea7a0b75b2..8313b2d917d 100644
--- a/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
+++ b/pythonFiles/vscode_datascience_helpers/getVariableInfo/vscodeGetVariablesForProvider.py
@@ -103,7 +103,14 @@ def has_obj_repr(t):
             if isinstance(obj, t) and has_obj_repr(t):
                 return self._repr_iter(obj, level, prefix, suffix, comma)
 
-        for t, prefix, suffix, item_prefix, item_sep, item_suffix in self.dict_types:  # noqa
+        for (
+            t,
+            prefix,
+            suffix,
+            item_prefix,
+            item_sep,
+            item_suffix,
+        ) in self.dict_types:  # noqa
             if isinstance(obj, t) and has_obj_repr(t):
                 return self._repr_dict(
                     obj, level, prefix, suffix, item_prefix, item_sep, item_suffix
@@ -171,7 +178,9 @@ def _is_long_iter(self, obj, level=0):
                     size = None
                 if size is not None and size > self.maxcollection[level]:
                     return True
-                return any((self._is_long_iter(item, level + 1) for item in obj))  # noqa
+                return any(
+                    (self._is_long_iter(item, level + 1) for item in obj)
+                )  # noqa
             return any(
                 i > self.maxcollection[level] or self._is_long_iter(item, level + 1)
                 for i, item in enumerate(obj)
@@ -287,7 +296,9 @@ def _repr_str(self, obj, level):
             # Slightly imprecise calculations - we may end up with a string that is
             # up to 6 characters longer than limit. If you need precise formatting,
             # you are using the wrong class.
-            left_count, right_count = max(1, int(2 * limit / 3)), max(1, int(limit / 3))  # noqa
+            left_count, right_count = max(1, int(2 * limit / 3)), max(
+                1, int(limit / 3)
+            )  # noqa
 
             # Important: only do repr after slicing to avoid duplicating a byte array that could be
             # huge.
@@ -351,7 +362,9 @@ def _repr_obj(self, obj, level, limit_inner, limit_outer):
                 obj_repr = object.__repr__(obj)
             except Exception:
                 try:
-                    obj_repr = "<no repr available for " + type(obj).__name__ + ">"  # noqa
+                    obj_repr = (
+                        "<no repr available for " + type(obj).__name__ + ">"
+                    )  # noqa
                 except Exception:
                     obj_repr = "<no repr available for object>"
 
@@ -364,7 +377,9 @@ def _repr_obj(self, obj, level, limit_inner, limit_outer):
         # Slightly imprecise calculations - we may end up with a string that is
         # up to 3 characters longer than limit. If you need precise formatting,
         # you are using the wrong class.
-        left_count, right_count = max(1, int(2 * limit / 3)), max(1, int(limit / 3))  # noqa
+        left_count, right_count = max(1, int(2 * limit / 3)), max(
+            1, int(limit / 3)
+        )  # noqa
 
         yield obj_repr[:left_count]
         yield "..."