pandas-dev · mvernooy3687 · Dec 8, 2023 · Dec 8, 2023 · Dec 8, 2023 · Dec 8, 2023
diff --git a/doc/source/whatsnew/v2.2.0.rst b/doc/source/whatsnew/v2.2.0.rst
@@ -617,6 +617,7 @@ I/O
 - Bug in :func:`read_json` not handling dtype conversion properly if ``infer_string`` is set (:issue:`56195`)
 - Bug in :meth:`DataFrame.to_excel`, with ``OdsWriter`` (``ods`` files) writing boolean/string value (:issue:`54994`)
 - Bug in :meth:`DataFrame.to_hdf` and :func:`read_hdf` with ``datetime64`` dtypes with non-nanosecond resolution failing to round-trip correctly (:issue:`55622`)
+- Bug in :meth:`DataFrame.to_json` where ``orient="split"`` would produce duplicate column names for a :class:`DataFrame` with :class:`MultiIndex` columns (:issue:`50456`)
 - Bug in :meth:`~pandas.read_excel` with ``engine="odf"`` (``ods`` files) when string contains annotation (:issue:`55200`)
 - Bug in :meth:`~pandas.read_excel` with an ODS file without cached formatted cell for float values (:issue:`55219`)
 - Bug where :meth:`DataFrame.to_json` would raise an ``OverflowError`` instead of a ``TypeError`` with unsupported NumPy types (:issue:`55403`)

diff --git a/pandas/io/json/_json.py b/pandas/io/json/_json.py
@@ -208,6 +208,16 @@ def to_json(
         indent=indent,
     ).write()
 
+    if orient == "split" and isinstance(obj, DataFrame) and isinstance(obj.columns, MultiIndex):
+        # inverse of MultiIndex.from_arrays: build one list of labels per level
+        fixed_columns = [[obj.columns[i][j] for i in range(len(obj.columns))] for j in range(len(obj.columns[0]))]
+
+        new_str = ujson_loads(s)
+
+        # replace the serialized "columns" entry with the per-level label lists
+        new_str["columns"] = fixed_columns
+        s = ujson_dumps(new_str)
+
     if lines:
         s = convert_to_line_delimits(s)
 
@@ -1396,6 +1406,8 @@ def _parse(self) -> None:
                 orig_names,
                 is_potential_multi_index(orig_names, None),
             )
+            if  is_potential_multi_index(orig_names, None):
+                decoded["columns"] = [list(tup) for tup in decoded["columns"]]
             self.obj = DataFrame(dtype=None, **decoded)
         elif orient == "index":
             self.obj = DataFrame.from_dict(

diff --git a/pandas/tests/io/json/test_pandas.py b/pandas/tests/io/json/test_pandas.py
@@ -321,10 +321,6 @@ def test_roundtrip_mixed(self, orient, convert_axes):
 
         assert_json_roundtrip_equal(result, expected, orient)
 
-    @pytest.mark.xfail(
-        reason="#50456 Column multiindex is stored and loaded differently",
-        raises=AssertionError,
-    )
     @pytest.mark.parametrize(
         "columns",
         [