diff --git a/docs/source/user-guide/common-operations/joins.rst b/docs/source/user-guide/common-operations/joins.rst
index 40d92215..b5c111af 100644
--- a/docs/source/user-guide/common-operations/joins.rst
+++ b/docs/source/user-guide/common-operations/joins.rst
@@ -101,4 +101,48 @@ the right table.
 
 .. ipython:: python
 
-    left.join(right, left_on="customer_id", right_on="id", how="anti")
\ No newline at end of file
+    left.join(right, left_on="customer_id", right_on="id", how="anti")
+
+Disambiguating Columns
+----------------------
+
+When the join key exists in both DataFrames under the same name, the result contains two columns with that name. Assign a name to each DataFrame to use as a prefix and avoid ambiguity.
+
+When you create a DataFrame with a ``name`` argument, that name is used as a prefix in ``col("name.column")`` to reference specific columns.
+
+.. ipython:: python
+
+    from datafusion import col, SessionContext
+    ctx = SessionContext()
+    left = ctx.from_pydict({"id": [1, 2]}, name="l")
+    right = ctx.from_pydict({"id": [2, 3]}, name="r")
+    joined = left.join(right, on="id")
+    joined.select(col("l.id"), col("r.id"))
+
+Note that the columns in the result appear in the same order as specified in the ``select()`` call.
+
+You can remove the duplicate column after joining. Note that ``drop()`` returns a new DataFrame (DataFusion's API is immutable).
+
+.. ipython:: python
+
+    joined.drop("r.id")
+
+Automatic Deduplication
+-----------------------
+
+Use the ``deduplicate`` argument of :py:meth:`DataFrame.join` to automatically
+drop the duplicate join column from the right DataFrame, similar to PySpark's ``on`` behavior.
+Internally, the right join columns are renamed to ``__right_<col>`` before the join and dropped from the result.
+
+.. ipython:: python
+
+    left.join(right, on="id", deduplicate=True)
+
+After deduplication, the join column (which comes from the left DataFrame) can be selected by its plain name:
+
+.. ipython:: python
+
+    # Only a single, unqualified id column is left after the join
+    joined_dedup = left.join(right, on="id", deduplicate=True)
+    joined_dedup.select("id")
+
diff --git a/python/datafusion/dataframe.py b/python/datafusion/dataframe.py
index 61cb0943..94a68a44 100644
--- a/python/datafusion/dataframe.py
+++ b/python/datafusion/dataframe.py
@@ -21,7 +21,9 @@
 
 from __future__ import annotations
 
+import uuid
 import warnings
+from dataclasses import dataclass
 from typing import (
     TYPE_CHECKING,
     Any,
@@ -44,6 +46,8 @@
 from datafusion.plan import ExecutionPlan, LogicalPlan
 from datafusion.record_batch import RecordBatchStream
 
+from .functions import coalesce, col
+
 if TYPE_CHECKING:
     import pathlib
     from typing import Callable, Sequence
@@ -57,6 +61,49 @@
 from enum import Enum
 
 
+@dataclass
+class JoinKeys:
+    """Represents the resolved join keys for a DataFrame join operation."""
+
+    on: str | Sequence[str] | None  # shared `on` key(s); None if given per side
+    left_names: list[str]  # key column names passed for the left side
+    right_names: list[str]  # right-side key names (aliases when deduplicating)
+
+
+@dataclass
+class JoinPreparation:
+    """Represents the complete preparation for a DataFrame join operation."""
+
+    join_keys: JoinKeys  # resolved key names for both sides
+    modified_right: DataFrame  # right input; keys renamed when deduplicating
+    drop_cols: list[str]  # right-side aliases to drop after the join
+
+
+def _deduplicate_right(
+    right: DataFrame, columns: Sequence[str]
+) -> tuple[DataFrame, list[str]]:
+    """Rename join columns on the right DataFrame for deduplication."""
+    existing_columns = set(right.schema().names)  # only right-side names are checked
+    modified = right
+    aliases: list[str] = []
+
+    for col_name in columns:
+        base_alias = f"__right_{col_name}"
+        alias = base_alias
+        counter = 0
+        while alias in existing_columns:  # probe suffixes until the alias is unused
+            counter += 1
+            alias = f"{base_alias}_{counter}"
+        if alias in existing_columns:  # NOTE(review): unreachable after the loop
+            alias = f"__temp_{uuid.uuid4().hex[:8]}_{col_name}"
+
+        modified = modified.with_column_renamed(col_name, alias)
+        aliases.append(alias)  # same order as `columns`
+        existing_columns.add(alias)  # reserve the alias for later iterations
+
+    return modified, aliases
+
+
 # excerpt from deltalake
 # https://github.com/apache/datafusion-python/pull/981#discussion_r1905619163
 class Compression(Enum):
@@ -678,6 +725,7 @@ def join(
         left_on: str | Sequence[str] | None = None,
         right_on: str | Sequence[str] | None = None,
         join_keys: tuple[list[str], list[str]] | None = None,
+        deduplicate: bool = False,
     ) -> DataFrame:
         """Join this :py:class:`DataFrame` with another :py:class:`DataFrame`.
 
@@ -691,13 +739,72 @@ def join(
             left_on: Join column of the left dataframe.
             right_on: Join column of the right dataframe.
             join_keys: Tuple of two lists of column names to join on. [Deprecated]
+            deduplicate: If ``True``, drop duplicate join columns from the
+                right DataFrame similar to PySpark's ``on`` behavior.
 
         Returns:
             DataFrame after join.
         """
-        # This check is to prevent breaking API changes where users prior to
-        # DF 43.0.0 would  pass the join_keys as a positional argument instead
-        # of a keyword argument.
+        join_preparation = self._prepare_join(
+            right, on, left_on, right_on, join_keys, deduplicate
+        )
+
+        result = DataFrame(
+            self.df.join(
+                join_preparation.modified_right.df,
+                how,
+                join_preparation.join_keys.left_names,
+                join_preparation.join_keys.right_names,
+            )
+        )
+
+        if (
+            deduplicate
+            and how in ("right", "full")
+            and join_preparation.join_keys.on is not None
+        ):
+            for left_name, right_alias in zip(
+                join_preparation.join_keys.left_names,
+                join_preparation.drop_cols,
+            ):
+                result = result.with_column(
+                    left_name, coalesce(col(left_name), col(right_alias))
+                )
+
+        if join_preparation.drop_cols:
+            result = result.drop(*join_preparation.drop_cols)
+
+        return result
+
+    def _prepare_join(
+        self,
+        right: DataFrame,
+        on: str | Sequence[str] | tuple[list[str], list[str]] | None,
+        left_on: str | Sequence[str] | None,
+        right_on: str | Sequence[str] | None,
+        join_keys: tuple[list[str], list[str]] | None,
+        deduplicate: bool,
+    ) -> JoinPreparation:
+        """Prepare join keys and handle deduplication if requested.
+
+        This method combines join key resolution and deduplication preparation
+        to avoid parameter handling duplication and provide a unified interface.
+
+        Args:
+            right: The right DataFrame to join with.
+            on: Column names to join on in both dataframes.
+            left_on: Join column of the left dataframe.
+            right_on: Join column of the right dataframe.
+            join_keys: Tuple of two lists of column names to join on. [Deprecated]
+            deduplicate: If True, prepare right DataFrame for column deduplication.
+
+        Returns:
+            JoinPreparation containing resolved join keys, modified right DataFrame,
+            and columns to drop after joining.
+        """
+        # Step 1: Resolve join keys
+        # Handle the special case where on is a tuple of lists (legacy format)
+        resolved_on: str | Sequence[str] | None
         if (
             isinstance(on, tuple)
             and len(on) == 2
@@ -706,7 +813,9 @@ def join(
         ):
             # We know this is safe because we've checked the types
             join_keys = on  # type: ignore[assignment]
-            on = None
+            resolved_on = None
+        else:
+            resolved_on = on  # type: ignore[assignment]
 
         if join_keys is not None:
             warnings.warn(
@@ -717,12 +826,12 @@ def join(
             left_on = join_keys[0]
             right_on = join_keys[1]
 
-        if on is not None:
+        if resolved_on is not None:
             if left_on is not None or right_on is not None:
                 error_msg = "`left_on` or `right_on` should not provided with `on`"
                 raise ValueError(error_msg)
-            left_on = on
-            right_on = on
+            left_on = resolved_on
+            right_on = resolved_on
         elif left_on is not None or right_on is not None:
             if left_on is None or right_on is None:
                 error_msg = "`left_on` and `right_on` should both be provided."
@@ -730,12 +839,35 @@ def join(
         else:
             error_msg = "either `on` or `left_on` and `right_on` should be provided."
             raise ValueError(error_msg)
-        if isinstance(left_on, str):
-            left_on = [left_on]
-        if isinstance(right_on, str):
-            right_on = [right_on]
 
-        return DataFrame(self.df.join(right.df, how, left_on, right_on))
+        # At this point, left_on and right_on are guaranteed to be non-None
+        if left_on is None or right_on is None:  # pragma: no cover - sanity check
+            msg = "join keys resolved to None"
+            raise ValueError(msg)
+
+        left_names = [left_on] if isinstance(left_on, str) else list(left_on)
+        right_names = [right_on] if isinstance(right_on, str) else list(right_on)
+
+        drop_cols: list[str] = []
+        modified_right = right
+
+        if deduplicate and resolved_on is not None:
+            on_cols = (
+                [resolved_on] if isinstance(resolved_on, str) else list(resolved_on)
+            )
+            modified_right, aliases = _deduplicate_right(right, on_cols)
+            drop_cols.extend(aliases)
+            right_names = aliases.copy()
+
+        join_keys_resolved = JoinKeys(
+            on=resolved_on, left_names=left_names, right_names=right_names
+        )
+
+        return JoinPreparation(
+            join_keys=join_keys_resolved,
+            modified_right=modified_right,
+            drop_cols=drop_cols,
+        )
 
     def join_on(
         self,
diff --git a/python/datafusion/dataframe_formatter.py b/python/datafusion/dataframe_formatter.py
index 27f00f9c..2323224b 100644
--- a/python/datafusion/dataframe_formatter.py
+++ b/python/datafusion/dataframe_formatter.py
@@ -135,9 +135,6 @@ class DataFrameHtmlFormatter:
           session
     """
 
-    # Class variable to track if styles have been loaded in the notebook
-    _styles_loaded = False
-
     def __init__(
         self,
         max_cell_length: int = 25,
@@ -260,23 +257,6 @@ def set_custom_header_builder(self, builder: Callable[[Any], str]) -> None:
         """
         self._custom_header_builder = builder
 
-    @classmethod
-    def is_styles_loaded(cls) -> bool:
-        """Check if HTML styles have been loaded in the current session.
-
-        This method is primarily intended for debugging UI rendering issues
-        related to style loading.
-
-        Returns:
-            True if styles have been loaded, False otherwise
-
-        Example:
-            >>> from datafusion.dataframe_formatter import DataFrameHtmlFormatter
-            >>> DataFrameHtmlFormatter.is_styles_loaded()
-            False
-        """
-        return cls._styles_loaded
-
     def format_html(
         self,
         batches: list,
@@ -315,18 +295,7 @@ def format_html(
         # Build HTML components
         html = []
 
-        # Only include styles and scripts if:
-        # 1. Not using shared styles, OR
-        # 2. Using shared styles but they haven't been loaded yet
-        include_styles = (
-            not self.use_shared_styles or not DataFrameHtmlFormatter._styles_loaded
-        )
-
-        if include_styles:
-            html.extend(self._build_html_header())
-            # If we're using shared styles, mark them as loaded
-            if self.use_shared_styles:
-                DataFrameHtmlFormatter._styles_loaded = True
+        html.extend(self._build_html_header())
 
         html.extend(self._build_table_container_start())
 
@@ -338,7 +307,7 @@ def format_html(
         html.append("</div>")
 
         # Add footer (JavaScript and messages)
-        if include_styles and self.enable_cell_expansion:
+        if self.enable_cell_expansion:
             html.append(self._get_javascript())
 
         # Always add truncation message if needed (independent of styles)
@@ -375,14 +344,20 @@ def format_str(
 
     def _build_html_header(self) -> list[str]:
         """Build the HTML header with CSS styles."""
-        html = []
-        html.append("<style>")
-        # Only include expandable CSS if cell expansion is enabled
-        if self.enable_cell_expansion:
-            html.append(self._get_default_css())
+        default_css = self._get_default_css() if self.enable_cell_expansion else ""
+        script = f"""
+<script>
+if (!document.getElementById('df-styles')) {{
+  const style = document.createElement('style');
+  style.id = 'df-styles';
+  style.textContent = `{default_css}`;
+  document.head.appendChild(style);
+}}
+</script>
+"""
+        html = [script]
         if self.custom_css:
-            html.append(self.custom_css)
-        html.append("</style>")
+            html.append(f"<style>{self.custom_css}</style>")
         return html
 
     def _build_table_container_start(self) -> list[str]:
@@ -570,28 +545,31 @@ def _get_default_css(self) -> str:
     def _get_javascript(self) -> str:
         """Get JavaScript code for interactive elements."""
         return """
-            <script>
-            function toggleDataFrameCellText(table_uuid, row, col) {
-                var shortText = document.getElementById(
-                    table_uuid + "-min-text-" + row + "-" + col
-                );
-                var fullText = document.getElementById(
-                    table_uuid + "-full-text-" + row + "-" + col
-                );
-                var button = event.target;
-
-                if (fullText.style.display === "none") {
-                    shortText.style.display = "none";
-                    fullText.style.display = "inline";
-                    button.textContent = "(less)";
-                } else {
-                    shortText.style.display = "inline";
-                    fullText.style.display = "none";
-                    button.textContent = "...";
-                }
-            }
-            </script>
-        """
+<script>
+if (!window.__df_formatter_js_loaded__) {
+  window.__df_formatter_js_loaded__ = true;
+  window.toggleDataFrameCellText = function (table_uuid, row, col) {
+    var shortText = document.getElementById(
+      table_uuid + "-min-text-" + row + "-" + col
+    );
+    var fullText = document.getElementById(
+      table_uuid + "-full-text-" + row + "-" + col
+    );
+    var button = event.target;
+
+    if (fullText.style.display === "none") {
+      shortText.style.display = "none";
+      fullText.style.display = "inline";
+      button.textContent = "(less)";
+    } else {
+      shortText.style.display = "inline";
+      fullText.style.display = "none";
+      button.textContent = "...";
+    }
+  };
+}
+</script>
+"""
 
 
 class FormatterManager:
@@ -712,24 +690,9 @@ def reset_formatter() -> None:
         >>> reset_formatter()  # Reset formatter to default settings
     """
     formatter = DataFrameHtmlFormatter()
-    # Reset the styles_loaded flag to ensure styles will be reloaded
-    DataFrameHtmlFormatter._styles_loaded = False
     set_formatter(formatter)
 
 
-def reset_styles_loaded_state() -> None:
-    """Reset the styles loaded state to force reloading of styles.
-
-    This can be useful when switching between notebook sessions or
-    when styles need to be refreshed.
-
-    Example:
-        >>> from datafusion.html_formatter import reset_styles_loaded_state
-        >>> reset_styles_loaded_state()  # Force styles to reload in next render
-    """
-    DataFrameHtmlFormatter._styles_loaded = False
-
-
 def _refresh_formatter_reference() -> None:
     """Refresh formatter reference in any modules using it.
 
diff --git a/python/tests/test_dataframe.py b/python/tests/test_dataframe.py
index c9ae38d8..76dcf54c 100644
--- a/python/tests/test_dataframe.py
+++ b/python/tests/test_dataframe.py
@@ -42,7 +42,6 @@
     configure_formatter,
     get_formatter,
     reset_formatter,
-    reset_styles_loaded_state,
 )
 from datafusion.expr import Window
 from pyarrow.csv import write_csv
@@ -520,6 +519,52 @@ def test_join_on():
     assert table.to_pydict() == expected
 
 
+def test_join_deduplicate():
+    ctx = SessionContext()
+
+    batch = pa.RecordBatch.from_arrays(
+        [pa.array([1, 2]), pa.array(["l1", "l2"])],
+        names=["id", "left_val"],
+    )
+    left = ctx.create_dataframe([[batch]], "l")
+
+    batch = pa.RecordBatch.from_arrays(
+        [pa.array([1, 2]), pa.array(["r1", "r2"])],
+        names=["id", "right_val"],
+    )
+    right = ctx.create_dataframe([[batch]], "r")
+
+    joined = left.join(right, on="id", deduplicate=True)  # both sides share "id"
+    joined = joined.sort(column("id"))  # sort for a deterministic row order
+    table = pa.Table.from_batches(joined.collect())
+
+    expected = {"id": [1, 2], "right_val": ["r1", "r2"], "left_val": ["l1", "l2"]}
+    assert table.to_pydict() == expected  # dict equality: column order unchecked
+
+
+def test_join_deduplicate_multi():
+    ctx = SessionContext()
+
+    batch = pa.RecordBatch.from_arrays(
+        [pa.array([1, 2]), pa.array([3, 4]), pa.array(["x", "y"])],
+        names=["a", "b", "l"],
+    )
+    left = ctx.create_dataframe([[batch]], "l")
+
+    batch = pa.RecordBatch.from_arrays(
+        [pa.array([1, 2]), pa.array([3, 4]), pa.array(["u", "v"])],
+        names=["a", "b", "r"],
+    )
+    right = ctx.create_dataframe([[batch]], "r")
+
+    joined = left.join(right, on=["a", "b"], deduplicate=True)  # two shared keys
+    joined = joined.sort(column("a"), column("b"))  # deterministic row order
+    table = pa.Table.from_batches(joined.collect())
+
+    expected = {"a": [1, 2], "b": [3, 4], "r": ["u", "v"], "l": ["x", "y"]}
+    assert table.to_pydict() == expected  # dict equality: column order unchecked
+
+
 def test_distinct():
     ctx = SessionContext()
 
@@ -2177,27 +2222,15 @@ def test_html_formatter_shared_styles(df, clean_formatter_state):
     # First, ensure we're using shared styles
     configure_formatter(use_shared_styles=True)
 
-    # Get HTML output for first table - should include styles
     html_first = df._repr_html_()
-
-    # Verify styles are included in first render
-    assert "<style>" in html_first
-    assert ".expandable-container" in html_first
-
-    # Get HTML output for second table - should NOT include styles
     html_second = df._repr_html_()
 
-    # Verify styles are NOT included in second render
+    assert "<script>" in html_first
+    assert "df-styles" in html_first
+    assert "<script>" in html_second
+    assert "df-styles" in html_second
+    assert "<style>" not in html_first
     assert "<style>" not in html_second
-    assert ".expandable-container" not in html_second
-
-    # Reset the styles loaded state and verify styles are included again
-    reset_styles_loaded_state()
-    html_after_reset = df._repr_html_()
-
-    # Verify styles are included after reset
-    assert "<style>" in html_after_reset
-    assert ".expandable-container" in html_after_reset
 
 
 def test_html_formatter_no_shared_styles(df, clean_formatter_state):
@@ -2206,15 +2239,15 @@ def test_html_formatter_no_shared_styles(df, clean_formatter_state):
     # Configure formatter to NOT use shared styles
     configure_formatter(use_shared_styles=False)
 
-    # Generate HTML multiple times
     html_first = df._repr_html_()
     html_second = df._repr_html_()
 
-    # Verify styles are included in both renders
-    assert "<style>" in html_first
-    assert "<style>" in html_second
-    assert ".expandable-container" in html_first
-    assert ".expandable-container" in html_second
+    assert "<script>" in html_first
+    assert "<script>" in html_second
+    assert "df-styles" in html_first
+    assert "df-styles" in html_second
+    assert "<style>" not in html_first
+    assert "<style>" not in html_second
 
 
 def test_html_formatter_manual_format_html(clean_formatter_state):
@@ -2228,20 +2261,15 @@ def test_html_formatter_manual_format_html(clean_formatter_state):
 
     formatter = get_formatter()
 
-    # First call should include styles
     html_first = formatter.format_html([batch], batch.schema)
-    assert "<style>" in html_first
-
-    # Second call should not include styles (using shared styles by default)
     html_second = formatter.format_html([batch], batch.schema)
-    assert "<style>" not in html_second
-
-    # Reset loaded state
-    reset_styles_loaded_state()
 
-    # After reset, styles should be included again
-    html_reset = formatter.format_html([batch], batch.schema)
-    assert "<style>" in html_reset
+    assert "<script>" in html_first
+    assert "<script>" in html_second
+    assert "df-styles" in html_first
+    assert "df-styles" in html_second
+    assert "<style>" not in html_first
+    assert "<style>" not in html_second
 
     # Create a new formatter with shared_styles=False
     local_formatter = DataFrameHtmlFormatter(use_shared_styles=False)
@@ -2250,8 +2278,12 @@ def test_html_formatter_manual_format_html(clean_formatter_state):
     local_html_1 = local_formatter.format_html([batch], batch.schema)
     local_html_2 = local_formatter.format_html([batch], batch.schema)
 
-    assert "<style>" in local_html_1
-    assert "<style>" in local_html_2
+    assert "<script>" in local_html_1
+    assert "<script>" in local_html_2
+    assert "df-styles" in local_html_1
+    assert "df-styles" in local_html_2
+    assert "<style>" not in local_html_1
+    assert "<style>" not in local_html_2
 
 
 def test_fill_null_basic(null_df):
@@ -2603,3 +2635,142 @@ def trigger_interrupt():
 
     # Make sure the interrupt thread has finished
     interrupt_thread.join(timeout=1.0)
+
+
+def test_join_deduplicate_select():
+    """Test that select works correctly after a deduplicated join."""
+    ctx = SessionContext()
+
+    left_df = ctx.from_pydict({"id": [1, 2, 3], "name": ["Alice", "Bob", "Charlie"]})
+    right_df = ctx.from_pydict(
+        {"id": [2, 3, 4], "city": ["New York", "London", "Paris"]}
+    )
+
+    # Join and select the id column to confirm it works
+    joined_df = left_df.join(right_df, on="id", deduplicate=True)
+    selected_df = joined_df.select(column("id"))
+    result = selected_df.collect()[0]  # NOTE(review): assumes a single batch
+
+    # Should have only the matching ids (2, 3)
+    expected_ids = [2, 3]  # NOTE(review): result is unsorted; order is assumed
+    assert result.column(0).to_pylist() == expected_ids
+
+    # Also test selecting multiple columns
+    multi_select_df = joined_df.select(column("id"), column("name"), column("city"))
+    multi_result = multi_select_df.collect()[0]
+
+    expected_data = {
+        "id": [2, 3],
+        "name": ["Bob", "Charlie"],
+        "city": ["New York", "London"],
+    }
+
+    assert multi_result.column(0).to_pylist() == expected_data["id"]
+    assert multi_result.column(1).to_pylist() == expected_data["name"]
+    assert multi_result.column(2).to_pylist() == expected_data["city"]
+
+    # Test that schema only contains expected column names (no internal aliases)
+    joined_schema = joined_df.schema()
+    column_names = [field.name for field in joined_schema]
+    expected_columns = ["id", "name", "city"]
+    assert column_names == expected_columns  # list equality: order is checked
+
+    # Ensure no internal alias names like "__right_id" appear in the schema
+    for col_name in column_names:
+        assert not col_name.startswith("__"), (
+            f"Internal alias '{col_name}' leaked into schema"
+        )
+
+    # Test selecting each column individually to ensure they all work
+    for col_name in expected_columns:
+        individual_select = joined_df.select(column(col_name))
+        result = individual_select.collect()[0]
+        assert len(result) == 2, f"Column '{col_name}' selection failed"
+        assert result.schema.field(0).name == col_name
+
+    # Test that we can select all columns using their names
+    all_columns_select = joined_df.select(*[column(name) for name in expected_columns])
+    all_result = all_columns_select.collect()[0]
+    assert all_result.schema.names == expected_columns
+
+    # Verify that attempting to select a potential internal alias fails appropriately
+    with pytest.raises(Exception):  # noqa: B017 - generic exception from FFI
+        joined_df.select(column("__right_id")).collect()
+
+
+def test_join_deduplicate_all_types():
+    """Test deduplication behavior across join types (inner, left, right, full).
+
+    Note: This test may show linting errors due to method signature overloads,
+    but the functionality should work correctly at runtime.
+    """
+    ctx = SessionContext()
+
+    # Create left dataframe with some rows that won't match
+    left_batch = pa.RecordBatch.from_arrays(
+        [pa.array([1, 2, 3, 4]), pa.array(["a", "b", "c", "d"])],
+        names=["id", "left_value"],
+    )
+    left_df = ctx.create_dataframe([[left_batch]], "left")
+
+    # Create right dataframe with some rows that won't match and duplicate column name
+    right_batch = pa.RecordBatch.from_arrays(
+        [pa.array([2, 3, 5, 6]), pa.array(["x", "y", "z", "w"])],
+        names=["id", "right_value"],
+    )
+    right_df = ctx.create_dataframe([[right_batch]], "right")
+
+    # Test inner join with deduplication (default behavior)
+    inner_joined = left_df.join(right_df, on="id", how="inner", deduplicate=True)
+    inner_result = inner_joined.sort(column("id")).collect()[0]  # first batch only
+
+    # Should only have matching rows (2, 3)
+    expected_inner = {
+        "id": [2, 3],
+        "left_value": ["b", "c"],
+        "right_value": ["x", "y"],
+    }
+    assert inner_result.to_pydict() == expected_inner  # column order unchecked
+
+    # Test left join with deduplication
+    left_joined = left_df.join(right_df, on="id", how="left", deduplicate=True)
+    left_result = left_joined.sort(column("id")).collect()[0]
+
+    # Should have all left rows, with nulls for unmatched right rows
+    expected_left = {
+        "id": [1, 2, 3, 4],
+        "left_value": ["a", "b", "c", "d"],
+        "right_value": [None, "x", "y", None],
+    }
+    assert left_result.to_pydict() == expected_left
+
+    # Test right join with deduplication
+    right_joined = left_df.join(right_df, on="id", how="right", deduplicate=True)
+    right_result = right_joined.sort(column("id")).collect()[0]
+
+    # Should have all right rows, with nulls for unmatched left rows
+    expected_right = {
+        "id": [2, 3, 5, 6],  # ids 5 and 6 exist only on the right side
+        "left_value": ["b", "c", None, None],
+        "right_value": ["x", "y", "z", "w"],
+    }
+    assert right_result.to_pydict() == expected_right
+
+    # Test full outer join with deduplication
+    outer_joined = left_df.join(right_df, on="id", how="full", deduplicate=True)
+    outer_result = outer_joined.sort(column("id")).collect()[0]
+
+    # Should have all rows from both sides, with nulls for unmatched rows
+    expected_outer = {
+        "id": [1, 2, 3, 4, 5, 6],  # no null ids expected for right-only rows
+        "left_value": ["a", "b", "c", "d", None, None],
+        "right_value": [None, "x", "y", None, "z", "w"],
+    }
+    assert outer_result.to_pydict() == expected_outer
+
+    # Verify that we can still select the deduplicated column without issues
+    for join_type in ["inner", "left", "right", "full"]:
+        joined = left_df.join(right_df, on="id", how=join_type, deduplicate=True)
+        selected = joined.select(column("id"))
+        # Should not raise an error and should have the same number of rows
+        assert len(selected.collect()[0]) == len(joined.collect()[0])