diff --git a/bigframes/core/compile/polars/compiler.py b/bigframes/core/compile/polars/compiler.py
index 14d8e8501c..a0e85d8c69 100644
--- a/bigframes/core/compile/polars/compiler.py
+++ b/bigframes/core/compile/polars/compiler.py
@@ -16,14 +16,17 @@
 import dataclasses
 import functools
 import itertools
-from typing import cast, Optional, Sequence, Tuple, TYPE_CHECKING
+import operator
+from typing import cast, Literal, Optional, Sequence, Tuple, TYPE_CHECKING
+
+import pandas as pd
 
 import bigframes.core
-from bigframes.core import window_spec
+from bigframes.core import identifiers, nodes, ordering, window_spec
 import bigframes.core.expression as ex
 import bigframes.core.guid as guid
-import bigframes.core.nodes as nodes
 import bigframes.core.rewrite
+import bigframes.dtypes
 import bigframes.operations as ops
 import bigframes.operations.aggregations as agg_ops
 
@@ -37,6 +40,45 @@
 polars_installed = False
 
 if polars_installed:
+    _DTYPE_MAPPING = {
+        # Direct mappings
+        bigframes.dtypes.INT_DTYPE: pl.Int64(),
+        bigframes.dtypes.FLOAT_DTYPE: pl.Float64(),
+        bigframes.dtypes.BOOL_DTYPE: pl.Boolean(),
+        bigframes.dtypes.STRING_DTYPE: pl.String(),
+        bigframes.dtypes.NUMERIC_DTYPE: pl.Decimal(38, 9),
+        bigframes.dtypes.BIGNUMERIC_DTYPE: pl.Decimal(76, 38),
+        bigframes.dtypes.BYTES_DTYPE: pl.Binary(),
+        bigframes.dtypes.DATE_DTYPE: pl.Date(),
+        bigframes.dtypes.DATETIME_DTYPE: pl.Datetime(time_zone=None),
+        bigframes.dtypes.TIMESTAMP_DTYPE: pl.Datetime(time_zone="UTC"),
+        bigframes.dtypes.TIME_DTYPE: pl.Time(),
+        bigframes.dtypes.TIMEDELTA_DTYPE: pl.Duration(),
+        # Indirect mappings
+        bigframes.dtypes.GEO_DTYPE: pl.String(),
+        bigframes.dtypes.JSON_DTYPE: pl.String(),
+    }
+
+    def _bigframes_dtype_to_polars_dtype(
+        dtype: bigframes.dtypes.ExpressionType,
+    ) -> pl.DataType:
+        if dtype is None:
+            return pl.Null()
+        if bigframes.dtypes.is_struct_like(dtype):
+            return pl.Struct(
+                [
+                    pl.Field(name, _bigframes_dtype_to_polars_dtype(type))
+                    for name, type in bigframes.dtypes.get_struct_fields(dtype).items()
+                ]
+            )
+        if bigframes.dtypes.is_array_like(dtype):
+            # BigQuery arrays are variable-length, so map them to pl.List;
+            # pl.Array is fixed-shape and its constructor requires a shape.
+            return pl.List(
+                inner=_bigframes_dtype_to_polars_dtype(
+                    bigframes.dtypes.get_array_inner_type(dtype)
+                )
+            )
+        else:
+            return _DTYPE_MAPPING[dtype]
 
 
 @dataclasses.dataclass(frozen=True)
 class PolarsExpressionCompiler:
@@ -47,33 +89,45 @@ class PolarsExpressionCompiler:
     """
 
     @functools.singledispatchmethod
-    def compile_expression(self, expression: ex.Expression):
+    def compile_expression(self, expression: ex.Expression) -> pl.Expr:
         raise NotImplementedError(f"Cannot compile expression: {expression}")
 
     @compile_expression.register
     def _(
         self,
         expression: ex.ScalarConstantExpression,
-    ):
-        return pl.lit(expression.value)
+    ) -> pl.Expr:
+        value = expression.value
+        if not isinstance(value, float) and pd.isna(value):  # type: ignore
+            value = None
+        if expression.dtype is None:
+            return pl.lit(None)
+        return pl.lit(value, _bigframes_dtype_to_polars_dtype(expression.dtype))
 
     @compile_expression.register
     def _(
         self,
         expression: ex.DerefOp,
-    ):
+    ) -> pl.Expr:
        return pl.col(expression.id.sql)
 
+    @compile_expression.register
+    def _(
+        self,
+        expression: ex.SchemaFieldRefExpression,
+    ) -> pl.Expr:
+        return pl.col(expression.field.id.sql)
+
     @compile_expression.register
     def _(
         self,
         expression: ex.OpExpression,
-    ):
+    ) -> pl.Expr:
         # TODO: Complete the implementation, convert to hash dispatch
         op = expression.op
         args = tuple(map(self.compile_expression, expression.inputs))
         if isinstance(op, ops.invert_op.__class__):
-            return args[0].neg()
+            return ~args[0]
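+        # Note: invert_op is logical/bitwise NOT, so ~ (Expr.__invert__) is the
+        # correct lowering; Expr.neg() is arithmetic negation (see neg_op below).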
         if isinstance(op, ops.and_op.__class__):
             return args[0] & args[1]
         if isinstance(op, ops.or_op.__class__):
             return args[0] | args[1]
@@ -82,6 +136,21 @@ def _(
             return args[0] + args[1]
         if isinstance(op, ops.sub_op.__class__):
             return args[0] - args[1]
+        if isinstance(op, ops.mul_op.__class__):
+            return args[0] * args[1]
+        if isinstance(op, ops.div_op.__class__):
+            return args[0] / args[1]
+        if isinstance(op, ops.floordiv_op.__class__):
+            # TODO: Handle int // 0
+            return args[0] // args[1]
+        if isinstance(op, (ops.pow_op.__class__, ops.unsafe_pow_op.__class__)):
+            return args[0] ** args[1]
+        if isinstance(op, ops.abs_op.__class__):
+            return args[0].abs()
+        if isinstance(op, ops.neg_op.__class__):
+            return args[0].neg()
+        if isinstance(op, ops.pos_op.__class__):
+            return args[0]
         if isinstance(op, ops.ge_op.__class__):
             return args[0] >= args[1]
         if isinstance(op, ops.gt_op.__class__):
@@ -91,23 +160,48 @@ def _(
         if isinstance(op, ops.lt_op.__class__):
             return args[0] < args[1]
         if isinstance(op, ops.eq_op.__class__):
-            return args[0] == args[1]
+            return args[0].eq(args[1])
+        if isinstance(op, ops.eq_null_match_op.__class__):
+            return args[0].eq_missing(args[1])
         if isinstance(op, ops.ne_op.__class__):
-            return args[0] != args[1]
+            return args[0].ne(args[1])
+        if isinstance(op, ops.IsInOp):
+            # TODO: Filter out types that can't be coerced to right type
+            if op.match_nulls and any(map(pd.isna, op.values)):
+                # newer polars versions have a nulls_equal arg for this; until
+                # then, union with is_null() so null inputs count as a match
+                return args[0].is_in(op.values) | args[0].is_null()
+            else:
+                return args[0].is_in(op.values)
         if isinstance(op, ops.mod_op.__class__):
             return args[0] % args[1]
         if isinstance(op, ops.coalesce_op.__class__):
             return pl.coalesce(*args)
+        if isinstance(op, ops.fillna_op.__class__):
+            return pl.coalesce(*args)
+        if isinstance(op, ops.isnull_op.__class__):
+            return args[0].is_null()
+        if isinstance(op, ops.notnull_op.__class__):
+            return args[0].is_not_null()
         if isinstance(op, ops.CaseWhenOp):
             expr = pl.when(args[0]).then(args[1])
             for pred, result in zip(args[2::2], args[3::2]):
-                return expr.when(pred).then(result)
+                expr = expr.when(pred).then(result)  # type: ignore
             return expr
         if isinstance(op, ops.where_op.__class__):
             original, condition, otherwise = args
             return pl.when(condition).then(original).otherwise(otherwise)
+        if isinstance(op, ops.AsTypeOp):
+            return self.astype(args[0], op.to_type, safe=op.safe)
+        raise NotImplementedError(f"Polars compiler hasn't implemented {op}")
+
+    def astype(
+        self, col: pl.Expr, dtype: bigframes.dtypes.Dtype, safe: bool
+    ) -> pl.Expr:
+        # TODO: Polars casting works differently, need to lower instead to specific conversion ops.
+        # e.g. we want "True" instead of "true" for bool-to-string casts.
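+        # Illustrative behavior (assuming polars cast semantics): with safe=True
+        # we pass strict=False, so an unparseable value such as the string "a"
+        # cast to Int64 becomes null rather than raising InvalidOperationError.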
+ return col.cast(_DTYPE_MAPPING[dtype], strict=not safe) + @dataclasses.dataclass(frozen=True) class PolarsAggregateCompiler: scalar_compiler = PolarsExpressionCompiler() @@ -149,12 +243,26 @@ def compile_agg_expr(self, expr: ex.Aggregation): return self.compile_agg_op(expr.op, inputs) - def compile_agg_op(self, op: agg_ops.WindowOp, inputs: Sequence[str] = []): + def compile_agg_op( + self, op: agg_ops.WindowOp, inputs: Sequence[str] = [] + ) -> pl.Expr: if isinstance(op, agg_ops.ProductOp): - # TODO: Need schema to cast back to original type if posisble (eg float back to int) - return pl.col(*inputs).log().sum().exp() + # TODO: Fix datatype inconsistency with float/int + return pl.col(*inputs).product() if isinstance(op, agg_ops.SumOp): return pl.sum(*inputs) + if isinstance(op, (agg_ops.SizeOp, agg_ops.SizeUnaryOp)): + return pl.len() + if isinstance(op, agg_ops.MeanOp): + return pl.mean(*inputs) + if isinstance(op, agg_ops.MedianOp): + return pl.median(*inputs) + if isinstance(op, agg_ops.AllOp): + return pl.all(*inputs) + if isinstance(op, agg_ops.AnyOp): + return pl.any(*inputs) # type: ignore + if isinstance(op, agg_ops.NuniqueOp): + return pl.col(*inputs).drop_nulls().n_unique() if isinstance(op, agg_ops.MinOp): return pl.min(*inputs) if isinstance(op, agg_ops.MaxOp): @@ -162,7 +270,35 @@ def compile_agg_op(self, op: agg_ops.WindowOp, inputs: Sequence[str] = []): if isinstance(op, agg_ops.CountOp): return pl.count(*inputs) if isinstance(op, agg_ops.CorrOp): - return pl.corr(*inputs) + return pl.corr( + pl.col(inputs[0]).fill_nan(None), pl.col(inputs[1]).fill_nan(None) + ) + if isinstance(op, agg_ops.CovOp): + return pl.cov( + pl.col(inputs[0]).fill_nan(None), pl.col(inputs[1]).fill_nan(None) + ) + if isinstance(op, agg_ops.StdOp): + return pl.std(inputs[0]) + if isinstance(op, agg_ops.VarOp): + return pl.var(inputs[0]) + if isinstance(op, agg_ops.PopVarOp): + return pl.var(inputs[0], ddof=0) + if isinstance(op, agg_ops.FirstNonNullOp): + return pl.col(*inputs).drop_nulls().first() + if isinstance(op, agg_ops.LastNonNullOp): + return pl.col(*inputs).drop_nulls().last() + if isinstance(op, agg_ops.FirstOp): + return pl.col(*inputs).first() + if isinstance(op, agg_ops.LastOp): + return pl.col(*inputs).last() + if isinstance(op, agg_ops.ShiftOp): + return pl.col(*inputs).shift(op.periods) + if isinstance(op, agg_ops.DiffOp): + return pl.col(*inputs) - pl.col(*inputs).shift(op.periods) + if isinstance(op, agg_ops.AnyValueOp): + return pl.max( + *inputs + ) # probably something faster? maybe just get first item? raise NotImplementedError( f"Aggregate op {op} not yet supported in polars engine." 
) @@ -197,11 +333,14 @@ def compile(self, array_value: bigframes.core.ArrayValue) -> pl.LazyFrame: # TODO: Create standard way to configure BFET -> BFET rewrites # Polars has incomplete slice support in lazy mode - node = nodes.bottom_up(array_value.node, bigframes.core.rewrite.rewrite_slice) + node = array_value.node + node = bigframes.core.rewrite.column_pruning(node) + node = nodes.bottom_up(node, bigframes.core.rewrite.rewrite_slice) + node = bigframes.core.rewrite.pull_out_window_order(node) return self.compile_node(node) @functools.singledispatchmethod - def compile_node(self, node: nodes.BigFrameNode): + def compile_node(self, node: nodes.BigFrameNode) -> pl.LazyFrame: """Defines transformation but isn't cached, always use compile_node instead""" raise ValueError(f"Can't compile unrecognized node: {node}") @@ -213,7 +352,12 @@ def compile_readlocal(self, node: nodes.ReadLocalNode): lazy_frame = cast( pl.DataFrame, pl.from_arrow(node.local_data_source.data) ).lazy() - return lazy_frame.select(cols_to_read.keys()).rename(cols_to_read) + lazy_frame = lazy_frame.select(cols_to_read.keys()).rename(cols_to_read) + if node.offsets_col: + lazy_frame = lazy_frame.with_columns( + [pl.int_range(pl.len(), dtype=pl.Int64).alias(node.offsets_col.sql)] + ) + return lazy_frame @compile_node.register def compile_filter(self, node: nodes.FilterNode): @@ -227,17 +371,18 @@ def compile_orderby(self, node: nodes.OrderByNode): if len(node.by) == 0: # pragma: no cover return frame - - frame = frame.sort( - [ - self.expr_compiler.compile_expression(by.scalar_expression) - for by in node.by - ], - descending=[not by.direction.is_ascending for by in node.by], - nulls_last=[by.na_last for by in node.by], + return self._sort(frame, node.by) + + def _sort( + self, frame: pl.LazyFrame, by: Sequence[ordering.OrderingExpression] + ) -> pl.LazyFrame: + sorted = frame.sort( + [self.expr_compiler.compile_expression(by.scalar_expression) for by in by], + descending=[not by.direction.is_ascending for by in by], + nulls_last=[by.na_last for by in by], maintain_order=True, ) - return frame + return sorted @compile_node.register def compile_reversed(self, node: nodes.ReversedNode): @@ -251,10 +396,15 @@ def compile_selection(self, node: nodes.SelectionNode): @compile_node.register def compile_projection(self, node: nodes.ProjectionNode): - new_cols = [ - self.expr_compiler.compile_expression(ex).alias(name.sql) - for ex, name in node.assignments - ] + new_cols = [] + for proj_expr, name in node.assignments: + bound_expr = ex.bind_schema_fields(proj_expr, node.child.field_by_id) + new_col = self.expr_compiler.compile_expression(bound_expr).alias(name.sql) + if bound_expr.output_type is None: + new_col = new_col.cast( + _bigframes_dtype_to_polars_dtype(bigframes.dtypes.DEFAULT_DTYPE) + ) + new_cols.append(new_col) return self.compile_node(node.child).with_columns(new_cols) @compile_node.register @@ -265,37 +415,91 @@ def compile_offsets(self, node: nodes.PromoteOffsetsNode): @compile_node.register def compile_join(self, node: nodes.JoinNode): - # Always totally order this, as adding offsets is relatively cheap for in-memory columnar data - left = self.compile_node(node.left_child).with_columns( + left = self.compile_node(node.left_child) + right = self.compile_node(node.right_child) + left_on = [l_name.id.sql for l_name, _ in node.conditions] + right_on = [r_name.id.sql for _, r_name in node.conditions] + if node.type == "right": + return self._ordered_join( + right, left, "left", right_on, left_on, node.joins_nulls + 
).select([id.sql for id in node.ids]) + return self._ordered_join( + left, right, node.type, left_on, right_on, node.joins_nulls + ) + + def _ordered_join( + self, + left_frame: pl.LazyFrame, + right_frame: pl.LazyFrame, + how: Literal["inner", "outer", "left", "cross"], + left_on: Sequence[str], + right_on: Sequence[str], + join_nulls: bool, + ): + if how == "right": + # seems to cause seg faults as of v1.30 for no apparent reason + raise ValueError("right join not supported") + left = left_frame.with_columns( [ pl.int_range(pl.len()).alias("_bf_join_l"), ] ) - right = self.compile_node(node.right_child).with_columns( + right = right_frame.with_columns( [ pl.int_range(pl.len()).alias("_bf_join_r"), ] ) - if node.type != "cross": - left_on = [l_name.id.sql for l_name, _ in node.conditions] - right_on = [r_name.id.sql for _, r_name in node.conditions] + if how != "cross": joined = left.join( - right, how=node.type, left_on=left_on, right_on=right_on, coalesce=False + right, + how=how, + left_on=left_on, + right_on=right_on, + # Note: join_nulls renamed to nulls_equal for polars 1.24 + join_nulls=join_nulls, # type: ignore + coalesce=False, ) else: - joined = left.join(right, how=node.type) - return joined.sort(["_bf_join_l", "_bf_join_r"]).drop( + joined = left.join(right, how=how, coalesce=False) + + join_order = ( + ["_bf_join_l", "_bf_join_r"] + if how != "right" + else ["_bf_join_r", "_bf_join_l"] + ) + return joined.sort(join_order, nulls_last=True).drop( ["_bf_join_l", "_bf_join_r"] ) @compile_node.register def compile_concat(self, node: nodes.ConcatNode): - return pl.concat(self.compile_node(child) for child in node.child_nodes) + child_frames = [self.compile_node(child) for child in node.child_nodes] + child_frames = [ + frame.rename( + {col: id.sql for col, id in zip(frame.columns, node.output_ids)} + ) + for frame in child_frames + ] + df = pl.concat(child_frames) + return df @compile_node.register def compile_agg(self, node: nodes.AggregateNode): df = self.compile_node(node.child) - + if node.dropna and len(node.by_column_ids) > 0: + df = df.filter( + [pl.col(ref.id.sql).is_not_null() for ref in node.by_column_ids] + ) + if node.order_by: + df = self._sort(df, node.order_by) + return self._aggregate(df, node.aggregations, node.by_column_ids) + + def _aggregate( + self, + df: pl.LazyFrame, + aggregations: Sequence[Tuple[ex.Aggregation, identifiers.ColumnId]], + grouping_keys: Tuple[ex.DerefOp, ...], + ) -> pl.LazyFrame: # Need to materialize columns to broadcast constants agg_inputs = [ list( @@ -304,7 +508,7 @@ def compile_agg(self, node: nodes.AggregateNode): self.agg_compiler.get_args(agg), ) ) - for agg, _ in node.aggregations + for agg, _ in aggregations ] df_agg_inputs = df.with_columns(itertools.chain(*agg_inputs)) @@ -313,18 +517,19 @@ def compile_agg(self, node: nodes.AggregateNode): self.agg_compiler.compile_agg_op( agg.op, list(map(lambda x: x.meta.output_name(), inputs)) ).alias(id.sql) - for (agg, id), inputs in zip(node.aggregations, agg_inputs) + for (agg, id), inputs in zip(aggregations, agg_inputs) ] - if len(node.by_column_ids) > 0: - group_exprs = [pl.col(ref.id.sql) for ref in node.by_column_ids] + if len(grouping_keys) > 0: + group_exprs = [pl.col(ref.id.sql) for ref in grouping_keys] grouped_df = df_agg_inputs.group_by(group_exprs) - return grouped_df.agg(agg_exprs).sort(group_exprs) + return grouped_df.agg(agg_exprs).sort(group_exprs, nulls_last=True) else: return df_agg_inputs.select(agg_exprs) @compile_node.register def compile_explode(self, node: 
nodes.ExplodeNode):
+        assert node.offsets_col is None
         df = self.compile_node(node.child)
         cols = [pl.col(col.id.sql) for col in node.column_ids]
         return df.explode(cols)
@@ -338,55 +543,92 @@ def compile_sample(self, node: nodes.RandomSampleNode):
     @compile_node.register
     def compile_window(self, node: nodes.WindowOpNode):
         df = self.compile_node(node.child)
-        agg_expr = self.agg_compiler.compile_agg_expr(node.expression).alias(
-            node.output_name.sql
-        )
-        # Three window types: completely unbound, grouped and row bounded
         window = node.window_spec
-
+        # Should have been handled by the rewriter
+        assert len(window.ordering) == 0
         if window.min_periods > 0:
             raise NotImplementedError("min_period not yet supported for polars engine")
 
-        if window.bounds is None:
+        if (window.bounds is None) or (window.is_unbounded):
             # polars will automatically broadcast the aggregate to the matching input rows
-            if len(window.grouping_keys) == 0:  # unbound window
-                pass
-            else:  # partition-only window
-                agg_expr = agg_expr.over(
-                    partition_by=[ref.id.sql for ref in window.grouping_keys]
-                )
-            return df.with_columns([agg_expr])
-
+            agg_pl = self.agg_compiler.compile_agg_expr(node.expression)
+            if window.grouping_keys:
+                agg_pl = agg_pl.over(id.id.sql for id in window.grouping_keys)
+            result = df.with_columns(agg_pl.alias(node.output_name.sql))
         else:  # row-bounded window
-            assert isinstance(window.bounds, window_spec.RowsWindowBounds)
-            # Polars API semi-bounded, and any grouped rolling window challenging
-            # https://github.com/pola-rs/polars/issues/4799
-            # https://github.com/pola-rs/polars/issues/8976
-            index_col_name = "_bf_pl_engine_offsets"
-            indexed_df = df.with_row_index(index_col_name)
-            if len(window.grouping_keys) == 0:  # rolling-only window
-                # https://docs.pola.rs/api/python/stable/reference/dataframe/api/polars.DataFrame.rolling.html
-                offset_n = window.bounds.start
-                period_n = _get_period(window.bounds) or df.collect().height
-                results = indexed_df.rolling(
-                    index_column=index_col_name,
-                    period=f"{period_n}i",
-                    offset=f"{offset_n}i" if offset_n else None,
-                ).agg(agg_expr)
-            else:  # groupby-rolling window
-                raise NotImplementedError(
-                    "Groupby rolling windows not yet implemented in polars engine"
-                )
-            # polars is columnar, so this is efficient
-            # TODO: why can't just add columns?
-            return pl.concat([df, results], how="horizontal")
+            window_result = self._calc_row_analytic_func(
+                df, node.expression, node.window_spec, node.output_name.sql
+            )
+            result = pl.concat([df, window_result], how="horizontal")
+
+        # Probably easier just to pull this out as a rewriter
+        if (
+            node.expression.op.skips_nulls
+            and not node.never_skip_nulls
+            and node.expression.column_references
+        ):
+            nullity_expr = functools.reduce(
+                operator.or_,
+                (
+                    pl.col(column.sql).is_null()
+                    for column in node.expression.column_references
+                ),
+            )
+            result = result.with_columns(
+                pl.when(nullity_expr)
+                .then(None)
+                .otherwise(pl.col(node.output_name.sql))
+                .alias(node.output_name.sql)
+            )
+        return result
+
+    def _calc_row_analytic_func(
+        self,
+        frame: pl.LazyFrame,
+        agg_expr: ex.Aggregation,
+        window: window_spec.WindowSpec,
+        name: str,
+    ) -> pl.LazyFrame:
+        if not isinstance(window.bounds, window_spec.RowsWindowBounds):
+            raise NotImplementedError("Only row bounds supported by polars engine")
+        groupby = None
+        if len(window.grouping_keys) > 0:
+            groupby = [
+                self.expr_compiler.compile_expression(ref)
+                for ref in window.grouping_keys
+            ]
+
+        # Polars API semi-bounded, and any grouped rolling window challenging
+        # https://github.com/pola-rs/polars/issues/4799
+        # https://github.com/pola-rs/polars/issues/8976
+        pl_agg_expr = self.agg_compiler.compile_agg_expr(agg_expr).alias(name)
+        index_col_name = "_bf_pl_engine_offsets"
+        indexed_df = frame.with_row_index(index_col_name)
+        # https://docs.pola.rs/api/python/stable/reference/dataframe/api/polars.DataFrame.rolling.html
+        period_n, offset_n = _get_period_and_offset(window.bounds)
+        return (
+            indexed_df.rolling(
+                index_column=index_col_name,
+                period=f"{period_n}i",
+                offset=f"{offset_n}i" if (offset_n is not None) else None,
+                group_by=groupby,
+            )
+            .agg(pl_agg_expr)
+            .select(name)
+        )
 
 
-def _get_period(bounds: window_spec.RowsWindowBounds) -> Optional[int]:
-    """Returns None if the boundary is infinite."""
-    if bounds.start is None or bounds.end is None:
-        return None
+def _get_period_and_offset(
+    bounds: window_spec.RowsWindowBounds,
+) -> tuple[int, Optional[int]]:
+    # fixed size window
+    if (bounds.start is not None) and (bounds.end is not None):
+        return ((bounds.end - bounds.start + 1), bounds.start - 1)
 
-    # collecting height is a massive kludge
-    return bounds.end - bounds.start + 1
+    LARGE_N = 1000000000
+    if bounds.start is not None:
+        return (LARGE_N, bounds.start - 1)
+    if bounds.end is not None:
+        # Anchor the window's right edge at bounds.end (polars defaults the
+        # offset to -period), so semi-bounded windows with end != 0 stay correct.
+        return (LARGE_N, bounds.end - LARGE_N)
+    raise ValueError("Not a bounded window")
diff --git a/bigframes/core/global_session.py b/bigframes/core/global_session.py
index d4d70f5a06..8732b55990 100644
--- a/bigframes/core/global_session.py
+++ b/bigframes/core/global_session.py
@@ -112,3 +112,23 @@ def get_global_session():
 def with_default_session(func: Callable[..., _T], *args, **kwargs) -> _T:
     return func(get_global_session(), *args, **kwargs)
+
+
+class _GlobalSessionContext:
+    """
+    Context manager for testing that sets the global session.
+ """ + + def __init__(self, session: bigframes.session.Session): + self._session = session + + def __enter__(self): + global _global_session, _global_session_lock + with _global_session_lock: + self._previous_session = _global_session + _global_session = self._session + + def __exit__(self, *exc_details): + global _global_session, _global_session_lock + with _global_session_lock: + _global_session = self._previous_session diff --git a/bigframes/core/rewrite/__init__.py b/bigframes/core/rewrite/__init__.py index b8f1d26db8..5d554d45d7 100644 --- a/bigframes/core/rewrite/__init__.py +++ b/bigframes/core/rewrite/__init__.py @@ -24,7 +24,7 @@ ) from bigframes.core.rewrite.slices import pull_out_limit, pull_up_limits, rewrite_slice from bigframes.core.rewrite.timedeltas import rewrite_timedelta_expressions -from bigframes.core.rewrite.windows import rewrite_range_rolling +from bigframes.core.rewrite.windows import pull_out_window_order, rewrite_range_rolling __all__ = [ "legacy_join_as_projection", @@ -41,4 +41,5 @@ "bake_order", "try_reduce_to_local_scan", "fold_row_counts", + "pull_out_window_order", ] diff --git a/bigframes/core/rewrite/windows.py b/bigframes/core/rewrite/windows.py index 9f55db23af..6e9ba0dd3d 100644 --- a/bigframes/core/rewrite/windows.py +++ b/bigframes/core/rewrite/windows.py @@ -17,7 +17,7 @@ import dataclasses from bigframes import operations as ops -from bigframes.core import nodes +from bigframes.core import guid, identifiers, nodes, ordering def rewrite_range_rolling(node: nodes.BigFrameNode) -> nodes.BigFrameNode: @@ -43,3 +43,34 @@ def rewrite_range_rolling(node: nodes.BigFrameNode) -> nodes.BigFrameNode: node, window_spec=dataclasses.replace(node.window_spec, ordering=(new_ordering,)), ) + + +def pull_out_window_order(root: nodes.BigFrameNode) -> nodes.BigFrameNode: + return root.bottom_up(rewrite_window_node) + + +def rewrite_window_node(node: nodes.BigFrameNode) -> nodes.BigFrameNode: + if not isinstance(node, nodes.WindowOpNode): + return node + if len(node.window_spec.ordering) == 0: + return node + else: + offsets_id = guid.generate_guid() + w_offsets = nodes.PromoteOffsetsNode( + node.child, identifiers.ColumnId(offsets_id) + ) + sorted_child = nodes.OrderByNode(w_offsets, node.window_spec.ordering) + new_window_node = dataclasses.replace( + node, + child=sorted_child, + window_spec=node.window_spec.without_order(force=True), + ) + w_resetted_order = nodes.OrderByNode( + new_window_node, + by=(ordering.ascending_over(identifiers.ColumnId(offsets_id)),), + is_total_order=True, + ) + w_offsets_dropped = nodes.SelectionNode( + w_resetted_order, tuple(nodes.AliasedRef.identity(id) for id in node.ids) + ) + return w_offsets_dropped diff --git a/bigframes/core/window_spec.py b/bigframes/core/window_spec.py index d08ba3d12a..2be30135ee 100644 --- a/bigframes/core/window_spec.py +++ b/bigframes/core/window_spec.py @@ -234,7 +234,9 @@ def is_row_bounded(self): This is relevant for determining whether the window requires a total order to calculate deterministically. """ - return isinstance(self.bounds, RowsWindowBounds) + return isinstance(self.bounds, RowsWindowBounds) and ( + (self.bounds.start is not None) or (self.bounds.end is not None) + ) @property def is_range_bounded(self): @@ -254,7 +256,9 @@ def is_unbounded(self): This is relevant for determining whether the window requires a total order to calculate deterministically. 
""" - return self.bounds is None + return self.bounds is None or ( + self.bounds.start is None and self.bounds.end is None + ) @property def all_referenced_columns(self) -> Set[ids.ColumnId]: @@ -266,9 +270,9 @@ def all_referenced_columns(self) -> Set[ids.ColumnId]: ) return set(itertools.chain((i.id for i in self.grouping_keys), ordering_vars)) - def without_order(self) -> WindowSpec: + def without_order(self, force: bool = False) -> WindowSpec: """Removes ordering clause if ordering isn't required to define bounds.""" - if self.is_row_bounded: + if self.is_row_bounded and not force: raise ValueError("Cannot remove order from row-bounded window") return replace(self, ordering=()) diff --git a/bigframes/operations/aggregations.py b/bigframes/operations/aggregations.py index e3f15e67a1..1c321c0bf8 100644 --- a/bigframes/operations/aggregations.py +++ b/bigframes/operations/aggregations.py @@ -439,7 +439,6 @@ def output_type(self, *input_types: dtypes.ExpressionType) -> dtypes.ExpressionT return dtypes.INT_DTYPE -# TODO: Convert to NullaryWindowOp @dataclasses.dataclass(frozen=True) class RankOp(UnaryWindowOp): name: ClassVar[str] = "rank" @@ -456,7 +455,6 @@ def implicitly_inherits_order(self): return False -# TODO: Convert to NullaryWindowOp @dataclasses.dataclass(frozen=True) class DenseRankOp(UnaryWindowOp): @property diff --git a/bigframes/testing/polars_session.py b/bigframes/testing/polars_session.py index f8dda8da55..5e5de2d0b2 100644 --- a/bigframes/testing/polars_session.py +++ b/bigframes/testing/polars_session.py @@ -20,12 +20,9 @@ import polars import bigframes -import bigframes.clients import bigframes.core.blocks import bigframes.core.compile.polars -import bigframes.core.ordering import bigframes.dataframe -import bigframes.session.clients import bigframes.session.executor import bigframes.session.metrics @@ -35,6 +32,26 @@ class TestExecutor(bigframes.session.executor.Executor): compiler = bigframes.core.compile.polars.PolarsCompiler() + def peek( + self, + array_value: bigframes.core.ArrayValue, + n_rows: int, + use_explicit_destination: Optional[bool] = False, + ): + """ + A 'peek' efficiently accesses a small number of rows in the dataframe. + """ + lazy_frame: polars.LazyFrame = self.compiler.compile(array_value) + pa_table = lazy_frame.collect().limit(n_rows).to_arrow() + # Currently, pyarrow types might not quite be exactly the ones in the bigframes schema. + # Nullability may be different, and might use large versions of list, string datatypes. 
+ return bigframes.session.executor.ExecuteResult( + arrow_batches=pa_table.to_batches(), + schema=array_value.schema, + total_bytes=pa_table.nbytes, + total_rows=pa_table.num_rows, + ) + def execute( self, array_value: bigframes.core.ArrayValue, @@ -58,6 +75,14 @@ def execute( total_rows=pa_table.num_rows, ) + def cached( + self, + array_value: bigframes.core.ArrayValue, + *, + config, + ) -> None: + return + class TestSession(bigframes.session.Session): def __init__(self): @@ -92,3 +117,8 @@ def read_pandas(self, pandas_dataframe, write_engine="default"): pandas_dataframe = pandas_dataframe.to_frame() local_block = bigframes.core.blocks.Block.from_local(pandas_dataframe, self) return bigframes.dataframe.DataFrame(local_block) + + @property + def bqclient(self): + # prevents logger from trying to call bq upon any errors + return None diff --git a/noxfile.py b/noxfile.py index 297e8f9d6f..e3cfbf83a4 100644 --- a/noxfile.py +++ b/noxfile.py @@ -79,7 +79,7 @@ UNIT_TEST_DEPENDENCIES: List[str] = [] UNIT_TEST_EXTRAS: List[str] = ["tests"] UNIT_TEST_EXTRAS_BY_PYTHON: Dict[str, List[str]] = { - "3.12": ["polars", "scikit-learn"], + "3.12": ["tests", "polars", "scikit-learn"], } # 3.10 is needed for Windows tests as it is the only version installed in the @@ -202,14 +202,11 @@ def install_unittest_dependencies(session, install_test_extra, *constraints): if UNIT_TEST_LOCAL_DEPENDENCIES: session.install(*UNIT_TEST_LOCAL_DEPENDENCIES, *constraints) - if install_test_extra and UNIT_TEST_EXTRAS_BY_PYTHON: - extras = UNIT_TEST_EXTRAS_BY_PYTHON.get(session.python, []) - if install_test_extra and UNIT_TEST_EXTRAS: - extras = UNIT_TEST_EXTRAS - else: - extras = [] - - if extras: + if install_test_extra: + if session.python in UNIT_TEST_EXTRAS_BY_PYTHON: + extras = UNIT_TEST_EXTRAS_BY_PYTHON[session.python] + else: + extras = UNIT_TEST_EXTRAS session.install("-e", f".[{','.join(extras)}]", *constraints) else: session.install("-e", ".", *constraints) diff --git a/tests/unit/test_dataframe_polars.py b/tests/unit/test_dataframe_polars.py new file mode 100644 index 0000000000..2bda563418 --- /dev/null +++ b/tests/unit/test_dataframe_polars.py @@ -0,0 +1,4422 @@ +# Copyright 2023 Google LLC +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
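+
+# These tests exercise the pandas-compatible DataFrame API against the
+# in-memory polars executor (bigframes.testing.polars_session.TestSession),
+# mirroring the system tests without requiring a live BigQuery connection.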
+ +import io +import operator +import pathlib +import tempfile +import typing +from typing import Generator, List, Tuple + +import numpy as np +import pandas as pd +import pandas.testing +import pytest + +import bigframes +import bigframes._config.display_options as display_options +import bigframes.core.indexes as bf_indexes +import bigframes.dataframe as dataframe +import bigframes.pandas as bpd +import bigframes.series as series +from tests.system.utils import ( + assert_dfs_equivalent, + assert_pandas_df_equal, + assert_series_equal, + assert_series_equivalent, + convert_pandas_dtypes, +) + +pytest.importorskip("polars") +pytest.importorskip("pandas", minversion="2.0.0") + +CURRENT_DIR = pathlib.Path(__file__).parent +DATA_DIR = CURRENT_DIR.parent / "data" + + +@pytest.fixture(scope="module", autouse=True) +def session() -> Generator[bigframes.Session, None, None]: + import bigframes.core.global_session + from bigframes.testing import polars_session + + session = polars_session.TestSession() + with bigframes.core.global_session._GlobalSessionContext(session): + yield session + + +@pytest.fixture(scope="module") +def scalars_pandas_df_index() -> pd.DataFrame: + """pd.DataFrame pointing at test data.""" + + df = pd.read_json( + DATA_DIR / "scalars.jsonl", + lines=True, + ) + convert_pandas_dtypes(df, bytes_col=True) + + df = df.set_index("rowindex", drop=False) + df.index.name = None + return df.set_index("rowindex").sort_index() + + +@pytest.fixture(scope="module") +def scalars_df_index( + session: bigframes.Session, scalars_pandas_df_index +) -> bpd.DataFrame: + return session.read_pandas(scalars_pandas_df_index) + + +@pytest.fixture(scope="module") +def scalars_df_2_index( + session: bigframes.Session, scalars_pandas_df_index +) -> bpd.DataFrame: + return session.read_pandas(scalars_pandas_df_index) + + +@pytest.fixture(scope="module") +def scalars_dfs( + scalars_df_index, + scalars_pandas_df_index, +): + return scalars_df_index, scalars_pandas_df_index + + +def test_df_construct_copy(scalars_dfs): + columns = ["int64_col", "string_col", "float64_col"] + scalars_df, scalars_pandas_df = scalars_dfs + # Make the mapping from label to col_id non-trivial + bf_df = scalars_df.copy() + bf_df["int64_col"] = bf_df["int64_col"] / 2 + pd_df = scalars_pandas_df.copy() + pd_df["int64_col"] = pd_df["int64_col"] / 2 + + bf_result = dataframe.DataFrame(bf_df, columns=columns).to_pandas() + + pd_result = pd.DataFrame(pd_df, columns=columns) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_df_construct_pandas_default(scalars_dfs): + # This should trigger the inlined codepath + columns = [ + "int64_too", + "int64_col", + "float64_col", + "bool_col", + "string_col", + "date_col", + "datetime_col", + "numeric_col", + "float64_col", + "time_col", + "timestamp_col", + ] + _, scalars_pandas_df = scalars_dfs + bf_result = dataframe.DataFrame(scalars_pandas_df, columns=columns).to_pandas() + pd_result = pd.DataFrame(scalars_pandas_df, columns=columns) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_df_construct_structs(session): + pd_frame = pd.Series( + [ + {"version": 1, "project": "pandas"}, + {"version": 2, "project": "pandas"}, + {"version": 1, "project": "numpy"}, + ] + ).to_frame() + bf_series = session.read_pandas(pd_frame) + pd.testing.assert_frame_equal( + bf_series.to_pandas(), pd_frame, check_index_type=False, check_dtype=False + ) + + +def test_df_construct_pandas_set_dtype(scalars_dfs): + columns = [ + "int64_too", + "int64_col", + "float64_col", + 
"bool_col", + ] + _, scalars_pandas_df = scalars_dfs + bf_result = dataframe.DataFrame( + scalars_pandas_df, columns=columns, dtype="Float64" + ).to_pandas() + pd_result = pd.DataFrame(scalars_pandas_df, columns=columns, dtype="Float64") + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_df_construct_from_series(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = dataframe.DataFrame( + {"a": scalars_df["int64_col"], "b": scalars_df["string_col"]}, + dtype="string[pyarrow]", + ) + pd_result = pd.DataFrame( + {"a": scalars_pandas_df["int64_col"], "b": scalars_pandas_df["string_col"]}, + dtype="string[pyarrow]", + ) + assert_dfs_equivalent(pd_result, bf_result) + + +def test_df_construct_from_dict(): + input_dict = { + "Animal": ["Falcon", "Falcon", "Parrot", "Parrot"], + # With a space in column name. We use standardized SQL schema ids to solve the problem that BQ schema doesn't support column names with spaces. b/296751058 + "Max Speed": [380.0, 370.0, 24.0, 26.0], + } + bf_result = dataframe.DataFrame(input_dict).to_pandas() + pd_result = pd.DataFrame(input_dict) + + pandas.testing.assert_frame_equal( + bf_result, pd_result, check_dtype=False, check_index_type=False + ) + + +def test_df_construct_dtype(): + data = { + "int_col": [1, 2, 3], + "string_col": ["1.1", "2.0", "3.5"], + "float_col": [1.0, 2.0, 3.0], + } + dtype = pd.StringDtype(storage="pyarrow") + bf_result = dataframe.DataFrame(data, dtype=dtype) + pd_result = pd.DataFrame(data, dtype=dtype) + pd_result.index = pd_result.index.astype("Int64") + pandas.testing.assert_frame_equal(bf_result.to_pandas(), pd_result) + + +def test_get_column(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_name = "int64_col" + series = scalars_df[col_name] + bf_result = series.to_pandas() + pd_result = scalars_pandas_df[col_name] + assert_series_equal(bf_result, pd_result) + + +def test_get_column_nonstring(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + series = scalars_df.rename(columns={"int64_col": 123.1})[123.1] + bf_result = series.to_pandas() + pd_result = scalars_pandas_df.rename(columns={"int64_col": 123.1})[123.1] + assert_series_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + "row_slice", + [ + (slice(1, 7, 2)), + (slice(1, 7, None)), + (slice(None, -3, None)), + ], +) +def test_get_rows_with_slice(scalars_dfs, row_slice): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[row_slice].to_pandas() + pd_result = scalars_pandas_df[row_slice] + assert_pandas_df_equal(bf_result, pd_result) + + +def test_hasattr(scalars_dfs): + scalars_df, _ = scalars_dfs + assert hasattr(scalars_df, "int64_col") + assert hasattr(scalars_df, "head") + assert not hasattr(scalars_df, "not_exist") + + +@pytest.mark.parametrize( + ("ordered"), + [ + (True), + (False), + ], +) +def test_head_with_custom_column_labels( + scalars_df_index, scalars_pandas_df_index, ordered +): + rename_mapping = { + "int64_col": "Integer Column", + "string_col": "言語列", + } + bf_df = scalars_df_index.rename(columns=rename_mapping).head(3) + bf_result = bf_df.to_pandas(ordered=ordered) + pd_result = scalars_pandas_df_index.rename(columns=rename_mapping).head(3) + assert_pandas_df_equal(bf_result, pd_result, ignore_order=not ordered) + + +def test_tail_with_custom_column_labels(scalars_df_index, scalars_pandas_df_index): + rename_mapping = { + "int64_col": "Integer Column", + "string_col": "言語列", + } + bf_df = scalars_df_index.rename(columns=rename_mapping).tail(3) + bf_result = 
bf_df.to_pandas() + pd_result = scalars_pandas_df_index.rename(columns=rename_mapping).tail(3) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_get_column_by_attr(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + series = scalars_df.int64_col + bf_result = series.to_pandas() + pd_result = scalars_pandas_df.int64_col + assert_series_equal(bf_result, pd_result) + + +def test_get_columns(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_names = ["bool_col", "float64_col", "int64_col"] + df_subset = scalars_df.get(col_names) + df_pandas = df_subset.to_pandas() + pd.testing.assert_index_equal( + df_pandas.columns, scalars_pandas_df[col_names].columns + ) + + +def test_get_columns_default(scalars_dfs): + scalars_df, _ = scalars_dfs + col_names = ["not", "column", "names"] + result = scalars_df.get(col_names, "default_val") + assert result == "default_val" + + +@pytest.mark.parametrize( + ("loc", "column", "value", "allow_duplicates"), + [ + (0, 666, 2, False), + (5, "float64_col", 2.2, True), + (13, "rowindex_2", [8, 7, 6, 5, 4, 3, 2, 1, 0], True), + pytest.param( + 14, + "test", + 2, + False, + marks=pytest.mark.xfail( + raises=IndexError, + ), + ), + pytest.param( + 12, + "int64_col", + 2, + False, + marks=pytest.mark.xfail( + raises=ValueError, + ), + ), + ], +) +def test_insert(scalars_dfs, loc, column, value, allow_duplicates): + scalars_df, scalars_pandas_df = scalars_dfs + # insert works inplace, so will influence other tests. + # make a copy to avoid inplace changes. + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df.insert(loc, column, value, allow_duplicates) + pd_df.insert(loc, column, value, allow_duplicates) + + pd.testing.assert_frame_equal(bf_df.to_pandas(), pd_df, check_dtype=False) + + +def test_where_series_cond(scalars_df_index, scalars_pandas_df_index): + # Condition is dataframe, other is None (as default). + cond_bf = scalars_df_index["int64_col"] > 0 + cond_pd = scalars_pandas_df_index["int64_col"] > 0 + bf_result = scalars_df_index.where(cond_bf).to_pandas() + pd_result = scalars_pandas_df_index.where(cond_pd) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_mask_series_cond(scalars_df_index, scalars_pandas_df_index): + cond_bf = scalars_df_index["int64_col"] > 0 + cond_pd = scalars_pandas_df_index["int64_col"] > 0 + + bf_df = scalars_df_index[["int64_too", "int64_col", "float64_col"]] + pd_df = scalars_pandas_df_index[["int64_too", "int64_col", "float64_col"]] + bf_result = bf_df.mask(cond_bf, bf_df + 1).to_pandas() + pd_result = pd_df.mask(cond_pd, pd_df + 1) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_where_series_multi_index(scalars_df_index, scalars_pandas_df_index): + # Test when a dataframe has multi-index or multi-columns. + columns = ["int64_col", "float64_col"] + dataframe_bf = scalars_df_index[columns] + + dataframe_bf.columns = pd.MultiIndex.from_tuples( + [("str1", 1), ("str2", 2)], names=["STR", "INT"] + ) + cond_bf = dataframe_bf["str1"] > 0 + + with pytest.raises(NotImplementedError) as context: + dataframe_bf.where(cond_bf).to_pandas() + assert ( + str(context.value) + == "The dataframe.where() method does not support multi-index and/or multi-column." + ) + + +def test_where_series_cond_const_other(scalars_df_index, scalars_pandas_df_index): + # Condition is a series, other is a constant. 
+ columns = ["int64_col", "float64_col"] + dataframe_bf = scalars_df_index[columns] + dataframe_pd = scalars_pandas_df_index[columns] + dataframe_bf.columns.name = "test_name" + dataframe_pd.columns.name = "test_name" + + cond_bf = dataframe_bf["int64_col"] > 0 + cond_pd = dataframe_pd["int64_col"] > 0 + other = 0 + + bf_result = dataframe_bf.where(cond_bf, other).to_pandas() + pd_result = dataframe_pd.where(cond_pd, other) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_where_series_cond_dataframe_other(scalars_df_index, scalars_pandas_df_index): + # Condition is a series, other is a dataframe. + columns = ["int64_col", "float64_col"] + dataframe_bf = scalars_df_index[columns] + dataframe_pd = scalars_pandas_df_index[columns] + + cond_bf = dataframe_bf["int64_col"] > 0 + cond_pd = dataframe_pd["int64_col"] > 0 + other_bf = -dataframe_bf + other_pd = -dataframe_pd + + bf_result = dataframe_bf.where(cond_bf, other_bf).to_pandas() + pd_result = dataframe_pd.where(cond_pd, other_pd) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_where_dataframe_cond(scalars_df_index, scalars_pandas_df_index): + # Condition is a dataframe, other is None. + columns = ["int64_col", "float64_col"] + dataframe_bf = scalars_df_index[columns] + dataframe_pd = scalars_pandas_df_index[columns] + + cond_bf = dataframe_bf > 0 + cond_pd = dataframe_pd > 0 + + bf_result = dataframe_bf.where(cond_bf, None).to_pandas() + pd_result = dataframe_pd.where(cond_pd, None) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_where_dataframe_cond_const_other(scalars_df_index, scalars_pandas_df_index): + # Condition is a dataframe, other is a constant. + columns = ["int64_col", "float64_col"] + dataframe_bf = scalars_df_index[columns] + dataframe_pd = scalars_pandas_df_index[columns] + + cond_bf = dataframe_bf > 0 + cond_pd = dataframe_pd > 0 + other_bf = 10 + other_pd = 10 + + bf_result = dataframe_bf.where(cond_bf, other_bf).to_pandas() + pd_result = dataframe_pd.where(cond_pd, other_pd) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_where_dataframe_cond_dataframe_other( + scalars_df_index, scalars_pandas_df_index +): + # Condition is a dataframe, other is a dataframe. 
+ columns = ["int64_col", "float64_col"] + dataframe_bf = scalars_df_index[columns] + dataframe_pd = scalars_pandas_df_index[columns] + + cond_bf = dataframe_bf > 0 + cond_pd = dataframe_pd > 0 + other_bf = dataframe_bf * 2 + other_pd = dataframe_pd * 2 + + bf_result = dataframe_bf.where(cond_bf, other_bf).to_pandas() + pd_result = dataframe_pd.where(cond_pd, other_pd) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_drop_column(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_name = "int64_col" + df_pandas = scalars_df.drop(columns=col_name).to_pandas() + pd.testing.assert_index_equal( + df_pandas.columns, scalars_pandas_df.drop(columns=col_name).columns + ) + + +def test_drop_columns(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_names = ["int64_col", "geography_col", "time_col"] + df_pandas = scalars_df.drop(columns=col_names).to_pandas() + pd.testing.assert_index_equal( + df_pandas.columns, scalars_pandas_df.drop(columns=col_names).columns + ) + + +def test_drop_labels_axis_1(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + labels = ["int64_col", "geography_col", "time_col"] + + pd_result = scalars_pandas_df.drop(labels=labels, axis=1) + bf_result = scalars_df.drop(labels=labels, axis=1).to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_with_custom_column_labels(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + rename_mapping = { + "int64_col": "Integer Column", + "string_col": "言語列", + } + dropped_columns = [ + "言語列", + "timestamp_col", + ] + bf_df = scalars_df.rename(columns=rename_mapping).drop(columns=dropped_columns) + bf_result = bf_df.to_pandas() + pd_result = scalars_pandas_df.rename(columns=rename_mapping).drop( + columns=dropped_columns + ) + assert_pandas_df_equal(bf_result, pd_result) + + +def test_df_memory_usage(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + pd_result = scalars_pandas_df.memory_usage() + bf_result = scalars_df.memory_usage() + + pd.testing.assert_series_equal(pd_result, bf_result, rtol=1.5) + + +def test_df_info(scalars_dfs): + expected = ( + "\n" + "Index: 9 entries, 0 to 8\n" + "Data columns (total 13 columns):\n" + " # Column Non-Null Count Dtype\n" + "--- ------------- ---------------- ------------------------------\n" + " 0 bool_col 8 non-null boolean\n" + " 1 bytes_col 6 non-null binary[pyarrow]\n" + " 2 date_col 7 non-null date32[day][pyarrow]\n" + " 3 datetime_col 6 non-null timestamp[us][pyarrow]\n" + " 4 geography_col 4 non-null geometry\n" + " 5 int64_col 8 non-null Int64\n" + " 6 int64_too 9 non-null Int64\n" + " 7 numeric_col 6 non-null decimal128(38, 9)[pyarrow]\n" + " 8 float64_col 7 non-null Float64\n" + " 9 rowindex_2 9 non-null Int64\n" + " 10 string_col 8 non-null string\n" + " 11 time_col 6 non-null time64[us][pyarrow]\n" + " 12 timestamp_col 6 non-null timestamp[us, tz=UTC][pyarrow]\n" + "dtypes: Float64(1), Int64(3), binary[pyarrow](1), boolean(1), date32[day][pyarrow](1), decimal128(38, 9)[pyarrow](1), geometry(1), string(1), time64[us][pyarrow](1), timestamp[us, tz=UTC][pyarrow](1), timestamp[us][pyarrow](1)\n" + "memory usage: 1269 bytes\n" + ) + + scalars_df, _ = scalars_dfs + bf_result = io.StringIO() + + scalars_df.info(buf=bf_result) + + assert expected == bf_result.getvalue() + + +@pytest.mark.parametrize( + ("include", "exclude"), + [ + ("Int64", None), + (["int"], None), + ("number", None), + ([pd.Int64Dtype(), pd.BooleanDtype()], None), + (None, [pd.Int64Dtype(), pd.BooleanDtype()]), + 
("Int64", ["boolean"]), + ], +) +def test_select_dtypes(scalars_dfs, include, exclude): + scalars_df, scalars_pandas_df = scalars_dfs + + pd_result = scalars_pandas_df.select_dtypes(include=include, exclude=exclude) + bf_result = scalars_df.select_dtypes(include=include, exclude=exclude).to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_index(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + pd_result = scalars_pandas_df.drop(index=[4, 1, 2]) + bf_result = scalars_df.drop(index=[4, 1, 2]).to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_pandas_index(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + drop_index = scalars_pandas_df.iloc[[4, 1, 2]].index + + pd_result = scalars_pandas_df.drop(index=drop_index) + bf_result = scalars_df.drop(index=drop_index).to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_bigframes_index(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + drop_index = scalars_df.loc[[4, 1, 2]].index + drop_pandas_index = scalars_pandas_df.loc[[4, 1, 2]].index + + pd_result = scalars_pandas_df.drop(index=drop_pandas_index) + bf_result = scalars_df.drop(index=drop_index).to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_bigframes_index_with_na(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + scalars_df = scalars_df.copy() + scalars_pandas_df = scalars_pandas_df.copy() + scalars_df = scalars_df.set_index("bytes_col") + scalars_pandas_df = scalars_pandas_df.set_index("bytes_col") + drop_index = scalars_df.iloc[[3, 5]].index + drop_pandas_index = scalars_pandas_df.iloc[[3, 5]].index + + pd_result = scalars_pandas_df.drop(index=drop_pandas_index) # drop_pandas_index) + bf_result = scalars_df.drop(index=drop_index).to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_bigframes_multiindex(scalars_dfs): + # TODO: supply a reason why this isn't compatible with pandas 1.x + pytest.importorskip("pandas", minversion="2.0.0") + scalars_df, scalars_pandas_df = scalars_dfs + scalars_df = scalars_df.copy() + scalars_pandas_df = scalars_pandas_df.copy() + sub_df = scalars_df.iloc[[4, 1, 2]] + sub_pandas_df = scalars_pandas_df.iloc[[4, 1, 2]] + sub_df = sub_df.set_index(["bytes_col", "numeric_col"]) + sub_pandas_df = sub_pandas_df.set_index(["bytes_col", "numeric_col"]) + drop_index = sub_df.index + drop_pandas_index = sub_pandas_df.index + + scalars_df = scalars_df.set_index(["bytes_col", "numeric_col"]) + scalars_pandas_df = scalars_pandas_df.set_index(["bytes_col", "numeric_col"]) + bf_result = scalars_df.drop(index=drop_index).to_pandas() + pd_result = scalars_pandas_df.drop(index=drop_pandas_index) + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_labels_axis_0(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + pd_result = scalars_pandas_df.drop(labels=[4, 1, 2], axis=0) + bf_result = scalars_df.drop(labels=[4, 1, 2], axis=0).to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_drop_index_and_columns(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + pd_result = scalars_pandas_df.drop(index=[4, 1, 2], columns="int64_col") + bf_result = scalars_df.drop(index=[4, 1, 2], columns="int64_col").to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result) + + +def test_rename(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_name_dict = {"bool_col": 1.2345} + 
df_pandas = scalars_df.rename(columns=col_name_dict).to_pandas() + pd.testing.assert_index_equal( + df_pandas.columns, scalars_pandas_df.rename(columns=col_name_dict).columns + ) + + +def test_df_peek(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + peek_result = scalars_df.peek(n=3, force=False, allow_large_results=True) + + pd.testing.assert_index_equal(scalars_pandas_df.columns, peek_result.columns) + assert len(peek_result) == 3 + + +def test_df_peek_with_large_results_not_allowed(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + peek_result = scalars_df.peek(n=3, force=False, allow_large_results=False) + + pd.testing.assert_index_equal(scalars_pandas_df.columns, peek_result.columns) + assert len(peek_result) == 3 + + +def test_df_peek_filtered(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + peek_result = scalars_df[scalars_df.int64_col != 0].peek(n=3, force=False) + pd.testing.assert_index_equal(scalars_pandas_df.columns, peek_result.columns) + assert len(peek_result) == 3 + + +def test_df_peek_force_default(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + peek_result = scalars_df[["int64_col", "int64_too"]].cumsum().peek(n=3) + pd.testing.assert_index_equal( + scalars_pandas_df[["int64_col", "int64_too"]].columns, peek_result.columns + ) + assert len(peek_result) == 3 + + +def test_df_peek_reset_index(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + peek_result = ( + scalars_df[["int64_col", "int64_too"]].reset_index(drop=True).peek(n=3) + ) + pd.testing.assert_index_equal( + scalars_pandas_df[["int64_col", "int64_too"]].columns, peek_result.columns + ) + assert len(peek_result) == 3 + + +def test_repr_w_all_rows(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + # Remove columns with flaky formatting, like NUMERIC columns (which use the + # object dtype). Also makes a copy so that mutating the index name doesn't + # break other tests. + scalars_df = scalars_df.drop(columns=["numeric_col"]) + scalars_pandas_df = scalars_pandas_df.drop(columns=["numeric_col"]) + + # When there are 10 or fewer rows, the outputs should be identical. + actual = repr(scalars_df.head(10)) + + with display_options.pandas_repr(bigframes.options.display): + expected = repr(scalars_pandas_df.head(10)) + + assert actual == expected + + +def test_join_repr(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + scalars_df = ( + scalars_df[["int64_col"]] + .join(scalars_df.set_index("int64_col")[["int64_too"]]) + .sort_index() + ) + scalars_pandas_df = ( + scalars_pandas_df[["int64_col"]] + .join(scalars_pandas_df.set_index("int64_col")[["int64_too"]]) + .sort_index() + ) + # Pandas join result index name seems to depend on the index values in a way that bigframes can't match exactly + scalars_pandas_df.index.name = None + + actual = repr(scalars_df) + + with display_options.pandas_repr(bigframes.options.display): + expected = repr(scalars_pandas_df) + + assert actual == expected + + +def test_repr_html_w_all_rows(scalars_dfs, session): + scalars_df, _ = scalars_dfs + # get a pandas df of the expected format + df, _ = scalars_df._block.to_pandas() + pandas_df = df.set_axis(scalars_df._block.column_labels, axis=1) + pandas_df.index.name = scalars_df.index.name + + # When there are 10 or fewer rows, the outputs should be identical except for the extra note. 
+ actual = scalars_df.head(10)._repr_html_() + + with display_options.pandas_repr(bigframes.options.display): + pandas_repr = pandas_df.head(10)._repr_html_() + + expected = ( + pandas_repr + + f"[{len(pandas_df.index)} rows x {len(pandas_df.columns)} columns in total]" + ) + assert actual == expected + + +def test_df_column_name_with_space(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_name_dict = {"bool_col": "bool col"} + df_pandas = scalars_df.rename(columns=col_name_dict).to_pandas() + pd.testing.assert_index_equal( + df_pandas.columns, scalars_pandas_df.rename(columns=col_name_dict).columns + ) + + +def test_df_column_name_duplicate(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_name_dict = {"int64_too": "int64_col"} + df_pandas = scalars_df.rename(columns=col_name_dict).to_pandas() + pd.testing.assert_index_equal( + df_pandas.columns, scalars_pandas_df.rename(columns=col_name_dict).columns + ) + + +def test_get_df_column_name_duplicate(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_name_dict = {"int64_too": "int64_col"} + + bf_result = scalars_df.rename(columns=col_name_dict)["int64_col"].to_pandas() + pd_result = scalars_pandas_df.rename(columns=col_name_dict)["int64_col"] + pd.testing.assert_index_equal(bf_result.columns, pd_result.columns) + + +@pytest.mark.parametrize( + ("indices", "axis"), + [ + ([1, 3, 5], 0), + ([2, 4, 6], 1), + ([1, -3, -5, -6], "index"), + ([-2, -4, -6], "columns"), + ], +) +def test_take_df(scalars_dfs, indices, axis): + scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = scalars_df.take(indices, axis=axis).to_pandas() + pd_result = scalars_pandas_df.take(indices, axis=axis) + + assert_pandas_df_equal(bf_result, pd_result) + + +def test_filter_df(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + bf_bool_series = scalars_df["bool_col"] + bf_result = scalars_df[bf_bool_series].to_pandas() + + pd_bool_series = scalars_pandas_df["bool_col"] + pd_result = scalars_pandas_df[pd_bool_series] + + assert_pandas_df_equal(bf_result, pd_result) + + +def test_assign_new_column(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + kwargs = {"new_col": 2} + df = scalars_df.assign(**kwargs) + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.assign(**kwargs) + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["new_col"] = pd_result["new_col"].astype("Int64") + + assert_pandas_df_equal(bf_result, pd_result) + + +def test_assign_new_column_w_loc(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df.loc[:, "new_col"] = 2 + pd_df.loc[:, "new_col"] = 2 + bf_result = bf_df.to_pandas() + pd_result = pd_df + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["new_col"] = pd_result["new_col"].astype("Int64") + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + ("scalar",), + [ + (2.1,), + (None,), + ], +) +def test_assign_new_column_w_setitem(scalars_dfs, scalar): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df["new_col"] = scalar + pd_df["new_col"] = scalar + bf_result = bf_df.to_pandas() + pd_result = pd_df + + # Convert default pandas dtypes `float64` to match BigQuery DataFrames dtypes. 
+ pd_result["new_col"] = pd_result["new_col"].astype("Float64") + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +def test_assign_new_column_w_setitem_dataframe(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df["int64_col"] = bf_df["int64_too"].to_frame() + pd_df["int64_col"] = pd_df["int64_too"].to_frame() + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_df["int64_col"] = pd_df["int64_col"].astype("Int64") + + pd.testing.assert_frame_equal(bf_df.to_pandas(), pd_df) + + +def test_assign_new_column_w_setitem_dataframe_error(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + + with pytest.raises(ValueError): + bf_df["impossible_col"] = bf_df[["int64_too", "string_col"]] + with pytest.raises(ValueError): + pd_df["impossible_col"] = pd_df[["int64_too", "string_col"]] + + +def test_assign_new_column_w_setitem_list(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df["new_col"] = [9, 8, 7, 6, 5, 4, 3, 2, 1] + pd_df["new_col"] = [9, 8, 7, 6, 5, 4, 3, 2, 1] + bf_result = bf_df.to_pandas() + pd_result = pd_df + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["new_col"] = pd_result["new_col"].astype("Int64") + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +def test_assign_new_column_w_setitem_list_repeated(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df["new_col"] = [9, 8, 7, 6, 5, 4, 3, 2, 1] + pd_df["new_col"] = [9, 8, 7, 6, 5, 4, 3, 2, 1] + bf_df["new_col_2"] = [1, 3, 2, 5, 4, 7, 6, 9, 8] + pd_df["new_col_2"] = [1, 3, 2, 5, 4, 7, 6, 9, 8] + bf_result = bf_df.to_pandas() + pd_result = pd_df + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["new_col"] = pd_result["new_col"].astype("Int64") + pd_result["new_col_2"] = pd_result["new_col_2"].astype("Int64") + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +def test_assign_new_column_w_setitem_list_custom_index(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + + # set the custom index + pd_df = pd_df.set_index(["string_col", "int64_col"]) + bf_df = bf_df.set_index(["string_col", "int64_col"]) + + bf_df["new_col"] = [9, 8, 7, 6, 5, 4, 3, 2, 1] + pd_df["new_col"] = [9, 8, 7, 6, 5, 4, 3, 2, 1] + bf_result = bf_df.to_pandas() + pd_result = pd_df + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["new_col"] = pd_result["new_col"].astype("Int64") + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +def test_assign_new_column_w_setitem_list_error(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + + with pytest.raises(ValueError): + pd_df["new_col"] = [1, 2, 3] # should be len 9, is 3 + with pytest.raises(ValueError): + bf_df["new_col"] = [1, 2, 3] + + +def test_assign_existing_column(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + kwargs = {"int64_col": 2} + df = scalars_df.assign(**kwargs) + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.assign(**kwargs) + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. 
+ pd_result["int64_col"] = pd_result["int64_col"].astype("Int64") + + assert_pandas_df_equal(bf_result, pd_result) + + +def test_assign_listlike_to_empty_df(session): + empty_df = dataframe.DataFrame(session=session) + empty_pandas_df = pd.DataFrame() + + bf_result = empty_df.assign(new_col=[1, 2, 3]) + pd_result = empty_pandas_df.assign(new_col=[1, 2, 3]) + + pd_result["new_col"] = pd_result["new_col"].astype("Int64") + pd_result.index = pd_result.index.astype("Int64") + assert_pandas_df_equal(bf_result.to_pandas(), pd_result) + + +def test_assign_to_empty_df_multiindex_error(session): + empty_df = dataframe.DataFrame(session=session) + empty_pandas_df = pd.DataFrame() + + empty_df["empty_col_1"] = typing.cast(series.Series, []) + empty_df["empty_col_2"] = typing.cast(series.Series, []) + empty_pandas_df["empty_col_1"] = [] + empty_pandas_df["empty_col_2"] = [] + empty_df = empty_df.set_index(["empty_col_1", "empty_col_2"]) + empty_pandas_df = empty_pandas_df.set_index(["empty_col_1", "empty_col_2"]) + + with pytest.raises(ValueError): + empty_df.assign(new_col=[1, 2, 3, 4, 5, 6, 7, 8, 9]) + with pytest.raises(ValueError): + empty_pandas_df.assign(new_col=[1, 2, 3, 4, 5, 6, 7, 8, 9]) + + +@pytest.mark.parametrize( + ("ordered"), + [ + (True), + (False), + ], +) +def test_assign_series(scalars_dfs, ordered): + scalars_df, scalars_pandas_df = scalars_dfs + column_name = "int64_col" + df = scalars_df.assign(new_col=scalars_df[column_name]) + bf_result = df.to_pandas(ordered=ordered) + pd_result = scalars_pandas_df.assign(new_col=scalars_pandas_df[column_name]) + + assert_pandas_df_equal(bf_result, pd_result, ignore_order=not ordered) + + +def test_assign_series_overwrite(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + column_name = "int64_col" + df = scalars_df.assign(**{column_name: scalars_df[column_name] + 3}) + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.assign( + **{column_name: scalars_pandas_df[column_name] + 3} + ) + + assert_pandas_df_equal(bf_result, pd_result) + + +def test_assign_sequential(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + kwargs = {"int64_col": 2, "new_col": 3, "new_col2": 4} + df = scalars_df.assign(**kwargs) + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.assign(**kwargs) + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["int64_col"] = pd_result["int64_col"].astype("Int64") + pd_result["new_col"] = pd_result["new_col"].astype("Int64") + pd_result["new_col2"] = pd_result["new_col2"].astype("Int64") + + assert_pandas_df_equal(bf_result, pd_result) + + +# Require an index so that the self-join is consistent each time. 
+def test_assign_same_table_different_index_performs_self_join( + scalars_df_index, scalars_pandas_df_index +): + column_name = "int64_col" + bf_df = scalars_df_index.assign( + alternative_index=scalars_df_index["rowindex_2"] + 2 + ) + pd_df = scalars_pandas_df_index.assign( + alternative_index=scalars_pandas_df_index["rowindex_2"] + 2 + ) + bf_df_2 = bf_df.set_index("alternative_index") + pd_df_2 = pd_df.set_index("alternative_index") + bf_result = bf_df.assign(new_col=bf_df_2[column_name] * 10).to_pandas() + pd_result = pd_df.assign(new_col=pd_df_2[column_name] * 10) + + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +# Different table expression must have Index +def test_assign_different_df( + scalars_df_index, scalars_df_2_index, scalars_pandas_df_index +): + column_name = "int64_col" + df = scalars_df_index.assign(new_col=scalars_df_2_index[column_name]) + bf_result = df.to_pandas() + # Doesn't matter to pandas if it comes from the same DF or a different DF. + pd_result = scalars_pandas_df_index.assign( + new_col=scalars_pandas_df_index[column_name] + ) + + assert_pandas_df_equal(bf_result, pd_result) + + +def test_assign_different_df_w_loc( + scalars_df_index, scalars_df_2_index, scalars_pandas_df_index +): + bf_df = scalars_df_index.copy() + bf_df2 = scalars_df_2_index.copy() + pd_df = scalars_pandas_df_index.copy() + assert "int64_col" in bf_df.columns + assert "int64_col" in pd_df.columns + bf_df.loc[:, "int64_col"] = bf_df2.loc[:, "int64_col"] + 1 + pd_df.loc[:, "int64_col"] = pd_df.loc[:, "int64_col"] + 1 + bf_result = bf_df.to_pandas() + pd_result = pd_df + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["int64_col"] = pd_result["int64_col"].astype("Int64") + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +def test_assign_different_df_w_setitem( + scalars_df_index, scalars_df_2_index, scalars_pandas_df_index +): + bf_df = scalars_df_index.copy() + bf_df2 = scalars_df_2_index.copy() + pd_df = scalars_pandas_df_index.copy() + assert "int64_col" in bf_df.columns + assert "int64_col" in pd_df.columns + bf_df["int64_col"] = bf_df2["int64_col"] + 1 + pd_df["int64_col"] = pd_df["int64_col"] + 1 + bf_result = bf_df.to_pandas() + pd_result = pd_df + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result["int64_col"] = pd_result["int64_col"].astype("Int64") + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +def test_assign_callable_lambda(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + kwargs = {"new_col": lambda x: x["int64_col"] + x["int64_too"]} + df = scalars_df.assign(**kwargs) + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.assign(**kwargs) + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. 
+ pd_result["new_col"] = pd_result["new_col"].astype("Int64") + + assert_pandas_df_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + ("axis", "how", "ignore_index", "subset"), + [ + (0, "any", False, None), + (0, "any", True, None), + (0, "all", False, ["bool_col", "time_col"]), + (0, "any", False, ["bool_col", "time_col"]), + (0, "all", False, "time_col"), + (1, "any", False, None), + (1, "all", False, None), + ], +) +def test_df_dropna(scalars_dfs, axis, how, ignore_index, subset): + # TODO: supply a reason why this isn't compatible with pandas 1.x + pytest.importorskip("pandas", minversion="2.0.0") + scalars_df, scalars_pandas_df = scalars_dfs + df = scalars_df.dropna(axis=axis, how=how, ignore_index=ignore_index, subset=subset) + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.dropna( + axis=axis, how=how, ignore_index=ignore_index, subset=subset + ) + + # Pandas uses int64 instead of Int64 (nullable) dtype. + pd_result.index = pd_result.index.astype(pd.Int64Dtype()) + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_df_dropna_range_columns(scalars_dfs): + # TODO: supply a reason why this isn't compatible with pandas 1.x + pytest.importorskip("pandas", minversion="2.0.0") + scalars_df, scalars_pandas_df = scalars_dfs + scalars_df = scalars_df.copy() + scalars_pandas_df = scalars_pandas_df.copy() + scalars_df.columns = pandas.RangeIndex(0, len(scalars_df.columns)) + scalars_pandas_df.columns = pandas.RangeIndex(0, len(scalars_pandas_df.columns)) + + df = scalars_df.dropna() + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.dropna() + + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_df_interpolate(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + columns = ["int64_col", "int64_too", "float64_col"] + bf_result = scalars_df[columns].interpolate().to_pandas() + # Pandas can only interpolate on "float64" columns + # https://github.com/pandas-dev/pandas/issues/40252 + pd_result = scalars_pandas_df[columns].astype("float64").interpolate() + + pandas.testing.assert_frame_equal( + bf_result, + pd_result, + check_index_type=False, + check_dtype=False, + ) + + +@pytest.mark.parametrize( + "col, fill_value", + [ + (["int64_col", "float64_col"], 3), + (["string_col"], "A"), + (["datetime_col"], pd.Timestamp("2023-01-01")), + ], +) +def test_df_fillna(scalars_dfs, col, fill_value): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[col].fillna(fill_value).to_pandas() + pd_result = scalars_pandas_df[col].fillna(fill_value) + + pd.testing.assert_frame_equal(bf_result, pd_result, check_dtype=False) + + +def test_df_ffill(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[["int64_col", "float64_col"]].ffill(limit=1).to_pandas() + pd_result = scalars_pandas_df[["int64_col", "float64_col"]].ffill(limit=1) + + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_df_bfill(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[["int64_col", "float64_col"]].bfill().to_pandas() + pd_result = scalars_pandas_df[["int64_col", "float64_col"]].bfill() + + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_apply_series_series_callable( + scalars_df_index, + scalars_pandas_df_index, +): + columns = ["int64_too", "int64_col"] + + def foo(series, arg1, arg2, *, kwarg1=0, kwarg2=0): + return series**2 + (arg1 * arg2 % 4) + (kwarg1 * kwarg2 % 7) + + bf_result = ( + scalars_df_index[columns] + .apply(foo, args=(33, 
61), kwarg1=52, kwarg2=21) + .to_pandas() + ) + + pd_result = scalars_pandas_df_index[columns].apply( + foo, args=(33, 61), kwarg1=52, kwarg2=21 + ) + + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_apply_series_listlike_callable( + scalars_df_index, + scalars_pandas_df_index, +): + columns = ["int64_too", "int64_col"] + bf_result = ( + scalars_df_index[columns].apply(lambda x: [len(x), x.min(), 24]).to_pandas() + ) + + pd_result = scalars_pandas_df_index[columns].apply(lambda x: [len(x), x.min(), 24]) + + # Convert default pandas dtypes `int64` to match BigQuery DataFrames dtypes. + pd_result.index = pd_result.index.astype("Int64") + pd_result = pd_result.astype("Int64") + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_apply_series_scalar_callable( + scalars_df_index, + scalars_pandas_df_index, +): + columns = ["int64_too", "int64_col"] + bf_result = scalars_df_index[columns].apply(lambda x: x.sum()) + + pd_result = scalars_pandas_df_index[columns].apply(lambda x: x.sum()) + + pandas.testing.assert_series_equal(bf_result, pd_result) + + +def test_df_pipe( + scalars_df_index, + scalars_pandas_df_index, +): + columns = ["int64_too", "int64_col"] + + def foo(x: int, y: int, df): + return (df + x) % y + + bf_result = ( + scalars_df_index[columns] + .pipe((foo, "df"), x=7, y=9) + .pipe(lambda x: x**2) + .to_pandas() + ) + + pd_result = ( + scalars_pandas_df_index[columns] + .pipe((foo, "df"), x=7, y=9) + .pipe(lambda x: x**2) + ) + + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_df_keys( + scalars_df_index, + scalars_pandas_df_index, +): + pandas.testing.assert_index_equal( + scalars_df_index.keys(), scalars_pandas_df_index.keys() + ) + + +def test_df_iter( + scalars_df_index, + scalars_pandas_df_index, +): + for bf_i, df_i in zip(scalars_df_index, scalars_pandas_df_index): + assert bf_i == df_i + + +def test_iterrows( + scalars_df_index, + scalars_pandas_df_index, +): + # TODO: supply a reason why this isn't compatible with pandas 1.x + pytest.importorskip("pandas", minversion="2.0.0") + scalars_df_index = scalars_df_index.add_suffix("_suffix", axis=1) + scalars_pandas_df_index = scalars_pandas_df_index.add_suffix("_suffix", axis=1) + for (bf_index, bf_series), (pd_index, pd_series) in zip( + scalars_df_index.iterrows(), scalars_pandas_df_index.iterrows() + ): + assert bf_index == pd_index + pandas.testing.assert_series_equal(bf_series, pd_series) + + +@pytest.mark.parametrize( + ( + "index", + "name", + ), + [ + ( + True, + "my_df", + ), + (False, None), + ], +) +def test_itertuples(scalars_df_index, index, name): + # Numeric has slightly different representation as a result of conversions. + bf_tuples = scalars_df_index.itertuples(index, name) + pd_tuples = scalars_df_index.to_pandas().itertuples(index, name) + for bf_tuple, pd_tuple in zip(bf_tuples, pd_tuples): + assert bf_tuple == pd_tuple + + +def test_df_cross_merge(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + left_columns = ["int64_col", "float64_col", "rowindex_2"] + right_columns = ["int64_col", "bool_col", "string_col", "rowindex_2"] + + left = scalars_df[left_columns] + # Offset the rows somewhat so that outer join can have an effect. 
+ right = scalars_df[right_columns].assign(rowindex_2=scalars_df["rowindex_2"] + 2) + + bf_result = left.merge(right, "cross").to_pandas() + + pd_result = scalars_pandas_df[left_columns].merge( + scalars_pandas_df[right_columns].assign( + rowindex_2=scalars_pandas_df["rowindex_2"] + 2 + ), + "cross", + ) + pd.testing.assert_frame_equal(bf_result, pd_result, check_index_type=False) + + +@pytest.mark.parametrize( + ("merge_how",), + [ + ("inner",), + ("outer",), + ("left",), + ("right",), + ], +) +def test_df_merge(scalars_dfs, merge_how): + scalars_df, scalars_pandas_df = scalars_dfs + on = "rowindex_2" + left_columns = ["int64_col", "float64_col", "rowindex_2"] + right_columns = ["int64_col", "bool_col", "string_col", "rowindex_2"] + + left = scalars_df[left_columns] + # Offset the rows somewhat so that outer join can have an effect. + right = scalars_df[right_columns].assign(rowindex_2=scalars_df["rowindex_2"] + 2) + + df = left.merge(right, merge_how, on, sort=True) + bf_result = df.to_pandas() + + pd_result = scalars_pandas_df[left_columns].merge( + scalars_pandas_df[right_columns].assign( + rowindex_2=scalars_pandas_df["rowindex_2"] + 2 + ), + merge_how, + on, + sort=True, + ) + + assert_pandas_df_equal( + bf_result, pd_result, ignore_order=True, check_index_type=False + ) + + +@pytest.mark.parametrize( + ("left_on", "right_on"), + [ + (["int64_col", "rowindex_2"], ["int64_col", "rowindex_2"]), + (["rowindex_2", "int64_col"], ["int64_col", "rowindex_2"]), + # Polars engine is currently strict on join key types + # (["rowindex_2", "float64_col"], ["int64_col", "rowindex_2"]), + ], +) +def test_df_merge_multi_key(scalars_dfs, left_on, right_on): + scalars_df, scalars_pandas_df = scalars_dfs + left_columns = ["int64_col", "float64_col", "rowindex_2"] + right_columns = ["int64_col", "bool_col", "string_col", "rowindex_2"] + + left = scalars_df[left_columns] + # Offset the rows somewhat so that outer join can have an effect. 
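+    # (The +2 shift leaves some keys unmatched on each side, so an outer join
+    # keeps rows that an inner join would drop.)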
+ right = scalars_df[right_columns].assign(rowindex_2=scalars_df["rowindex_2"] + 2) + + df = left.merge(right, "outer", left_on=left_on, right_on=right_on, sort=True) + bf_result = df.to_pandas() + + pd_result = scalars_pandas_df[left_columns].merge( + scalars_pandas_df[right_columns].assign( + rowindex_2=scalars_pandas_df["rowindex_2"] + 2 + ), + "outer", + left_on=left_on, + right_on=right_on, + sort=True, + ) + + assert_pandas_df_equal( + bf_result, pd_result, ignore_order=True, check_index_type=False + ) + + +@pytest.mark.parametrize( + ("merge_how",), + [ + ("inner",), + ("outer",), + ("left",), + ("right",), + ], +) +def test_merge_custom_col_name(scalars_dfs, merge_how): + scalars_df, scalars_pandas_df = scalars_dfs + left_columns = ["int64_col", "float64_col"] + right_columns = ["int64_col", "bool_col", "string_col"] + on = "int64_col" + rename_columns = {"float64_col": "f64_col"} + + left = scalars_df[left_columns] + left = left.rename(columns=rename_columns) + right = scalars_df[right_columns] + df = left.merge(right, merge_how, on, sort=True) + bf_result = df.to_pandas() + + pandas_left_df = scalars_pandas_df[left_columns] + pandas_left_df = pandas_left_df.rename(columns=rename_columns) + pandas_right_df = scalars_pandas_df[right_columns] + pd_result = pandas_left_df.merge(pandas_right_df, merge_how, on, sort=True) + + assert_pandas_df_equal( + bf_result, pd_result, ignore_order=True, check_index_type=False + ) + + +@pytest.mark.parametrize( + ("merge_how",), + [ + ("inner",), + ("outer",), + ("left",), + ("right",), + ], +) +def test_merge_left_on_right_on(scalars_dfs, merge_how): + scalars_df, scalars_pandas_df = scalars_dfs + left_columns = ["int64_col", "float64_col", "int64_too"] + right_columns = ["int64_col", "bool_col", "string_col", "rowindex_2"] + + left = scalars_df[left_columns] + right = scalars_df[right_columns] + + df = left.merge( + right, merge_how, left_on="int64_too", right_on="rowindex_2", sort=True + ) + bf_result = df.to_pandas() + + pd_result = scalars_pandas_df[left_columns].merge( + scalars_pandas_df[right_columns], + merge_how, + left_on="int64_too", + right_on="rowindex_2", + sort=True, + ) + + assert_pandas_df_equal( + bf_result, pd_result, ignore_order=True, check_index_type=False + ) + + +def test_shape(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df.shape + pd_result = scalars_pandas_df.shape + + assert bf_result == pd_result + + +def test_len(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = len(scalars_df) + pd_result = len(scalars_pandas_df) + + assert bf_result == pd_result + + +@pytest.mark.parametrize( + ("n_rows",), + [ + (50,), + (10000,), + ], +) +def test_df_len_local(session, n_rows): + assert ( + len( + session.read_pandas( + pd.DataFrame(np.random.randint(1, 7, n_rows), columns=["one"]), + ) + ) + == n_rows + ) + + +def test_size(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df.size + pd_result = scalars_pandas_df.size + + assert bf_result == pd_result + + +def test_ndim(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df.ndim + pd_result = scalars_pandas_df.ndim + + assert bf_result == pd_result + + +def test_empty_false(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = scalars_df.empty + pd_result = scalars_pandas_df.empty + + assert bf_result == pd_result + + +def test_empty_true_column_filter(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = 
scalars_df[[]].empty + pd_result = scalars_pandas_df[[]].empty + + assert bf_result == pd_result + + +def test_empty_true_row_filter(scalars_dfs: Tuple[dataframe.DataFrame, pd.DataFrame]): + scalars_df, scalars_pandas_df = scalars_dfs + bf_bool: series.Series = typing.cast(series.Series, scalars_df["bool_col"]) + pd_bool: pd.Series = scalars_pandas_df["bool_col"] + bf_false = bf_bool.notna() & (bf_bool != bf_bool) + pd_false = pd_bool.notna() & (pd_bool != pd_bool) + + bf_result = scalars_df[bf_false].empty + pd_result = scalars_pandas_df[pd_false].empty + + assert pd_result + assert bf_result == pd_result + + +def test_empty_true_memtable(session: bigframes.Session): + bf_df = dataframe.DataFrame(session=session) + pd_df = pd.DataFrame() + + bf_result = bf_df.empty + pd_result = pd_df.empty + + assert pd_result + assert bf_result == pd_result + + +@pytest.mark.parametrize( + ("drop",), + ((True,), (False,)), +) +def test_reset_index(scalars_df_index, scalars_pandas_df_index, drop): + df = scalars_df_index.reset_index(drop=drop) + assert df.index.name is None + + bf_result = df.to_pandas() + pd_result = scalars_pandas_df_index.reset_index(drop=drop) + + # Pandas uses int64 instead of Int64 (nullable) dtype. + pd_result.index = pd_result.index.astype(pd.Int64Dtype()) + + # reset_index should maintain the original ordering. + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_reset_index_then_filter( + scalars_df_index, + scalars_pandas_df_index, +): + bf_filter = scalars_df_index["bool_col"].fillna(True) + bf_df = scalars_df_index.reset_index()[bf_filter] + bf_result = bf_df.to_pandas() + pd_filter = scalars_pandas_df_index["bool_col"].fillna(True) + pd_result = scalars_pandas_df_index.reset_index()[pd_filter] + + # Pandas uses int64 instead of Int64 (nullable) dtype. + pd_result.index = pd_result.index.astype(pd.Int64Dtype()) + + # reset_index should maintain the original ordering and index keys + # post-filter will have gaps. + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_reset_index_with_unnamed_index( + scalars_df_index, + scalars_pandas_df_index, +): + scalars_df_index = scalars_df_index.copy() + scalars_pandas_df_index = scalars_pandas_df_index.copy() + + scalars_df_index.index.name = None + scalars_pandas_df_index.index.name = None + df = scalars_df_index.reset_index(drop=False) + assert df.index.name is None + + # reset_index(drop=False) creates a new column "index". + assert df.columns[0] == "index" + + bf_result = df.to_pandas() + pd_result = scalars_pandas_df_index.reset_index(drop=False) + + # Pandas uses int64 instead of Int64 (nullable) dtype. + pd_result.index = pd_result.index.astype(pd.Int64Dtype()) + + # reset_index should maintain the original ordering. 
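+    # (In ordered mode, BigQuery DataFrames tracks a total row ordering, which
+    # is what allows reset_index to preserve the original order.)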
+ pandas.testing.assert_frame_equal(bf_result, pd_result) + + +def test_reset_index_with_unnamed_multiindex( + scalars_df_index, + scalars_pandas_df_index, +): + bf_df = dataframe.DataFrame( + ([1, 2, 3], [2, 5, 7]), + index=pd.MultiIndex.from_tuples([("a", "aa"), ("a", "aa")]), + ) + pd_df = pd.DataFrame( + ([1, 2, 3], [2, 5, 7]), + index=pd.MultiIndex.from_tuples([("a", "aa"), ("a", "aa")]), + ) + + bf_df = bf_df.reset_index() + pd_df = pd_df.reset_index() + + assert pd_df.columns[0] == "level_0" + assert bf_df.columns[0] == "level_0" + assert pd_df.columns[1] == "level_1" + assert bf_df.columns[1] == "level_1" + + +def test_reset_index_with_unnamed_index_and_index_column( + scalars_df_index, + scalars_pandas_df_index, +): + scalars_df_index = scalars_df_index.copy() + scalars_pandas_df_index = scalars_pandas_df_index.copy() + + scalars_df_index.index.name = None + scalars_pandas_df_index.index.name = None + df = scalars_df_index.assign(index=scalars_df_index["int64_col"]).reset_index( + drop=False + ) + assert df.index.name is None + + # reset_index(drop=False) creates a new column "level_0" if the "index" column already exists. + assert df.columns[0] == "level_0" + + bf_result = df.to_pandas() + pd_result = scalars_pandas_df_index.assign( + index=scalars_pandas_df_index["int64_col"] + ).reset_index(drop=False) + + # Pandas uses int64 instead of Int64 (nullable) dtype. + pd_result.index = pd_result.index.astype(pd.Int64Dtype()) + + # reset_index should maintain the original ordering. + pandas.testing.assert_frame_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + ("drop",), + ( + (True,), + (False,), + ), +) +@pytest.mark.parametrize( + ("append",), + ( + (True,), + (False,), + ), +) +@pytest.mark.parametrize( + ("index_column",), + (("int64_too",), ("string_col",), ("timestamp_col",)), +) +def test_set_index(scalars_dfs, index_column, drop, append): + scalars_df, scalars_pandas_df = scalars_dfs + df = scalars_df.set_index(index_column, append=append, drop=drop) + bf_result = df.to_pandas() + pd_result = scalars_pandas_df.set_index(index_column, append=append, drop=drop) + + # Sort to disambiguate when there are duplicate index labels. + # Note: Doesn't use assert_pandas_df_equal_ignore_ordering because we get + # "ValueError: 'timestamp_col' is both an index level and a column label, + # which is ambiguous" when trying to sort by a column with the same name as + # the index. 
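+    # Sorting by an ordinary column sidesteps that ambiguity while still giving
+    # both frames the same deterministic row order.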
+    bf_result = bf_result.sort_values("rowindex_2")
+    pd_result = pd_result.sort_values("rowindex_2")
+
+    pandas.testing.assert_frame_equal(bf_result, pd_result)
+
+
+def test_set_index_key_error(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    with pytest.raises(KeyError):
+        scalars_pandas_df.set_index(["not_a_col"])
+    with pytest.raises(KeyError):
+        scalars_df.set_index(["not_a_col"])
+
+
+@pytest.mark.parametrize(
+    ("ascending",),
+    ((True,), (False,)),
+)
+@pytest.mark.parametrize(
+    ("na_position",),
+    (("first",), ("last",)),
+)
+def test_sort_index(scalars_dfs, ascending, na_position):
+    index_column = "int64_col"
+    scalars_df, scalars_pandas_df = scalars_dfs
+    df = scalars_df.set_index(index_column)
+    bf_result = df.sort_index(ascending=ascending, na_position=na_position).to_pandas()
+    pd_result = scalars_pandas_df.set_index(index_column).sort_index(
+        ascending=ascending, na_position=na_position
+    )
+    pandas.testing.assert_frame_equal(bf_result, pd_result)
+
+
+def test_dataframe_sort_index_inplace(scalars_dfs):
+    index_column = "int64_col"
+    scalars_df, scalars_pandas_df = scalars_dfs
+    df = scalars_df.copy().set_index(index_column)
+    df.sort_index(ascending=False, inplace=True)
+    bf_result = df.to_pandas()
+
+    pd_result = scalars_pandas_df.set_index(index_column).sort_index(ascending=False)
+    pandas.testing.assert_frame_equal(bf_result, pd_result)
+
+
+def test_df_abs(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    columns = ["int64_col", "int64_too", "float64_col"]
+
+    bf_result = scalars_df[columns].abs()
+    pd_result = scalars_pandas_df[columns].abs()
+
+    assert_dfs_equivalent(pd_result, bf_result)
+
+
+def test_df_pos(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    bf_result = (+scalars_df[["int64_col", "numeric_col"]]).to_pandas()
+    pd_result = +scalars_pandas_df[["int64_col", "numeric_col"]]
+
+    assert_pandas_df_equal(pd_result, bf_result)
+
+
+def test_df_neg(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    bf_result = (-scalars_df[["int64_col", "numeric_col"]]).to_pandas()
+    pd_result = -scalars_pandas_df[["int64_col", "numeric_col"]]
+
+    assert_pandas_df_equal(pd_result, bf_result)
+
+
+def test_df_invert(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    columns = ["int64_col", "bool_col"]
+
+    bf_result = (~scalars_df[columns]).to_pandas()
+    pd_result = ~scalars_pandas_df[columns]
+
+    assert_pandas_df_equal(bf_result, pd_result)
+
+
+def test_df_isnull(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+
+    columns = ["int64_col", "int64_too", "string_col", "bool_col"]
+    bf_result = scalars_df[columns].isnull().to_pandas()
+    pd_result = scalars_pandas_df[columns].isnull()
+
+    # One of the dtype mismatches to be documented. Here, the `bf_result.dtype` is
+    # `BooleanDtype` but the `pd_result.dtype` is `bool`.
+    pd_result["int64_col"] = pd_result["int64_col"].astype(pd.BooleanDtype())
+    pd_result["int64_too"] = pd_result["int64_too"].astype(pd.BooleanDtype())
+    pd_result["string_col"] = pd_result["string_col"].astype(pd.BooleanDtype())
+    pd_result["bool_col"] = pd_result["bool_col"].astype(pd.BooleanDtype())
+
+    assert_pandas_df_equal(bf_result, pd_result)
+
+
+def test_df_notnull(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+
+    columns = ["int64_col", "int64_too", "string_col", "bool_col"]
+    bf_result = scalars_df[columns].notnull().to_pandas()
+    pd_result = scalars_pandas_df[columns].notnull()
+
+    # One of the dtype mismatches to be documented. 
Here, the `bf_result.dtype` is + # `BooleanDtype` but the `pd_result.dtype` is `bool`. + pd_result["int64_col"] = pd_result["int64_col"].astype(pd.BooleanDtype()) + pd_result["int64_too"] = pd_result["int64_too"].astype(pd.BooleanDtype()) + pd_result["string_col"] = pd_result["string_col"].astype(pd.BooleanDtype()) + pd_result["bool_col"] = pd_result["bool_col"].astype(pd.BooleanDtype()) + + assert_pandas_df_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + ("left_labels", "right_labels", "overwrite", "fill_value"), + [ + (["a", "b", "c"], ["c", "a", "b"], True, None), + (["a", "b", "c"], ["c", "a", "b"], False, None), + (["a", "b", "c"], ["a", "b", "c"], False, 2), + ], + ids=[ + "one_one_match_overwrite", + "one_one_match_no_overwrite", + "exact_match", + ], +) +def test_combine( + scalars_df_index, + scalars_df_2_index, + scalars_pandas_df_index, + left_labels, + right_labels, + overwrite, + fill_value, +): + if pd.__version__.startswith("1."): + pytest.skip("pd.NA vs NaN not handled well in pandas 1.x.") + columns = ["int64_too", "int64_col", "float64_col"] + + bf_df_a = scalars_df_index[columns] + bf_df_a.columns = left_labels + bf_df_b = scalars_df_2_index[columns] + bf_df_b.columns = right_labels + bf_result = bf_df_a.combine( + bf_df_b, + lambda x, y: x**2 + 2 * x * y + y**2, + overwrite=overwrite, + fill_value=fill_value, + ).to_pandas() + + pd_df_a = scalars_pandas_df_index[columns] + pd_df_a.columns = left_labels + pd_df_b = scalars_pandas_df_index[columns] + pd_df_b.columns = right_labels + pd_result = pd_df_a.combine( + pd_df_b, + lambda x, y: x**2 + 2 * x * y + y**2, + overwrite=overwrite, + fill_value=fill_value, + ) + + # Some dtype inconsistency for all-NULL columns + pd.testing.assert_frame_equal(bf_result, pd_result, check_dtype=False) + + +@pytest.mark.parametrize( + ("overwrite", "filter_func"), + [ + (True, None), + (False, None), + (True, lambda x: x.isna() | (x % 2 == 0)), + ], + ids=[ + "default", + "overwritefalse", + "customfilter", + ], +) +def test_df_update(overwrite, filter_func): + if pd.__version__.startswith("1."): + pytest.skip("dtype handled differently in pandas 1.x.") + + index1: pandas.Index = pandas.Index([1, 2, 3, 4], dtype="Int64") + + index2: pandas.Index = pandas.Index([1, 2, 4, 5], dtype="Int64") + pd_df1 = pandas.DataFrame( + {"a": [1, None, 3, 4], "b": [5, 6, None, 8]}, dtype="Int64", index=index1 + ) + pd_df2 = pandas.DataFrame( + {"a": [None, 20, 30, 40], "c": [90, None, 110, 120]}, + dtype="Int64", + index=index2, + ) + + bf_df1 = dataframe.DataFrame(pd_df1) + bf_df2 = dataframe.DataFrame(pd_df2) + + bf_df1.update(bf_df2, overwrite=overwrite, filter_func=filter_func) + pd_df1.update(pd_df2, overwrite=overwrite, filter_func=filter_func) + + pd.testing.assert_frame_equal(bf_df1.to_pandas(), pd_df1) + + +def test_df_idxmin(): + pd_df = pd.DataFrame( + {"a": [1, 2, 3], "b": [7, None, 3], "c": [4, 4, 4]}, index=["x", "y", "z"] + ) + bf_df = dataframe.DataFrame(pd_df) + + bf_result = bf_df.idxmin().to_pandas() + pd_result = pd_df.idxmin() + + pd.testing.assert_series_equal( + bf_result, pd_result, check_index_type=False, check_dtype=False + ) + + +def test_df_idxmax(): + pd_df = pd.DataFrame( + {"a": [1, 2, 3], "b": [7, None, 3], "c": [4, 4, 4]}, index=["x", "y", "z"] + ) + bf_df = dataframe.DataFrame(pd_df) + + bf_result = bf_df.idxmax().to_pandas() + pd_result = pd_df.idxmax() + + pd.testing.assert_series_equal( + bf_result, pd_result, check_index_type=False, check_dtype=False + ) + + +@pytest.mark.parametrize( + ("join", "axis"), + 
[
+        ("outer", None),
+        ("outer", 0),
+        ("outer", 1),
+        ("left", 0),
+        ("right", 1),
+        ("inner", None),
+        ("inner", 1),
+    ],
+)
+def test_df_align(join, axis):
+
+    index1: pandas.Index = pandas.Index([1, 2, 3, 4], dtype="Int64")
+
+    index2: pandas.Index = pandas.Index([1, 2, 4, 5], dtype="Int64")
+    pd_df1 = pandas.DataFrame(
+        {"a": [1, None, 3, 4], "b": [5, 6, None, 8]}, dtype="Int64", index=index1
+    )
+    pd_df2 = pandas.DataFrame(
+        {"a": [None, 20, 30, 40], "c": [90, None, 110, 120]},
+        dtype="Int64",
+        index=index2,
+    )
+
+    bf_df1 = dataframe.DataFrame(pd_df1)
+    bf_df2 = dataframe.DataFrame(pd_df2)
+
+    bf_result1, bf_result2 = bf_df1.align(bf_df2, join=join, axis=axis)
+    pd_result1, pd_result2 = pd_df1.align(pd_df2, join=join, axis=axis)
+
+    # Don't check dtype as pandas does unnecessary float conversion
+    assert isinstance(bf_result1, dataframe.DataFrame) and isinstance(
+        bf_result2, dataframe.DataFrame
+    )
+    pd.testing.assert_frame_equal(bf_result1.to_pandas(), pd_result1, check_dtype=False)
+    pd.testing.assert_frame_equal(bf_result2.to_pandas(), pd_result2, check_dtype=False)
+
+
+def test_combine_first(
+    scalars_df_index,
+    scalars_df_2_index,
+    scalars_pandas_df_index,
+):
+    if pd.__version__.startswith("1."):
+        pytest.skip("pd.NA vs NaN not handled well in pandas 1.x.")
+    columns = ["int64_too", "int64_col", "float64_col"]
+
+    bf_df_a = scalars_df_index[columns].iloc[0:6]
+    bf_df_a.columns = ["a", "b", "c"]
+    bf_df_b = scalars_df_2_index[columns].iloc[2:8]
+    bf_df_b.columns = ["b", "a", "d"]
+    bf_result = bf_df_a.combine_first(bf_df_b).to_pandas()
+
+    pd_df_a = scalars_pandas_df_index[columns].iloc[0:6]
+    pd_df_a.columns = ["a", "b", "c"]
+    pd_df_b = scalars_pandas_df_index[columns].iloc[2:8]
+    pd_df_b.columns = ["b", "a", "d"]
+    pd_result = pd_df_a.combine_first(pd_df_b)
+
+    # Some dtype inconsistency for all-NULL columns
+    pd.testing.assert_frame_equal(bf_result, pd_result, check_dtype=False)
+
+
+def test_df_corr_w_invalid_parameters(scalars_dfs):
+    columns = ["int64_too", "int64_col", "float64_col"]
+    scalars_df, _ = scalars_dfs
+
+    with pytest.raises(NotImplementedError):
+        scalars_df[columns].corr(method="kendall")
+
+    with pytest.raises(NotImplementedError):
+        scalars_df[columns].corr(min_periods=1)
+
+
+@pytest.mark.parametrize(
+    ("columns", "numeric_only"),
+    [
+        (["bool_col", "int64_col", "float64_col"], True),
+        (["bool_col", "int64_col", "float64_col"], False),
+        (["bool_col", "int64_col", "float64_col", "string_col"], True),
+        pytest.param(
+            ["bool_col", "int64_col", "float64_col", "string_col"],
+            False,
+            marks=pytest.mark.xfail(
+                raises=NotImplementedError,
+            ),
+        ),
+    ],
+)
+def test_cov_w_numeric_only(scalars_dfs, columns, numeric_only):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    bf_result = scalars_df[columns].cov(numeric_only=numeric_only).to_pandas()
+    pd_result = scalars_pandas_df[columns].cov(numeric_only=numeric_only)
+    # BigFrames and Pandas differ in their data type handling:
+    # - Column types: BigFrames uses Float64, Pandas uses float64.
+    # - Index types: BigFrames uses string, Pandas uses object.
+    pd.testing.assert_index_equal(bf_result.columns, pd_result.columns)
+    # Only check row order in ordered mode.
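+    # (check_like=True makes assert_frame_equal ignore index/column ordering
+    # and compare by label instead.)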
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+        check_dtype=False,
+        check_index_type=False,
+        check_like=not scalars_df._block.session._strictly_ordered,
+    )
+
+
+def test_df_corrwith_df(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+
+    l_cols = ["int64_col", "float64_col", "int64_too"]
+    r_cols = ["int64_too", "float64_col"]
+
+    bf_result = scalars_df[l_cols].corrwith(scalars_df[r_cols]).to_pandas()
+    pd_result = scalars_pandas_df[l_cols].corrwith(scalars_pandas_df[r_cols])
+
+    # BigFrames and Pandas differ in their data type handling:
+    # - Column types: BigFrames uses Float64, Pandas uses float64.
+    # - Index types: BigFrames uses string, Pandas uses object.
+    pd.testing.assert_series_equal(
+        bf_result, pd_result, check_dtype=False, check_index_type=False
+    )
+
+
+def test_df_corrwith_df_numeric_only(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+
+    l_cols = ["int64_col", "float64_col", "int64_too", "string_col"]
+    r_cols = ["int64_too", "float64_col", "bool_col"]
+
+    bf_result = (
+        scalars_df[l_cols].corrwith(scalars_df[r_cols], numeric_only=True).to_pandas()
+    )
+    pd_result = scalars_pandas_df[l_cols].corrwith(
+        scalars_pandas_df[r_cols], numeric_only=True
+    )
+
+    # BigFrames and Pandas differ in their data type handling:
+    # - Column types: BigFrames uses Float64, Pandas uses float64.
+    # - Index types: BigFrames uses string, Pandas uses object.
+    pd.testing.assert_series_equal(
+        bf_result, pd_result, check_dtype=False, check_index_type=False
+    )
+
+
+def test_df_corrwith_df_non_numeric_error(scalars_dfs):
+    scalars_df, _ = scalars_dfs
+
+    l_cols = ["int64_col", "float64_col", "int64_too", "string_col"]
+    r_cols = ["int64_too", "float64_col", "bool_col"]
+
+    with pytest.raises(NotImplementedError):
+        scalars_df[l_cols].corrwith(scalars_df[r_cols], numeric_only=False)
+
+
+def test_df_corrwith_series(scalars_dfs):
+    # TODO: supply a reason why this isn't compatible with pandas 1.x
+    pytest.importorskip("pandas", minversion="2.0.0")
+    scalars_df, scalars_pandas_df = scalars_dfs
+
+    l_cols = ["int64_col", "float64_col", "int64_too"]
+    r_col = "float64_col"
+
+    bf_result = scalars_df[l_cols].corrwith(scalars_df[r_col]).to_pandas()
+    pd_result = scalars_pandas_df[l_cols].corrwith(scalars_pandas_df[r_col])
+
+    # BigFrames and Pandas differ in their data type handling:
+    # - Column types: BigFrames uses Float64, Pandas uses float64.
+    # - Index types: BigFrames uses string, Pandas uses object.
+ pd.testing.assert_series_equal( + bf_result, pd_result, check_dtype=False, check_index_type=False + ) + + +@pytest.mark.parametrize( + ("op"), + [ + operator.add, + operator.sub, + operator.mul, + operator.truediv, + # operator.floordiv, + operator.eq, + operator.ne, + operator.gt, + operator.ge, + operator.lt, + operator.le, + ], + ids=[ + "add", + "subtract", + "multiply", + "true_divide", + # "floor_divide", + "eq", + "ne", + "gt", + "ge", + "lt", + "le", + ], +) +# TODO(garrettwu): deal with NA values +@pytest.mark.parametrize(("other_scalar"), [1, 2.5, 0, 0.0]) +@pytest.mark.parametrize(("reverse_operands"), [True, False]) +def test_scalar_binop(scalars_dfs, op, other_scalar, reverse_operands): + scalars_df, scalars_pandas_df = scalars_dfs + columns = ["int64_col", "float64_col"] + + maybe_reversed_op = (lambda x, y: op(y, x)) if reverse_operands else op + + bf_result = maybe_reversed_op(scalars_df[columns], other_scalar).to_pandas() + pd_result = maybe_reversed_op(scalars_pandas_df[columns], other_scalar) + + assert_pandas_df_equal(bf_result, pd_result) + + +@pytest.mark.parametrize(("other_scalar"), [1, -2]) +def test_mod(scalars_dfs, other_scalar): + # Zero case excluded as pandas produces 0 result for Int64 inputs rather than NA/NaN. + # This is likely a pandas bug as mod 0 is undefined in other dtypes, and most programming languages. + scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = (scalars_df[["int64_col", "int64_too"]] % other_scalar).to_pandas() + pd_result = scalars_pandas_df[["int64_col", "int64_too"]] % other_scalar + + assert_pandas_df_equal(bf_result, pd_result) + + +def test_scalar_binop_str_exception(scalars_dfs): + scalars_df, _ = scalars_dfs + columns = ["string_col"] + with pytest.raises(TypeError, match="Cannot add dtypes"): + (scalars_df[columns] + 1).to_pandas() + + +@pytest.mark.parametrize( + ("op"), + [ + (lambda x, y: x.add(y, axis="index")), + (lambda x, y: x.radd(y, axis="index")), + (lambda x, y: x.sub(y, axis="index")), + (lambda x, y: x.rsub(y, axis="index")), + (lambda x, y: x.mul(y, axis="index")), + (lambda x, y: x.rmul(y, axis="index")), + (lambda x, y: x.truediv(y, axis="index")), + (lambda x, y: x.rtruediv(y, axis="index")), + # (lambda x, y: x.floordiv(y, axis="index")), + # (lambda x, y: x.floordiv(y, axis="index")), + (lambda x, y: x.gt(y, axis="index")), + (lambda x, y: x.ge(y, axis="index")), + (lambda x, y: x.lt(y, axis="index")), + (lambda x, y: x.le(y, axis="index")), + ], + ids=[ + "add", + "radd", + "sub", + "rsub", + "mul", + "rmul", + "truediv", + "rtruediv", + # "floordiv", + # "rfloordiv", + "gt", + "ge", + "lt", + "le", + ], +) +def test_series_binop_axis_index( + scalars_dfs, + op, +): + scalars_df, scalars_pandas_df = scalars_dfs + df_columns = ["int64_col", "float64_col"] + series_column = "int64_too" + + bf_result = op(scalars_df[df_columns], scalars_df[series_column]).to_pandas() + pd_result = op(scalars_pandas_df[df_columns], scalars_pandas_df[series_column]) + + assert_pandas_df_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + ("input"), + [ + ((1000, 2000, 3000)), + (pd.Index([1000, 2000, 3000])), + (pd.Series((1000, 2000), index=["int64_too", "float64_col"])), + ], + ids=[ + "tuple", + "pd_index", + "pd_series", + ], +) +def test_listlike_binop_axis_1_in_memory_data(scalars_dfs, input): + # TODO: supply a reason why this isn't compatible with pandas 1.x + pytest.importorskip("pandas", minversion="2.0.0") + scalars_df, scalars_pandas_df = scalars_dfs + + df_columns = ["int64_col", "float64_col", 
"int64_too"] + + bf_result = scalars_df[df_columns].add(input, axis=1).to_pandas() + if hasattr(input, "to_pandas"): + input = input.to_pandas() + pd_result = scalars_pandas_df[df_columns].add(input, axis=1) + + assert_pandas_df_equal(bf_result, pd_result, check_dtype=False) + + +def test_df_reverse_binop_pandas(scalars_dfs): + # TODO: supply a reason why this isn't compatible with pandas 1.x + pytest.importorskip("pandas", minversion="2.0.0") + scalars_df, scalars_pandas_df = scalars_dfs + + pd_series = pd.Series([100, 200, 300]) + + df_columns = ["int64_col", "float64_col", "int64_too"] + + bf_result = pd_series + scalars_df[df_columns].to_pandas() + pd_result = pd_series + scalars_pandas_df[df_columns] + + assert_pandas_df_equal(bf_result, pd_result, check_dtype=False) + + +def test_listlike_binop_axis_1_bf_index(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + df_columns = ["int64_col", "float64_col", "int64_too"] + + bf_result = ( + scalars_df[df_columns] + .add(bf_indexes.Index([1000, 2000, 3000]), axis=1) + .to_pandas() + ) + pd_result = scalars_pandas_df[df_columns].add(pd.Index([1000, 2000, 3000]), axis=1) + + assert_pandas_df_equal(bf_result, pd_result, check_dtype=False) + + +def test_binop_with_self_aggregate(session, scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + + df_columns = ["int64_col", "float64_col", "int64_too"] + + bf_df = scalars_df[df_columns] + bf_result = (bf_df - bf_df.mean()).to_pandas() + + pd_df = scalars_pandas_df[df_columns] + pd_result = pd_df - pd_df.mean() + + assert_pandas_df_equal(bf_result, pd_result, check_dtype=False) + + +@pytest.mark.parametrize( + ("left_labels", "right_labels"), + [ + (["a", "a", "b"], ["c", "c", "d"]), + (["a", "b", "c"], ["c", "a", "b"]), + (["a", "c", "c"], ["c", "a", "c"]), + (["a", "b", "c"], ["a", "b", "c"]), + ], + ids=[ + "no_overlap", + "one_one_match", + "multi_match", + "exact_match", + ], +) +def test_binop_df_df_binary_op( + scalars_df_index, + scalars_df_2_index, + scalars_pandas_df_index, + left_labels, + right_labels, +): + if pd.__version__.startswith("1."): + pytest.skip("pd.NA vs NaN not handled well in pandas 1.x.") + columns = ["int64_too", "int64_col", "float64_col"] + + bf_df_a = scalars_df_index[columns] + bf_df_a.columns = left_labels + bf_df_b = scalars_df_2_index[columns] + bf_df_b.columns = right_labels + bf_result = (bf_df_a - bf_df_b).to_pandas() + + pd_df_a = scalars_pandas_df_index[columns] + pd_df_a.columns = left_labels + pd_df_b = scalars_pandas_df_index[columns] + pd_df_b.columns = right_labels + pd_result = pd_df_a - pd_df_b + + # Some dtype inconsistency for all-NULL columns + pd.testing.assert_frame_equal(bf_result, pd_result, check_dtype=False) + + +# Differnt table will only work for explicit index, since default index orders are arbitrary. 
+@pytest.mark.parametrize( + ("ordered"), + [ + (True), + (False), + ], +) +def test_series_binop_add_different_table( + scalars_df_index, scalars_pandas_df_index, scalars_df_2_index, ordered +): + df_columns = ["int64_col", "float64_col"] + series_column = "int64_too" + + bf_result = ( + scalars_df_index[df_columns] + .add(scalars_df_2_index[series_column], axis="index") + .to_pandas(ordered=ordered) + ) + pd_result = scalars_pandas_df_index[df_columns].add( + scalars_pandas_df_index[series_column], axis="index" + ) + + assert_pandas_df_equal(bf_result, pd_result, ignore_order=not ordered) + + +# TODO(garrettwu): Test series binop with different index + +all_joins = pytest.mark.parametrize( + ("how",), + (("outer",), ("left",), ("right",), ("inner",), ("cross",)), +) + + +@all_joins +def test_join_same_table(scalars_dfs, how): + bf_df, pd_df = scalars_dfs + if not bf_df._session._strictly_ordered and how == "cross": + pytest.skip("Cross join not supported in partial ordering mode.") + + bf_df_a = bf_df.set_index("int64_too")[["string_col", "int64_col"]] + bf_df_a = bf_df_a.sort_index() + + bf_df_b = bf_df.set_index("int64_too")[["float64_col"]] + bf_df_b = bf_df_b[bf_df_b.float64_col > 0] + bf_df_b = bf_df_b.sort_values("float64_col") + + bf_result = bf_df_a.join(bf_df_b, how=how).to_pandas() + + pd_df_a = pd_df.set_index("int64_too")[["string_col", "int64_col"]].sort_index() + pd_df_a = pd_df_a.sort_index() + + pd_df_b = pd_df.set_index("int64_too")[["float64_col"]] + pd_df_b = pd_df_b[pd_df_b.float64_col > 0] + pd_df_b = pd_df_b.sort_values("float64_col") + + pd_result = pd_df_a.join(pd_df_b, how=how) + + assert_pandas_df_equal(bf_result, pd_result, ignore_order=True) + + +@all_joins +def test_join_different_table( + scalars_df_index, scalars_df_2_index, scalars_pandas_df_index, how +): + bf_df_a = scalars_df_index[["string_col", "int64_col"]] + bf_df_b = scalars_df_2_index.dropna()[["float64_col"]] + bf_result = bf_df_a.join(bf_df_b, how=how).to_pandas() + pd_df_a = scalars_pandas_df_index[["string_col", "int64_col"]] + pd_df_b = scalars_pandas_df_index.dropna()[["float64_col"]] + pd_result = pd_df_a.join(pd_df_b, how=how) + assert_pandas_df_equal(bf_result, pd_result, ignore_order=True) + + +def test_join_duplicate_columns_raises_not_implemented(scalars_dfs): + scalars_df, _ = scalars_dfs + df_a = scalars_df[["string_col", "float64_col"]] + df_b = scalars_df[["float64_col"]] + with pytest.raises(NotImplementedError): + df_a.join(df_b, how="outer").to_pandas() + + +@all_joins +def test_join_param_on(scalars_dfs, how): + bf_df, pd_df = scalars_dfs + + bf_df_a = bf_df[["string_col", "int64_col", "rowindex_2"]] + bf_df_a = bf_df_a.assign(rowindex_2=bf_df_a["rowindex_2"] + 2) + bf_df_b = bf_df[["float64_col"]] + + if how == "cross": + with pytest.raises(ValueError): + bf_df_a.join(bf_df_b, on="rowindex_2", how=how) + else: + bf_result = bf_df_a.join(bf_df_b, on="rowindex_2", how=how).to_pandas() + + pd_df_a = pd_df[["string_col", "int64_col", "rowindex_2"]] + pd_df_a = pd_df_a.assign(rowindex_2=pd_df_a["rowindex_2"] + 2) + pd_df_b = pd_df[["float64_col"]] + pd_result = pd_df_a.join(pd_df_b, on="rowindex_2", how=how) + assert_pandas_df_equal(bf_result, pd_result, ignore_order=True) + + +@all_joins +def test_df_join_series(scalars_dfs, how): + bf_df, pd_df = scalars_dfs + + bf_df_a = bf_df[["string_col", "int64_col", "rowindex_2"]] + bf_df_a = bf_df_a.assign(rowindex_2=bf_df_a["rowindex_2"] + 2) + bf_series_b = bf_df["float64_col"] + + if how == "cross": + with pytest.raises(ValueError): + 
bf_df_a.join(bf_series_b, on="rowindex_2", how=how)
+    else:
+        bf_result = bf_df_a.join(bf_series_b, on="rowindex_2", how=how).to_pandas()
+
+        pd_df_a = pd_df[["string_col", "int64_col", "rowindex_2"]]
+        pd_df_a = pd_df_a.assign(rowindex_2=pd_df_a["rowindex_2"] + 2)
+        pd_series_b = pd_df["float64_col"]
+        pd_result = pd_df_a.join(pd_series_b, on="rowindex_2", how=how)
+        assert_pandas_df_equal(bf_result, pd_result, ignore_order=True)
+
+
+@pytest.mark.parametrize(
+    ("by", "ascending", "na_position"),
+    [
+        ("int64_col", True, "first"),
+        (["bool_col", "int64_col"], True, "last"),
+        ("int64_col", False, "first"),
+        (["bool_col", "int64_col"], [False, True], "last"),
+        (["bool_col", "int64_col"], [True, False], "first"),
+    ],
+)
+def test_dataframe_sort_values(
+    scalars_df_index, scalars_pandas_df_index, by, ascending, na_position
+):
+    # Test needs values to be unique
+    bf_result = scalars_df_index.sort_values(
+        by, ascending=ascending, na_position=na_position
+    ).to_pandas()
+    pd_result = scalars_pandas_df_index.sort_values(
+        by, ascending=ascending, na_position=na_position
+    )
+
+    pandas.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+@pytest.mark.parametrize(
+    ("by", "ascending", "na_position"),
+    [
+        ("int64_col", True, "first"),
+        (["bool_col", "int64_col"], True, "last"),
+    ],
+)
+def test_dataframe_sort_values_inplace(
+    scalars_df_index, scalars_pandas_df_index, by, ascending, na_position
+):
+    # Test needs values to be unique
+    bf_sorted = scalars_df_index.copy()
+    bf_sorted.sort_values(
+        by, ascending=ascending, na_position=na_position, inplace=True
+    )
+    bf_result = bf_sorted.to_pandas()
+    pd_result = scalars_pandas_df_index.sort_values(
+        by, ascending=ascending, na_position=na_position
+    )
+
+    pandas.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_dataframe_sort_values_invalid_input(scalars_df_index):
+    with pytest.raises(KeyError):
+        scalars_df_index.sort_values(by=scalars_df_index["int64_col"])
+
+
+def test_dataframe_sort_values_stable(scalars_df_index, scalars_pandas_df_index):
+    bf_result = (
+        scalars_df_index.sort_values("int64_col", kind="stable")
+        .sort_values("bool_col", kind="stable")
+        .to_pandas()
+    )
+    pd_result = scalars_pandas_df_index.sort_values(
+        "int64_col", kind="stable"
+    ).sort_values("bool_col", kind="stable")
+
+    pandas.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+@pytest.mark.parametrize(
+    ("operator", "columns"),
+    [
+        pytest.param(lambda x: x.cumsum(), ["float64_col", "int64_too"]),
+        # pytest.param(lambda x: x.cumprod(), ["float64_col", "int64_too"]),
+        pytest.param(
+            lambda x: x.cumprod(),
+            ["string_col"],
+            marks=pytest.mark.xfail(
+                raises=ValueError,
+            ),
+        ),
+    ],
+    ids=[
+        "cumsum",
+        # "cumprod",
+        "non-numeric",
+    ],
+)
+def test_dataframe_numeric_analytic_op(
+    scalars_df_index, scalars_pandas_df_index, operator, columns
+):
+    # TODO: Add nullable ints (pandas 1.x has poor behavior on these)
+    bf_series = operator(scalars_df_index[columns])
+    pd_series = operator(scalars_pandas_df_index[columns])
+    bf_result = bf_series.to_pandas()
+    pd.testing.assert_frame_equal(pd_series, bf_result, check_dtype=False)
+
+
+@pytest.mark.parametrize(
+    ("operator"),
+    [
+        (lambda x: x.cummin()),
+        (lambda x: x.cummax()),
+        (lambda x: x.shift(2)),
+        (lambda x: x.shift(-2)),
+    ],
+    ids=[
+        "cummin",
+        "cummax",
+        "shiftpositive",
+        "shiftnegative",
+    ],
+)
+def test_dataframe_general_analytic_op(
+    scalars_df_index, scalars_pandas_df_index, operator
+):
+    col_names = ["int64_too", "float64_col", 
"int64_col", "bool_col"] + bf_series = operator(scalars_df_index[col_names]) + pd_series = operator(scalars_pandas_df_index[col_names]) + bf_result = bf_series.to_pandas() + pd.testing.assert_frame_equal( + pd_series, + bf_result, + ) + + +@pytest.mark.parametrize( + ("periods",), + [ + (1,), + (2,), + (-1,), + ], +) +def test_dataframe_diff(scalars_df_index, scalars_pandas_df_index, periods): + col_names = ["int64_too", "float64_col", "int64_col"] + bf_result = scalars_df_index[col_names].diff(periods=periods).to_pandas() + pd_result = scalars_pandas_df_index[col_names].diff(periods=periods) + pd.testing.assert_frame_equal( + pd_result, + bf_result, + ) + + +@pytest.mark.parametrize( + ("periods",), + [ + (1,), + (2,), + (-1,), + ], +) +def test_dataframe_pct_change(scalars_df_index, scalars_pandas_df_index, periods): + col_names = ["int64_too", "float64_col", "int64_col"] + bf_result = scalars_df_index[col_names].pct_change(periods=periods).to_pandas() + pd_result = scalars_pandas_df_index[col_names].pct_change(periods=periods) + pd.testing.assert_frame_equal( + pd_result, + bf_result, + ) + + +def test_dataframe_agg_single_string(scalars_dfs): + numeric_cols = ["int64_col", "int64_too", "float64_col"] + scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = scalars_df[numeric_cols].agg("sum").to_pandas() + pd_result = scalars_pandas_df[numeric_cols].agg("sum") + + assert bf_result.dtype == "Float64" + pd.testing.assert_series_equal( + pd_result, bf_result, check_dtype=False, check_index_type=False + ) + + +@pytest.mark.parametrize( + ("agg",), + ( + ("sum",), + ("size",), + ), +) +def test_dataframe_agg_int_single_string(scalars_dfs, agg): + numeric_cols = ["int64_col", "int64_too", "bool_col"] + scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = scalars_df[numeric_cols].agg(agg).to_pandas() + pd_result = scalars_pandas_df[numeric_cols].agg(agg) + + assert bf_result.dtype == "Int64" + pd.testing.assert_series_equal( + pd_result, bf_result, check_dtype=False, check_index_type=False + ) + + +def test_dataframe_agg_multi_string(scalars_dfs): + numeric_cols = ["int64_col", "int64_too", "float64_col"] + aggregations = [ + "sum", + "mean", + "median", + "std", + "var", + "min", + "max", + "nunique", + "count", + ] + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[numeric_cols].agg(aggregations) + pd_result = scalars_pandas_df[numeric_cols].agg(aggregations) + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + pd_result = pd_result.astype("Float64") + + # Drop median, as it's an approximation. + bf_median = bf_result.loc["median", :] + bf_result = bf_result.drop(labels=["median"]) + pd_result = pd_result.drop(labels=["median"]) + + assert_dfs_equivalent(pd_result, bf_result, check_index_type=False) + + # Double-check that median is at least plausible. 
+ assert ( + (bf_result.loc["min", :] <= bf_median) & (bf_median <= bf_result.loc["max", :]) + ).all() + + +def test_dataframe_agg_int_multi_string(scalars_dfs): + numeric_cols = ["int64_col", "int64_too", "bool_col"] + aggregations = [ + "sum", + "nunique", + "count", + "size", + ] + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[numeric_cols].agg(aggregations).to_pandas() + pd_result = scalars_pandas_df[numeric_cols].agg(aggregations) + + for dtype in bf_result.dtypes: + assert dtype == "Int64" + + # Pandas may produce narrower numeric types + # Pandas has object index type + pd.testing.assert_frame_equal( + pd_result, bf_result, check_dtype=False, check_index_type=False + ) + + +def test_df_transpose(): + # Include some floats to ensure type coercion + values = [[0, 3.5, True], [1, 4.5, False], [2, 6.5, None]] + # Test complex case of both axes being multi-indices with non-unique elements + + columns: pandas.Index = pd.Index( + ["A", "B", "A"], dtype=pd.StringDtype(storage="pyarrow") + ) + columns_multi = pd.MultiIndex.from_arrays([columns, columns], names=["c1", "c2"]) + + index: pandas.Index = pd.Index( + ["b", "a", "a"], dtype=pd.StringDtype(storage="pyarrow") + ) + rows_multi = pd.MultiIndex.from_arrays([index, index], names=["r1", "r2"]) + + pd_df = pandas.DataFrame(values, index=rows_multi, columns=columns_multi) + bf_df = dataframe.DataFrame(values, index=rows_multi, columns=columns_multi) + + pd_result = pd_df.T + bf_result = bf_df.T.to_pandas() + + pd.testing.assert_frame_equal(pd_result, bf_result, check_dtype=False) + + +def test_df_transpose_error(): + with pytest.raises(TypeError, match="Cannot coerce.*to a common type."): + dataframe.DataFrame([[1, "hello"], [2, "world"]]).transpose() + + +def test_df_transpose_repeated_uses_cache(): + bf_df = dataframe.DataFrame([[1, 2.5], [2, 3.5]]) + pd_df = pandas.DataFrame([[1, 2.5], [2, 3.5]]) + # Transposing many times so that operation will fail from complexity if not using cache + for i in range(10): + # Cache still works even with simple scalar binop + bf_df = bf_df.transpose() + i + pd_df = pd_df.transpose() + i + + pd.testing.assert_frame_equal( + pd_df, bf_df.to_pandas(), check_dtype=False, check_index_type=False + ) + + +def test_df_stack(scalars_dfs): + if pandas.__version__.startswith("1.") or pandas.__version__.startswith("2.0"): + pytest.skip("pandas <2.1 uses different stack implementation") + scalars_df, scalars_pandas_df = scalars_dfs + # To match bigquery dataframes + scalars_pandas_df = scalars_pandas_df.copy() + scalars_pandas_df.columns = scalars_pandas_df.columns.astype("string[pyarrow]") + # Can only stack identically-typed columns + columns = ["int64_col", "int64_too", "rowindex_2"] + + bf_result = scalars_df[columns].stack().to_pandas() + pd_result = scalars_pandas_df[columns].stack(future_stack=True) + + # Pandas produces NaN, where bq dataframes produces pd.NA + assert_series_equal(bf_result, pd_result, check_dtype=False) + + +def test_df_melt_default(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + # To match bigquery dataframes + scalars_pandas_df = scalars_pandas_df.copy() + scalars_pandas_df.columns = scalars_pandas_df.columns.astype("string[pyarrow]") + # Can only stack identically-typed columns + columns = ["int64_col", "int64_too", "rowindex_2"] + + bf_result = scalars_df[columns].melt().to_pandas() + pd_result = scalars_pandas_df[columns].melt() + + # Pandas produces int64 index, Bigframes produces Int64 (nullable) + pd.testing.assert_frame_equal( + bf_result, + 
pd_result,
+        check_index_type=False,
+        check_dtype=False,
+    )
+
+
+def test_df_melt_parameterized(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    # To match bigquery dataframes
+    scalars_pandas_df = scalars_pandas_df.copy()
+    scalars_pandas_df.columns = scalars_pandas_df.columns.astype("string[pyarrow]")
+    # Can only stack identically-typed columns
+
+    bf_result = scalars_df.melt(
+        var_name="alice",
+        value_name="bob",
+        id_vars=["string_col"],
+        value_vars=["int64_col", "int64_too"],
+    ).to_pandas()
+    pd_result = scalars_pandas_df.melt(
+        var_name="alice",
+        value_name="bob",
+        id_vars=["string_col"],
+        value_vars=["int64_col", "int64_too"],
+    )
+
+    # Pandas produces int64 index, Bigframes produces Int64 (nullable)
+    pd.testing.assert_frame_equal(
+        bf_result, pd_result, check_index_type=False, check_dtype=False
+    )
+
+
+@pytest.mark.parametrize(
+    ("ordered"),
+    [
+        (True),
+        (False),
+    ],
+)
+def test_df_unstack(scalars_dfs, ordered):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    # To match bigquery dataframes
+    scalars_pandas_df = scalars_pandas_df.copy()
+    scalars_pandas_df.columns = scalars_pandas_df.columns.astype("string[pyarrow]")
+    # Can only stack identically-typed columns
+    columns = [
+        "rowindex_2",
+        "int64_col",
+        "int64_too",
+    ]
+
+    # unstack on mono-index produces series
+    bf_result = scalars_df[columns].unstack().to_pandas(ordered=ordered)
+    pd_result = scalars_pandas_df[columns].unstack()
+
+    # Pandas produces NaN, where bq dataframes produces pd.NA
+    assert_series_equal(
+        bf_result, pd_result, check_dtype=False, ignore_order=not ordered
+    )
+
+
+def test_ipython_key_completions_with_drop(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    col_names = "string_col"
+    bf_dataframe = scalars_df.drop(columns=col_names)
+    pd_dataframe = scalars_pandas_df.drop(columns=col_names)
+    expected = pd_dataframe.columns.tolist()
+
+    results = bf_dataframe._ipython_key_completions_()
+
+    assert col_names not in results
+    assert results == expected
+    # _ipython_key_completions_ is called with square brackets
+    # so only column names are relevant with tab completion
+    assert "to_gbq" not in results
+    assert "merge" not in results
+    assert "drop" not in results
+
+
+def test_ipython_key_completions_with_rename(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    col_name_dict = {"string_col": "a_renamed_column"}
+    bf_dataframe = scalars_df.rename(columns=col_name_dict)
+    pd_dataframe = scalars_pandas_df.rename(columns=col_name_dict)
+    expected = pd_dataframe.columns.tolist()
+
+    results = bf_dataframe._ipython_key_completions_()
+
+    assert "string_col" not in results
+    assert "a_renamed_column" in results
+    assert results == expected
+    # _ipython_key_completions_ is called with square brackets
+    # so only column names are relevant with tab completion
+    assert "to_gbq" not in results
+    assert "merge" not in results
+    assert "drop" not in results
+
+
+def test__dir__with_drop(scalars_dfs):
+    scalars_df, scalars_pandas_df = scalars_dfs
+    col_names = "string_col"
+    bf_dataframe = scalars_df.drop(columns=col_names)
+    pd_dataframe = scalars_pandas_df.drop(columns=col_names)
+    expected = pd_dataframe.columns.tolist()
+
+    results = dir(bf_dataframe)
+
+    assert col_names not in results
+    assert frozenset(expected) <= frozenset(results)
+    # __dir__ is called with a '.' and displays all methods, column names, etc.
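+    # (Hence the subset check above: dir() also returns methods and attributes,
+    # so the column list can only be a subset of the result.)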
+ assert "to_gbq" in results + assert "merge" in results + assert "drop" in results + + +def test__dir__with_rename(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + col_name_dict = {"string_col": "a_renamed_column"} + bf_dataframe = scalars_df.rename(columns=col_name_dict) + pd_dataframe = scalars_pandas_df.rename(columns=col_name_dict) + expected = pd_dataframe.columns.tolist() + + results = dir(bf_dataframe) + + assert "string_col" not in results + assert "a_renamed_column" in results + assert frozenset(expected) <= frozenset(results) + # __dir__ is called with a '.' and displays all methods, columns names, etc. + assert "to_gbq" in results + assert "merge" in results + assert "drop" in results + + +@pytest.mark.parametrize( + ("start", "stop", "step"), + [ + (0, 0, None), + (None, None, None), + (1, None, None), + (None, 4, None), + (None, None, 2), + (None, 50000000000, 1), + (5, 4, None), + (3, None, 2), + (1, 7, 2), + (1, 7, 50000000000), + ], +) +def test_iloc_slice(scalars_df_index, scalars_pandas_df_index, start, stop, step): + bf_result = scalars_df_index.iloc[start:stop:step].to_pandas() + pd_result = scalars_pandas_df_index.iloc[start:stop:step] + pd.testing.assert_frame_equal( + bf_result, + pd_result, + ) + + +def test_iloc_slice_zero_step(scalars_df_index): + with pytest.raises(ValueError): + scalars_df_index.iloc[0:0:0] + + +@pytest.mark.parametrize( + ("ordered"), + [ + (True), + (False), + ], +) +def test_iloc_slice_nested(scalars_df_index, scalars_pandas_df_index, ordered): + bf_result = scalars_df_index.iloc[1:].iloc[1:].to_pandas(ordered=ordered) + pd_result = scalars_pandas_df_index.iloc[1:].iloc[1:] + + assert_pandas_df_equal(bf_result, pd_result, ignore_order=not ordered) + + +@pytest.mark.parametrize( + "index", + [0, 5, -2, (2,)], +) +def test_iloc_single_integer(scalars_df_index, scalars_pandas_df_index, index): + bf_result = scalars_df_index.iloc[index] + pd_result = scalars_pandas_df_index.iloc[index] + + pd.testing.assert_series_equal( + bf_result, + pd_result, + ) + + +@pytest.mark.parametrize( + "index", + [(2, 5), (5, 0), (0, 0)], +) +def test_iloc_tuple(scalars_df_index, scalars_pandas_df_index, index): + bf_result = scalars_df_index.iloc[index] + pd_result = scalars_pandas_df_index.iloc[index] + + assert bf_result == pd_result + + +@pytest.mark.parametrize( + "index", + [(slice(None), [1, 2, 3]), (slice(1, 7, 2), [2, 5, 3])], +) +def test_iloc_tuple_multi_columns(scalars_df_index, scalars_pandas_df_index, index): + bf_result = scalars_df_index.iloc[index].to_pandas() + pd_result = scalars_pandas_df_index.iloc[index] + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +def test_iloc_tuple_multi_columns_single_row(scalars_df_index, scalars_pandas_df_index): + index = (2, [2, 1, 3, -4]) + bf_result = scalars_df_index.iloc[index] + pd_result = scalars_pandas_df_index.iloc[index] + pd.testing.assert_series_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + ("index", "error"), + [ + ((1, 1, 1), pd.errors.IndexingError), + (("asd", "asd", "asd"), pd.errors.IndexingError), + (("asd"), TypeError), + ], +) +def test_iloc_tuple_errors(scalars_df_index, scalars_pandas_df_index, index, error): + with pytest.raises(error): + scalars_df_index.iloc[index] + with pytest.raises(error): + scalars_pandas_df_index.iloc[index] + + +@pytest.mark.parametrize( + "index", + [(2, 5), (5, 0), (0, 0)], +) +def test_iat(scalars_df_index, scalars_pandas_df_index, index): + bf_result = scalars_df_index.iat[index] + pd_result = 
scalars_pandas_df_index.iat[index]
+
+    assert bf_result == pd_result
+
+
+@pytest.mark.parametrize(
+    ("index", "error"),
+    [
+        (0, TypeError),
+        ("asd", ValueError),
+        ((1, 2, 3), TypeError),
+        (("asd", "asd"), ValueError),
+    ],
+)
+def test_iat_errors(scalars_df_index, scalars_pandas_df_index, index, error):
+    with pytest.raises(error):
+        scalars_pandas_df_index.iat[index]
+    with pytest.raises(error):
+        scalars_df_index.iat[index]
+
+
+def test_iloc_single_integer_out_of_bound_error(
+    scalars_df_index, scalars_pandas_df_index
+):
+    with pytest.raises(IndexError, match="single positional indexer is out-of-bounds"):
+        scalars_df_index.iloc[99]
+
+
+def test_loc_bool_series(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.loc[scalars_df_index.bool_col].to_pandas()
+    pd_result = scalars_pandas_df_index.loc[scalars_pandas_df_index.bool_col]
+
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_loc_select_column(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.loc[:, "int64_col"].to_pandas()
+    pd_result = scalars_pandas_df_index.loc[:, "int64_col"]
+    pd.testing.assert_series_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_loc_select_with_column_condition(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.loc[:, scalars_df_index.dtypes == "Int64"].to_pandas()
+    pd_result = scalars_pandas_df_index.loc[
+        :, scalars_pandas_df_index.dtypes == "Int64"
+    ]
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_loc_select_with_column_condition_bf_series(
+    scalars_df_index, scalars_pandas_df_index
+):
+    # (b/347072677) GEOGRAPHY type doesn't support DISTINCT op
+    columns = [
+        item for item in scalars_pandas_df_index.columns if item != "geography_col"
+    ]
+    scalars_df_index = scalars_df_index[columns]
+    scalars_pandas_df_index = scalars_pandas_df_index[columns]
+
+    size_half = len(scalars_pandas_df_index) / 2
+    bf_result = scalars_df_index.loc[
+        :, scalars_df_index.nunique() > size_half
+    ].to_pandas()
+    pd_result = scalars_pandas_df_index.loc[
+        :, scalars_pandas_df_index.nunique() > size_half
+    ]
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_loc_single_index_with_duplicate(scalars_df_index, scalars_pandas_df_index):
+    scalars_df_index = scalars_df_index.set_index("string_col", drop=False)
+    scalars_pandas_df_index = scalars_pandas_df_index.set_index(
+        "string_col", drop=False
+    )
+    index = "Hello, World!"
+    bf_result = scalars_df_index.loc[index]
+    pd_result = scalars_pandas_df_index.loc[index]
+    pd.testing.assert_frame_equal(
+        bf_result.to_pandas(),
+        pd_result,
+    )
+
+
+def test_loc_single_index_no_duplicate(scalars_df_index, scalars_pandas_df_index):
+    scalars_df_index = scalars_df_index.set_index("int64_too", drop=False)
+    scalars_pandas_df_index = scalars_pandas_df_index.set_index("int64_too", drop=False)
+    index = -2345
+    bf_result = scalars_df_index.loc[index]
+    pd_result = scalars_pandas_df_index.loc[index]
+    pd.testing.assert_series_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_at_with_duplicate(scalars_df_index, scalars_pandas_df_index):
+    scalars_df_index = scalars_df_index.set_index("string_col", drop=False)
+    scalars_pandas_df_index = scalars_pandas_df_index.set_index(
+        "string_col", drop=False
+    )
+    index = "Hello, World!"
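+    # With a duplicated index label, .at is expected to return one value per
+    # matching row rather than a scalar, hence the Series comparison below.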
+ bf_result = scalars_df_index.at[index, "int64_too"] + pd_result = scalars_pandas_df_index.at[index, "int64_too"] + pd.testing.assert_series_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_at_no_duplicate(scalars_df_index, scalars_pandas_df_index): + scalars_df_index = scalars_df_index.set_index("int64_too", drop=False) + scalars_pandas_df_index = scalars_pandas_df_index.set_index("int64_too", drop=False) + index = -2345 + bf_result = scalars_df_index.at[index, "string_col"] + pd_result = scalars_pandas_df_index.at[index, "string_col"] + assert bf_result == pd_result + + +def test_loc_setitem_bool_series_scalar_new_col(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df.loc[bf_df["int64_too"] == 0, "new_col"] = 99 + pd_df.loc[pd_df["int64_too"] == 0, "new_col"] = 99 + + # pandas uses float64 instead + pd_df["new_col"] = pd_df["new_col"].astype("Float64") + + pd.testing.assert_frame_equal( + bf_df.to_pandas(), + pd_df, + ) + + +@pytest.mark.parametrize( + ("col", "value"), + [ + ("string_col", "hello"), + ("int64_col", 3), + ("float64_col", 3.5), + ], +) +def test_loc_setitem_bool_series_scalar_existing_col(scalars_dfs, col, value): + if pd.__version__.startswith("1."): + pytest.skip("this loc overload not supported in pandas 1.x.") + + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + bf_df.loc[bf_df["int64_too"] == 1, col] = value + pd_df.loc[pd_df["int64_too"] == 1, col] = value + + pd.testing.assert_frame_equal( + bf_df.to_pandas(), + pd_df, + ) + + +def test_loc_setitem_bool_series_scalar_error(scalars_dfs): + if pd.__version__.startswith("1."): + pytest.skip("this loc overload not supported in pandas 1.x.") + + scalars_df, scalars_pandas_df = scalars_dfs + bf_df = scalars_df.copy() + pd_df = scalars_pandas_df.copy() + + with pytest.raises(Exception): + bf_df.loc[bf_df["int64_too"] == 1, "string_col"] = 99 + with pytest.raises(Exception): + pd_df.loc[pd_df["int64_too"] == 1, "string_col"] = 99 + + +@pytest.mark.parametrize( + ("col", "op"), + [ + # Int aggregates + pytest.param("int64_col", lambda x: x.sum(), id="int-sum"), + pytest.param("int64_col", lambda x: x.min(), id="int-min"), + pytest.param("int64_col", lambda x: x.max(), id="int-max"), + pytest.param("int64_col", lambda x: x.count(), id="int-count"), + pytest.param("int64_col", lambda x: x.nunique(), id="int-nunique"), + # Float aggregates + pytest.param("float64_col", lambda x: x.count(), id="float-count"), + pytest.param("float64_col", lambda x: x.nunique(), id="float-nunique"), + # Bool aggregates + pytest.param("bool_col", lambda x: x.sum(), id="bool-sum"), + pytest.param("bool_col", lambda x: x.count(), id="bool-count"), + pytest.param("bool_col", lambda x: x.nunique(), id="bool-nunique"), + # String aggregates + pytest.param("string_col", lambda x: x.count(), id="string-count"), + pytest.param("string_col", lambda x: x.nunique(), id="string-nunique"), + ], +) +def test_dataframe_aggregate_int(scalars_df_index, scalars_pandas_df_index, col, op): + bf_result = op(scalars_df_index[[col]]).to_pandas() + pd_result = op(scalars_pandas_df_index[[col]]) + + # Check dtype separately + assert bf_result.dtype == "Int64" + # Is otherwise "object" dtype + pd_result.index = pd_result.index.astype("string[pyarrow]") + # Pandas may produce narrower numeric types + assert_series_equal(pd_result, bf_result, check_dtype=False, check_index_type=False) + + +@pytest.mark.parametrize( + 
("col", "op"), + [ + pytest.param("bool_col", lambda x: x.min(), id="bool-min"), + pytest.param("bool_col", lambda x: x.max(), id="bool-max"), + ], +) +def test_dataframe_aggregate_bool(scalars_df_index, scalars_pandas_df_index, col, op): + bf_result = op(scalars_df_index[[col]]).to_pandas() + pd_result = op(scalars_pandas_df_index[[col]]) + + # Check dtype separately + assert bf_result.dtype == "boolean" + + # Pandas may produce narrower numeric types + # Pandas has object index type + pd_result.index = pd_result.index.astype("string[pyarrow]") + assert_series_equal(pd_result, bf_result, check_dtype=False, check_index_type=False) + + +@pytest.mark.parametrize( + ("op", "bf_dtype"), + [ + (lambda x: x.sum(numeric_only=True), "Float64"), + (lambda x: x.mean(numeric_only=True), "Float64"), + (lambda x: x.min(numeric_only=True), "Float64"), + (lambda x: x.max(numeric_only=True), "Float64"), + (lambda x: x.std(numeric_only=True), "Float64"), + (lambda x: x.var(numeric_only=True), "Float64"), + (lambda x: x.count(numeric_only=False), "Int64"), + (lambda x: x.nunique(), "Int64"), + ], + ids=["sum", "mean", "min", "max", "std", "var", "count", "nunique"], +) +def test_dataframe_aggregates(scalars_dfs, op, bf_dtype): + scalars_df_index, scalars_pandas_df_index = scalars_dfs + col_names = ["int64_too", "float64_col", "string_col", "int64_col", "bool_col"] + bf_series = op(scalars_df_index[col_names]) + bf_result = bf_series + pd_result = op(scalars_pandas_df_index[col_names]) + + # Check dtype separately + assert bf_result.dtype == bf_dtype + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + # Pandas has object index type + pd_result.index = pd_result.index.astype("string[pyarrow]") + assert_series_equivalent( + pd_result, + bf_result, + check_dtype=False, + check_index_type=False, + ) + + +@pytest.mark.parametrize( + ("op"), + [ + (lambda x: x.sum(axis=1, numeric_only=True)), + (lambda x: x.mean(axis=1, numeric_only=True)), + (lambda x: x.min(axis=1, numeric_only=True)), + (lambda x: x.max(axis=1, numeric_only=True)), + (lambda x: x.std(axis=1, numeric_only=True)), + (lambda x: x.var(axis=1, numeric_only=True)), + ], + ids=["sum", "mean", "min", "max", "std", "var"], +) +def test_dataframe_aggregates_axis_1(scalars_df_index, scalars_pandas_df_index, op): + col_names = ["int64_too", "int64_col", "float64_col", "bool_col", "string_col"] + bf_result = op(scalars_df_index[col_names]).to_pandas() + pd_result = op(scalars_pandas_df_index[col_names]) + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + pd_result = pd_result.astype("Float64") + # Pandas has object index type + pd.testing.assert_series_equal(pd_result, bf_result, check_index_type=False) + + +@pytest.mark.parametrize( + ("op"), + [ + (lambda x: x.all(bool_only=True)), + (lambda x: x.any(bool_only=True)), + (lambda x: x.all(axis=1, bool_only=True)), + (lambda x: x.any(axis=1, bool_only=True)), + ], + ids=["all_axis0", "any_axis0", "all_axis1", "any_axis1"], +) +def test_dataframe_bool_aggregates(scalars_df_index, scalars_pandas_df_index, op): + # Pandas will drop nullable 'boolean' dtype so we convert first to bool, then cast back later + scalars_df_index = scalars_df_index.assign( + bool_col=scalars_df_index.bool_col.fillna(False) + ) + scalars_pandas_df_index = scalars_pandas_df_index.assign( + bool_col=scalars_pandas_df_index.bool_col.fillna(False).astype("bool") + ) + bf_series = op(scalars_df_index) + pd_series = op(scalars_pandas_df_index).astype("boolean") + 
bf_result = bf_series.to_pandas() + + pd_series.index = pd_series.index.astype(bf_result.index.dtype) + pd.testing.assert_series_equal(pd_series, bf_result, check_index_type=False) + + +def test_dataframe_prod(scalars_df_index, scalars_pandas_df_index): + col_names = ["int64_too", "float64_col"] + bf_series = scalars_df_index[col_names].prod() + pd_series = scalars_pandas_df_index[col_names].prod() + bf_result = bf_series.to_pandas() + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + pd_series = pd_series.astype("Float64") + # Pandas has object index type + pd.testing.assert_series_equal(pd_series, bf_result, check_index_type=False) + + +def test_df_skew_too_few_values(scalars_dfs): + columns = ["float64_col", "int64_col"] + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[columns].head(2).skew().to_pandas() + pd_result = scalars_pandas_df[columns].head(2).skew() + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + pd_result = pd_result.astype("Float64") + + pd.testing.assert_series_equal(pd_result, bf_result, check_index_type=False) + + +@pytest.mark.parametrize( + ("ordered"), + [ + (True), + (False), + ], +) +def test_df_skew(scalars_dfs, ordered): + columns = ["float64_col", "int64_col"] + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[columns].skew().to_pandas(ordered=ordered) + pd_result = scalars_pandas_df[columns].skew() + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + pd_result = pd_result.astype("Float64") + + assert_series_equal( + pd_result, bf_result, check_index_type=False, ignore_order=not ordered + ) + + +def test_df_kurt_too_few_values(scalars_dfs): + columns = ["float64_col", "int64_col"] + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[columns].head(2).kurt().to_pandas() + pd_result = scalars_pandas_df[columns].head(2).kurt() + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + pd_result = pd_result.astype("Float64") + + pd.testing.assert_series_equal(pd_result, bf_result, check_index_type=False) + + +def test_df_kurt(scalars_dfs): + columns = ["float64_col", "int64_col"] + scalars_df, scalars_pandas_df = scalars_dfs + bf_result = scalars_df[columns].kurt().to_pandas() + pd_result = scalars_pandas_df[columns].kurt() + + # Pandas may produce narrower numeric types, but bigframes always produces Float64 + pd_result = pd_result.astype("Float64") + + pd.testing.assert_series_equal(pd_result, bf_result, check_index_type=False) + + +def test_sample_raises_value_error(scalars_dfs): + scalars_df, _ = scalars_dfs + with pytest.raises( + ValueError, match="Only one of 'n' or 'frac' parameter can be specified." 
+    ):
+        scalars_df.sample(frac=0.5, n=4)
+
+
+@pytest.mark.parametrize(
+    ("axis",),
+    [
+        (None,),
+        (0,),
+        (1,),
+    ],
+)
+def test_df_add_prefix(scalars_df_index, scalars_pandas_df_index, axis):
+    if pd.__version__.startswith("1."):
+        pytest.skip("add_prefix axis parameter not supported in pandas 1.x.")
+    bf_result = scalars_df_index.add_prefix("prefix_", axis).to_pandas()
+
+    pd_result = scalars_pandas_df_index.add_prefix("prefix_", axis)
+
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+        check_index_type=False,
+    )
+
+
+@pytest.mark.parametrize(
+    ("axis",),
+    [
+        (0,),
+        (1,),
+    ],
+)
+def test_df_add_suffix(scalars_df_index, scalars_pandas_df_index, axis):
+    if pd.__version__.startswith("1."):
+        pytest.skip("add_suffix axis parameter not supported in pandas 1.x.")
+    bf_result = scalars_df_index.add_suffix("_suffix", axis).to_pandas()
+
+    pd_result = scalars_pandas_df_index.add_suffix("_suffix", axis)
+
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+        check_index_type=False,
+    )
+
+
+def test_df_astype_error_error(session):
+    input = pd.DataFrame(["hello", "world", "3.11", "4000"])
+    with pytest.raises(ValueError):
+        session.read_pandas(input).astype("Float64", errors="bad_value")
+
+
+def test_df_columns_filter_items(scalars_df_index, scalars_pandas_df_index):
+    if pd.__version__.startswith("2.0") or pd.__version__.startswith("1."):
+        pytest.skip("pandas filter items behavior different pre-2.1")
+    bf_result = scalars_df_index.filter(items=["string_col", "int64_col"]).to_pandas()
+
+    pd_result = scalars_pandas_df_index.filter(items=["string_col", "int64_col"])
+    # Ignore column ordering as pandas orders columns differently depending on version
+    pd.testing.assert_frame_equal(
+        bf_result.sort_index(axis=1),
+        pd_result.sort_index(axis=1),
+    )
+
+
+def test_df_columns_filter_like(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.filter(like="64_col").to_pandas()
+
+    pd_result = scalars_pandas_df_index.filter(like="64_col")
+
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_df_columns_filter_regex(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.filter(regex="^[^_]+$").to_pandas()
+
+    pd_result = scalars_pandas_df_index.filter(regex="^[^_]+$")
+
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_df_reindex_rows_list(scalars_dfs):
+    scalars_df_index, scalars_pandas_df_index = scalars_dfs
+    bf_result = scalars_df_index.reindex(index=[5, 1, 3, 99, 1])
+
+    pd_result = scalars_pandas_df_index.reindex(index=[5, 1, 3, 99, 1])
+
+    # Pandas uses int64 instead of Int64 (nullable) dtype.
+    pd_result.index = pd_result.index.astype(pd.Int64Dtype())
+    assert_dfs_equivalent(
+        pd_result,
+        bf_result,
+    )
+
+
+def test_df_reindex_rows_index(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.reindex(
+        index=pd.Index([5, 1, 3, 99, 1], name="newname")
+    ).to_pandas()
+
+    pd_result = scalars_pandas_df_index.reindex(
+        index=pd.Index([5, 1, 3, 99, 1], name="newname")
+    )
+
+    # Pandas uses int64 instead of Int64 (nullable) dtype.
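+    # Casting the index keeps the otherwise-strict assert_frame_equal below
+    # from failing on index dtype alone.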
+ pd_result.index = pd_result.index.astype(pd.Int64Dtype()) + pd.testing.assert_frame_equal( + bf_result, + pd_result, + ) + + +def test_df_reindex_nonunique(scalars_df_index): + with pytest.raises(ValueError): + # int64_too is non-unique + scalars_df_index.set_index("int64_too").reindex( + index=[5, 1, 3, 99, 1], validate=True + ) + + +def test_df_reindex_columns(scalars_df_index, scalars_pandas_df_index): + bf_result = scalars_df_index.reindex( + columns=["not_a_col", "int64_col", "int64_too"] + ).to_pandas() + + pd_result = scalars_pandas_df_index.reindex( + columns=["not_a_col", "int64_col", "int64_too"] + ) + + # Pandas uses float64 as default for newly created empty column, bf uses Float64 + pd_result.not_a_col = pd_result.not_a_col.astype(pandas.Float64Dtype()) + pd.testing.assert_frame_equal( + bf_result, + pd_result, + ) + + +def test_df_reindex_columns_with_same_order(scalars_df_index, scalars_pandas_df_index): + # First, make sure the two dataframes have the same columns in order. + columns = ["int64_col", "int64_too"] + bf = scalars_df_index[columns] + pd_df = scalars_pandas_df_index[columns] + + bf_result = bf.reindex(columns=columns).to_pandas() + pd_result = pd_df.reindex(columns=columns) + + pd.testing.assert_frame_equal( + bf_result, + pd_result, + ) + + +def test_df_equals_identical(scalars_df_index, scalars_pandas_df_index): + unsupported = [ + "geography_col", + ] + scalars_df_index = scalars_df_index.drop(columns=unsupported) + scalars_pandas_df_index = scalars_pandas_df_index.drop(columns=unsupported) + + bf_result = scalars_df_index.equals(scalars_df_index) + pd_result = scalars_pandas_df_index.equals(scalars_pandas_df_index) + + assert pd_result == bf_result + + +def test_df_equals_series(scalars_df_index, scalars_pandas_df_index): + bf_result = scalars_df_index[["int64_col"]].equals(scalars_df_index["int64_col"]) + pd_result = scalars_pandas_df_index[["int64_col"]].equals( + scalars_pandas_df_index["int64_col"] + ) + + assert pd_result == bf_result + + +def test_df_equals_different_dtype(scalars_df_index, scalars_pandas_df_index): + columns = ["int64_col", "int64_too"] + scalars_df_index = scalars_df_index[columns] + scalars_pandas_df_index = scalars_pandas_df_index[columns] + + bf_modified = scalars_df_index.copy() + bf_modified = bf_modified.astype("Float64") + + pd_modified = scalars_pandas_df_index.copy() + pd_modified = pd_modified.astype("Float64") + + bf_result = scalars_df_index.equals(bf_modified) + pd_result = scalars_pandas_df_index.equals(pd_modified) + + assert pd_result == bf_result + + +def test_df_equals_different_values(scalars_df_index, scalars_pandas_df_index): + columns = ["int64_col", "int64_too"] + scalars_df_index = scalars_df_index[columns] + scalars_pandas_df_index = scalars_pandas_df_index[columns] + + bf_modified = scalars_df_index.copy() + bf_modified["int64_col"] = bf_modified.int64_col + 1 + + pd_modified = scalars_pandas_df_index.copy() + pd_modified["int64_col"] = pd_modified.int64_col + 1 + + bf_result = scalars_df_index.equals(bf_modified) + pd_result = scalars_pandas_df_index.equals(pd_modified) + + assert pd_result == bf_result + + +def test_df_equals_extra_column(scalars_df_index, scalars_pandas_df_index): + columns = ["int64_col", "int64_too"] + more_columns = ["int64_col", "int64_too", "float64_col"] + + bf_result = scalars_df_index[columns].equals(scalars_df_index[more_columns]) + pd_result = scalars_pandas_df_index[columns].equals( + scalars_pandas_df_index[more_columns] + ) + + assert pd_result == bf_result + + +def 
test_df_reindex_like(scalars_df_index, scalars_pandas_df_index):
+    reindex_target_bf = scalars_df_index.reindex(
+        columns=["not_a_col", "int64_col", "int64_too"], index=[5, 1, 3, 99, 1]
+    )
+    bf_result = scalars_df_index.reindex_like(reindex_target_bf).to_pandas()
+
+    reindex_target_pd = scalars_pandas_df_index.reindex(
+        columns=["not_a_col", "int64_col", "int64_too"], index=[5, 1, 3, 99, 1]
+    )
+    pd_result = scalars_pandas_df_index.reindex_like(reindex_target_pd)
+
+    # Pandas uses int64 instead of Int64 (nullable) dtype.
+    pd_result.index = pd_result.index.astype(pd.Int64Dtype())
+    # Pandas uses float64 as default for newly created empty column, bf uses Float64
+    pd_result.not_a_col = pd_result.not_a_col.astype(pandas.Float64Dtype())
+    pd.testing.assert_frame_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+def test_df_values(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.values
+
+    pd_result = scalars_pandas_df_index.values
+    # Numpy isn't equipped to compare non-numeric objects, so convert back to dataframe
+    pd.testing.assert_frame_equal(
+        pd.DataFrame(bf_result), pd.DataFrame(pd_result), check_dtype=False
+    )
+
+
+def test_df_to_numpy(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.to_numpy()
+
+    pd_result = scalars_pandas_df_index.to_numpy()
+    # Numpy isn't equipped to compare non-numeric objects, so convert back to dataframe
+    pd.testing.assert_frame_equal(
+        pd.DataFrame(bf_result), pd.DataFrame(pd_result), check_dtype=False
+    )
+
+
+def test_df___array__(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.__array__()
+
+    pd_result = scalars_pandas_df_index.__array__()
+    # Numpy isn't equipped to compare non-numeric objects, so convert back to dataframe
+    pd.testing.assert_frame_equal(
+        pd.DataFrame(bf_result), pd.DataFrame(pd_result), check_dtype=False
+    )
+
+
+def test_df_getattr_attribute_error_when_pandas_has(scalars_df_index):
+    # swapaxes is implemented in pandas but not in bigframes
+    with pytest.raises(AttributeError):
+        scalars_df_index.swapaxes()
+
+
+def test_df_getattr_attribute_error(scalars_df_index):
+    with pytest.raises(AttributeError):
+        scalars_df_index.not_a_method()
+
+
+def test_df_getattr_axes():
+    df = dataframe.DataFrame(
+        [[1, 1, 1], [1, 1, 1]], columns=["index", "columns", "my_column"]
+    )
+    assert isinstance(df.index, bigframes.core.indexes.Index)
+    assert isinstance(df.columns, pandas.Index)
+    assert isinstance(df.my_column, series.Series)
+
+
+def test_df_setattr_index():
+    pd_df = pandas.DataFrame(
+        [[1, 1, 1], [1, 1, 1]], columns=["index", "columns", "my_column"]
+    )
+    bf_df = dataframe.DataFrame(pd_df)
+
+    pd_df.index = pandas.Index([4, 5])
+    bf_df.index = [4, 5]
+
+    assert_pandas_df_equal(
+        pd_df, bf_df.to_pandas(), check_index_type=False, check_dtype=False
+    )
+
+
+def test_df_setattr_columns():
+    pd_df = pandas.DataFrame(
+        [[1, 1, 1], [1, 1, 1]], columns=["index", "columns", "my_column"]
+    )
+    bf_df = dataframe.DataFrame(pd_df)
+
+    pd_df.columns = typing.cast(pandas.Index, pandas.Index([4, 5, 6]))
+
+    bf_df.columns = pandas.Index([4, 5, 6])
+
+    assert_pandas_df_equal(
+        pd_df, bf_df.to_pandas(), check_index_type=False, check_dtype=False
+    )
+
+
+def test_df_setattr_modify_column():
+    pd_df = pandas.DataFrame(
+        [[1, 1, 1], [1, 1, 1]], columns=["index", "columns", "my_column"]
+    )
+    bf_df = dataframe.DataFrame(pd_df)
+    pd_df.my_column = [4, 5]
+    bf_df.my_column = [4, 5]
+
+    
assert_pandas_df_equal( + pd_df, bf_df.to_pandas(), check_index_type=False, check_dtype=False + ) + + +def test_loc_list_string_index(scalars_df_index, scalars_pandas_df_index): + index_list = scalars_pandas_df_index.string_col.iloc[[0, 1, 1, 5]].values + + scalars_df_index = scalars_df_index.set_index("string_col") + scalars_pandas_df_index = scalars_pandas_df_index.set_index("string_col") + + bf_result = scalars_df_index.loc[index_list].to_pandas() + pd_result = scalars_pandas_df_index.loc[index_list] + + pd.testing.assert_frame_equal( + bf_result, + pd_result, + ) + + +def test_loc_list_integer_index(scalars_df_index, scalars_pandas_df_index): + index_list = [3, 2, 1, 3, 2, 1] + + bf_result = scalars_df_index.loc[index_list] + pd_result = scalars_pandas_df_index.loc[index_list] + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_loc_list_multiindex(scalars_dfs): + scalars_df_index, scalars_pandas_df_index = scalars_dfs + scalars_df_multiindex = scalars_df_index.set_index(["string_col", "int64_col"]) + scalars_pandas_df_multiindex = scalars_pandas_df_index.set_index( + ["string_col", "int64_col"] + ) + index_list = [("Hello, World!", -234892), ("Hello, World!", 123456789)] + + bf_result = scalars_df_multiindex.loc[index_list] + pd_result = scalars_pandas_df_multiindex.loc[index_list] + + assert_dfs_equivalent( + pd_result, + bf_result, + ) + + +@pytest.mark.parametrize( + "index_list", + [ + [0, 1, 2, 3, 4, 4], + [0, 0, 0, 5, 4, 7, -2, -5, 3], + [-1, -2, -3, -4, -5, -5], + ], +) +def test_iloc_list(scalars_df_index, scalars_pandas_df_index, index_list): + bf_result = scalars_df_index.iloc[index_list] + pd_result = scalars_pandas_df_index.iloc[index_list] + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_iloc_list_multiindex(scalars_dfs): + scalars_df, scalars_pandas_df = scalars_dfs + scalars_df = scalars_df.copy() + scalars_pandas_df = scalars_pandas_df.copy() + scalars_df = scalars_df.set_index(["bytes_col", "numeric_col"]) + scalars_pandas_df = scalars_pandas_df.set_index(["bytes_col", "numeric_col"]) + + index_list = [0, 0, 0, 5, 4, 7] + + bf_result = scalars_df.iloc[index_list] + pd_result = scalars_pandas_df.iloc[index_list] + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_iloc_empty_list(scalars_df_index, scalars_pandas_df_index): + + index_list: List[int] = [] + + bf_result = scalars_df_index.iloc[index_list] + pd_result = scalars_pandas_df_index.iloc[index_list] + + bf_result = bf_result.to_pandas() + assert bf_result.shape == pd_result.shape # types are known to be different + + +def test_rename_axis(scalars_df_index, scalars_pandas_df_index): + bf_result = scalars_df_index.rename_axis("newindexname") + pd_result = scalars_pandas_df_index.rename_axis("newindexname") + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_rename_axis_nonstring(scalars_df_index, scalars_pandas_df_index): + bf_result = scalars_df_index.rename_axis((4,)) + pd_result = scalars_pandas_df_index.rename_axis((4,)) + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_loc_bf_series_string_index(scalars_df_index, scalars_pandas_df_index): + pd_string_series = scalars_pandas_df_index.string_col.iloc[[0, 5, 1, 1, 5]] + bf_string_series = scalars_df_index.string_col.iloc[[0, 5, 1, 1, 5]] + + scalars_df_index = scalars_df_index.set_index("string_col") + scalars_pandas_df_index = 
scalars_pandas_df_index.set_index("string_col") + + bf_result = scalars_df_index.loc[bf_string_series] + pd_result = scalars_pandas_df_index.loc[pd_string_series] + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_loc_bf_series_multiindex(scalars_df_index, scalars_pandas_df_index): + pd_string_series = scalars_pandas_df_index.string_col.iloc[[0, 5, 1, 1, 5]] + bf_string_series = scalars_df_index.string_col.iloc[[0, 5, 1, 1, 5]] + + scalars_df_multiindex = scalars_df_index.set_index(["string_col", "int64_col"]) + scalars_pandas_df_multiindex = scalars_pandas_df_index.set_index( + ["string_col", "int64_col"] + ) + + bf_result = scalars_df_multiindex.loc[bf_string_series] + pd_result = scalars_pandas_df_multiindex.loc[pd_string_series] + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_loc_bf_index_integer_index(scalars_df_index, scalars_pandas_df_index): + pd_index = scalars_pandas_df_index.iloc[[0, 5, 1, 1, 5]].index + bf_index = scalars_df_index.iloc[[0, 5, 1, 1, 5]].index + + bf_result = scalars_df_index.loc[bf_index] + pd_result = scalars_pandas_df_index.loc[pd_index] + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +def test_loc_bf_index_integer_index_renamed_col( + scalars_df_index, scalars_pandas_df_index +): + scalars_df_index = scalars_df_index.rename(columns={"int64_col": "rename"}) + scalars_pandas_df_index = scalars_pandas_df_index.rename( + columns={"int64_col": "rename"} + ) + + pd_index = scalars_pandas_df_index.iloc[[0, 5, 1, 1, 5]].index + bf_index = scalars_df_index.iloc[[0, 5, 1, 1, 5]].index + + bf_result = scalars_df_index.loc[bf_index] + pd_result = scalars_pandas_df_index.loc[pd_index] + + pd.testing.assert_frame_equal( + bf_result.to_pandas(), + pd_result, + ) + + +@pytest.mark.parametrize( + ("subset"), + [ + None, + "bool_col", + ["bool_col", "int64_too"], + ], +) +@pytest.mark.parametrize( + ("keep",), + [ + (False,), + ], +) +def test_df_drop_duplicates(scalars_df_index, scalars_pandas_df_index, keep, subset): + columns = ["bool_col", "int64_too", "int64_col"] + bf_df = scalars_df_index[columns].drop_duplicates(subset, keep=keep).to_pandas() + pd_df = scalars_pandas_df_index[columns].drop_duplicates(subset, keep=keep) + pd.testing.assert_frame_equal( + pd_df, + bf_df, + ) + + +@pytest.mark.parametrize( + ("subset"), + [ + None, + ["bool_col"], + ], +) +@pytest.mark.parametrize( + ("keep",), + [ + (False,), + ], +) +def test_df_duplicated(scalars_df_index, scalars_pandas_df_index, keep, subset): + columns = ["bool_col", "int64_too", "int64_col"] + bf_series = scalars_df_index[columns].duplicated(subset, keep=keep).to_pandas() + pd_series = scalars_pandas_df_index[columns].duplicated(subset, keep=keep) + pd.testing.assert_series_equal(pd_series, bf_series, check_dtype=False) + + +def test_df_from_dict_columns_orient(): + data = {"a": [1, 2], "b": [3.3, 2.4]} + bf_result = dataframe.DataFrame.from_dict(data, orient="columns").to_pandas() + pd_result = pd.DataFrame.from_dict(data, orient="columns") + assert_pandas_df_equal( + pd_result, bf_result, check_dtype=False, check_index_type=False + ) + + +def test_df_from_dict_index_orient(): + data = {"a": [1, 2], "b": [3.3, 2.4]} + bf_result = dataframe.DataFrame.from_dict( + data, orient="index", columns=["col1", "col2"] + ).to_pandas() + pd_result = pd.DataFrame.from_dict(data, orient="index", columns=["col1", "col2"]) + assert_pandas_df_equal( + pd_result, bf_result, check_dtype=False, check_index_type=False + 
)
+
+
+def test_df_from_dict_tight_orient():
+    data = {
+        "index": [("i1", "i2"), ("i3", "i4")],
+        "columns": ["col1", "col2"],
+        "data": [[1, 2.6], [3, 4.5]],
+        "index_names": ["in1", "in2"],
+        "column_names": ["column_axis"],
+    }
+
+    bf_result = dataframe.DataFrame.from_dict(data, orient="tight").to_pandas()
+    pd_result = pd.DataFrame.from_dict(data, orient="tight")
+    assert_pandas_df_equal(
+        pd_result, bf_result, check_dtype=False, check_index_type=False
+    )
+
+
+def test_df_from_records():
+    records = ((1, "a"), (2.5, "b"), (3.3, "c"), (4.9, "d"))
+
+    bf_result = dataframe.DataFrame.from_records(
+        records, columns=["c1", "c2"]
+    ).to_pandas()
+    pd_result = pd.DataFrame.from_records(records, columns=["c1", "c2"])
+    assert_pandas_df_equal(
+        pd_result, bf_result, check_dtype=False, check_index_type=False
+    )
+
+
+def test_df_to_dict(scalars_df_index, scalars_pandas_df_index):
+    unsupported = ["numeric_col"]  # formatted differently
+    bf_result = scalars_df_index.drop(columns=unsupported).to_dict()
+    pd_result = scalars_pandas_df_index.drop(columns=unsupported).to_dict()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_json_local_str(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.to_json()
+    # default_handler for arrow types that have no default conversion
+    pd_result = scalars_pandas_df_index.to_json(default_handler=str)
+
+    assert bf_result == pd_result
+
+
+def test_df_to_json_local_file(scalars_df_index, scalars_pandas_df_index):
+    # TODO: supply a reason why this isn't compatible with pandas 1.x
+    pytest.importorskip("pandas", minversion="2.0.0")
+    with tempfile.TemporaryFile() as bf_result_file, tempfile.TemporaryFile() as pd_result_file:
+        scalars_df_index.to_json(bf_result_file, orient="table")
+        # default_handler for arrow types that have no default conversion
+        scalars_pandas_df_index.to_json(
+            pd_result_file, orient="table", default_handler=str
+        )
+
+        bf_result = bf_result_file.read()
+        pd_result = pd_result_file.read()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_csv_local_str(scalars_df_index, scalars_pandas_df_index):
+    bf_result = scalars_df_index.to_csv()
+    pd_result = scalars_pandas_df_index.to_csv()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_csv_local_file(scalars_df_index, scalars_pandas_df_index):
+    with tempfile.TemporaryFile() as bf_result_file, tempfile.TemporaryFile() as pd_result_file:
+        scalars_df_index.to_csv(bf_result_file)
+        scalars_pandas_df_index.to_csv(pd_result_file)
+
+        bf_result = bf_result_file.read()
+        pd_result = pd_result_file.read()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_parquet_local_bytes(scalars_df_index, scalars_pandas_df_index):
+    # GEOGRAPHY not supported in parquet export.
+    unsupported = ["geography_col"]
+
+    bf_result = scalars_df_index.drop(columns=unsupported).to_parquet()
+    pd_result = scalars_pandas_df_index.drop(columns=unsupported).to_parquet()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_parquet_local_file(scalars_df_index, scalars_pandas_df_index):
+    # GEOGRAPHY not supported in parquet export.
+    unsupported = ["geography_col"]
+    with tempfile.TemporaryFile() as bf_result_file, tempfile.TemporaryFile() as pd_result_file:
+        scalars_df_index.drop(columns=unsupported).to_parquet(bf_result_file)
+        scalars_pandas_df_index.drop(columns=unsupported).to_parquet(pd_result_file)
+
+        bf_result = bf_result_file.read()
+        pd_result = pd_result_file.read()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_records(scalars_df_index, scalars_pandas_df_index):
+    unsupported = ["numeric_col"]
+    bf_result = scalars_df_index.drop(columns=unsupported).to_records()
+    pd_result = scalars_pandas_df_index.drop(columns=unsupported).to_records()
+
+    for bfi, pdi in zip(bf_result, pd_result):
+        for bfj, pdj in zip(bfi, pdi):
+            assert (pd.isna(bfj) and pd.isna(pdj)) or bfj == pdj
+
+
+def test_df_to_string(scalars_df_index, scalars_pandas_df_index):
+    unsupported = ["numeric_col"]  # formatted differently
+
+    bf_result = scalars_df_index.drop(columns=unsupported).to_string()
+    pd_result = scalars_pandas_df_index.drop(columns=unsupported).to_string()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_html(scalars_df_index, scalars_pandas_df_index):
+    unsupported = ["numeric_col"]  # formatted differently
+
+    bf_result = scalars_df_index.drop(columns=unsupported).to_html()
+    pd_result = scalars_pandas_df_index.drop(columns=unsupported).to_html()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_markdown(scalars_df_index, scalars_pandas_df_index):
+    # Nulls are dropped first to work around a tabulate bug: https://github.com/astanin/python-tabulate/issues/231
+    bf_result = scalars_df_index.dropna().to_markdown()
+    pd_result = scalars_pandas_df_index.dropna().to_markdown()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_pickle(scalars_df_index, scalars_pandas_df_index):
+    with tempfile.TemporaryFile() as bf_result_file, tempfile.TemporaryFile() as pd_result_file:
+        scalars_df_index.to_pickle(bf_result_file)
+        scalars_pandas_df_index.to_pickle(pd_result_file)
+        bf_result = bf_result_file.read()
+        pd_result = pd_result_file.read()
+
+    assert bf_result == pd_result
+
+
+def test_df_to_orc(scalars_df_index, scalars_pandas_df_index):
+    unsupported = [
+        "numeric_col",
+        "bytes_col",
+        "date_col",
+        "datetime_col",
+        "time_col",
+        "timestamp_col",
+        "geography_col",
+    ]
+
+    with tempfile.TemporaryFile() as bf_result_file, tempfile.TemporaryFile() as pd_result_file:
+        scalars_df_index.drop(columns=unsupported).to_orc(bf_result_file)
+        scalars_pandas_df_index.drop(columns=unsupported).reset_index().to_orc(
+            pd_result_file
+        )
+        bf_result = bf_result_file.read()
+        pd_result = pd_result_file.read()
+
+    assert bf_result == pd_result
+
+
+@pytest.mark.parametrize(
+    ("expr",),
+    [
+        ("new_col = int64_col + int64_too",),
+        ("new_col = (rowindex > 3) | bool_col",),
+        ("int64_too = bool_col\nnew_col2 = rowindex",),
+    ],
+)
+def test_df_eval(scalars_dfs, expr):
+    # TODO: supply a reason why this isn't compatible with pandas 1.x
+    pytest.importorskip("pandas", minversion="2.0.0")
+    scalars_df, scalars_pandas_df = scalars_dfs
+
+    bf_result = scalars_df.eval(expr).to_pandas()
+    pd_result = scalars_pandas_df.eval(expr)
+
+    pd.testing.assert_frame_equal(bf_result, pd_result)
+
+
+@pytest.mark.parametrize(
+    ("expr",),
+    [
+        ("int64_col > int64_too",),
+        ("bool_col",),
+        ("((int64_col - int64_too) % @local_var) == 0",),
+    ],
+)
+def test_df_query(scalars_dfs, expr):
+    # TODO: supply a reason why this isn't compatible with pandas 1.x
+    pytest.importorskip("pandas", minversion="2.0.0")
+    # local_var is referenced in expressions
+    local_var = 3  # NOQA
+    
scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = scalars_df.query(expr).to_pandas() + pd_result = scalars_pandas_df.query(expr) + + pd.testing.assert_frame_equal(bf_result, pd_result) + + +@pytest.mark.parametrize( + ("subset", "normalize", "ascending", "dropna"), + [ + (None, False, False, False), + (None, True, True, True), + ("bool_col", True, False, True), + ], +) +def test_df_value_counts(scalars_dfs, subset, normalize, ascending, dropna): + if pd.__version__.startswith("1."): + pytest.skip("pandas 1.x produces different column labels.") + scalars_df, scalars_pandas_df = scalars_dfs + + bf_result = ( + scalars_df[["string_col", "bool_col"]] + .value_counts(subset, normalize=normalize, ascending=ascending, dropna=dropna) + .to_pandas() + ) + pd_result = scalars_pandas_df[["string_col", "bool_col"]].value_counts( + subset, normalize=normalize, ascending=ascending, dropna=dropna + ) + + pd.testing.assert_series_equal( + bf_result, pd_result, check_dtype=False, check_index_type=False + ) + + +def test_df_bool_interpretation_error(scalars_df_index): + with pytest.raises(ValueError): + True if scalars_df_index else False + + +def test_assign_after_binop_row_joins(): + pd_df = pd.DataFrame( + { + "idx1": [1, 1, 1, 1, 2, 2, 2, 2], + "idx2": [10, 10, 20, 20, 10, 10, 20, 20], + "metric1": [10, 14, 2, 13, 6, 2, 9, 5], + "metric2": [25, -3, 8, 2, -1, 0, 0, -4], + }, + dtype=pd.Int64Dtype(), + ).set_index(["idx1", "idx2"]) + bf_df = dataframe.DataFrame(pd_df) + + # Expect implicit joiner to be used, preserving input cardinality rather than getting relational join + bf_df["metric_diff"] = bf_df.metric1 - bf_df.metric2 + pd_df["metric_diff"] = pd_df.metric1 - pd_df.metric2 + + assert_pandas_df_equal(bf_df.to_pandas(), pd_df) + + +def test_df_dot_inline(session): + df1 = pd.DataFrame([[1, 2, 3], [2, 5, 7]]) + df2 = pd.DataFrame([[2, 4, 8], [1, 5, 10], [3, 6, 9]]) + + bf1 = session.read_pandas(df1) + bf2 = session.read_pandas(df2) + bf_result = bf1.dot(bf2).to_pandas() + pd_result = df1.dot(df2) + + # Patch pandas dtypes for testing parity + # Pandas uses int64 instead of Int64 (nullable) dtype. + for name in pd_result.columns: + pd_result[name] = pd_result[name].astype(pd.Int64Dtype()) + pd_result.index = pd_result.index.astype(pd.Int64Dtype()) + + pd.testing.assert_frame_equal( + bf_result, + pd_result, + ) + + +def test_df_dot_series_inline(): + left = [[1, 2, 3], [2, 5, 7]] + right = [2, 1, 3] + + bf1 = dataframe.DataFrame(left) + bf2 = series.Series(right) + bf_result = bf1.dot(bf2).to_pandas() + + df1 = pd.DataFrame(left) + df2 = pd.Series(right) + pd_result = df1.dot(df2) + + # Patch pandas dtypes for testing parity + # Pandas result is int64 instead of Int64 (nullable) dtype. 
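+    # Both the values and the index are cast so the default strict dtype check
+    # in assert_series_equal can pass.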
+    pd_result = pd_result.astype(pd.Int64Dtype())
+    pd_result.index = pd_result.index.astype(pd.Int64Dtype())
+
+    pd.testing.assert_series_equal(
+        bf_result,
+        pd_result,
+    )
+
+
+@pytest.mark.parametrize(
+    ("col_names", "ignore_index"),
+    [
+        pytest.param(["A"], False, id="one_array_false"),
+        pytest.param(["A"], True, id="one_array_true"),
+        pytest.param(["B"], False, id="one_float_false"),
+        pytest.param(["B"], True, id="one_float_true"),
+        pytest.param(["A", "C"], False, id="two_arrays_false"),
+        pytest.param(["A", "C"], True, id="two_arrays_true"),
+    ],
+)
+def test_dataframe_explode(col_names, ignore_index, session):
+    data = {
+        "A": [[0, 1, 2], [], [3, 4]],
+        "B": 3,
+        "C": [["a", "b", "c"], np.nan, ["d", "e"]],
+    }
+
+    df = bpd.DataFrame(data, session=session)
+    pd_df = df.to_pandas()
+    pd_result = pd_df.explode(col_names, ignore_index=ignore_index)
+    bf_result = df.explode(col_names, ignore_index=ignore_index)
+
+    # Materialize once for comparison; to_pandas() should need at most a single
+    # query execution.
+    bf_materialized = bf_result.to_pandas()
+
+    pd.testing.assert_frame_equal(
+        bf_materialized,
+        pd_result,
+        check_index_type=False,
+        check_dtype=False,
+    )
+
+
+@pytest.mark.parametrize(
+    ("ignore_index", "ordered"),
+    [
+        pytest.param(True, True, id="include_index_ordered"),
+        pytest.param(True, False, id="include_index_unordered"),
+        pytest.param(False, True, id="ignore_index_ordered"),
+    ],
+)
+def test_dataframe_explode_preserve_order(session, ignore_index, ordered):
+    data = {
+        "a": [np.random.randint(0, 10, 10) for _ in range(10)],
+        "b": [np.random.randint(0, 10, 10) for _ in range(10)],
+    }
+    df = bpd.DataFrame(data)
+    pd_df = pd.DataFrame(data)
+
+    res = df.explode(["a", "b"], ignore_index=ignore_index).to_pandas(ordered=ordered)
+    pd_res = pd_df.explode(["a", "b"], ignore_index=ignore_index).astype(
+        pd.Int64Dtype()
+    )
+    pd.testing.assert_frame_equal(
+        res if ordered else res.sort_index(),
+        pd_res,
+        check_index_type=False,
+    )
+
+
+@pytest.mark.parametrize(
+    ("col_names"),
+    [
+        pytest.param([], id="empty", marks=pytest.mark.xfail(raises=ValueError)),
+        pytest.param(
+            ["A", "A"], id="duplicate", marks=pytest.mark.xfail(raises=ValueError)
+        ),
+        pytest.param("unknown", id="unknown", marks=pytest.mark.xfail(raises=KeyError)),
+    ],
+)
+def test_dataframe_explode_xfail(col_names):
+    df = bpd.DataFrame({"A": [[0, 1, 2], [], [3, 4]]})
+    df.explode(col_names)