From 32e81b711ecc41aa465900b863ed8ba7963415d7 Mon Sep 17 00:00:00 2001 From: Hazem Elmeleegy Date: Mon, 16 Sep 2024 10:31:31 -0700 Subject: [PATCH] =?UTF-8?q?SNOW-1665707:=20Move=20general.py=20into=20src/?= =?UTF-8?q?=E2=80=A6/modin/plugin/extensions/?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../snowpark/modin/pandas/__init__.py | 52 +- .../{pandas => plugin/extensions}/general.py | 4218 +++++++++-------- 2 files changed, 2146 insertions(+), 2124 deletions(-) rename src/snowflake/snowpark/modin/{pandas => plugin/extensions}/general.py (98%) diff --git a/src/snowflake/snowpark/modin/pandas/__init__.py b/src/snowflake/snowpark/modin/pandas/__init__.py index 8f9834630b7..d188236315c 100644 --- a/src/snowflake/snowpark/modin/pandas/__init__.py +++ b/src/snowflake/snowpark/modin/pandas/__init__.py @@ -95,32 +95,6 @@ register_dataframe_accessor, register_series_accessor, ) -from snowflake.snowpark.modin.pandas.general import ( - bdate_range, - concat, - crosstab, - cut, - date_range, - get_dummies, - isna, - isnull, - lreshape, - melt, - merge, - merge_asof, - merge_ordered, - notna, - notnull, - pivot, - pivot_table, - qcut, - to_datetime, - to_numeric, - to_timedelta, - unique, - value_counts, - wide_to_long, -) from snowflake.snowpark.modin.pandas.io import ( # read_json is provided by overrides module ExcelFile, HDFStore, @@ -151,6 +125,32 @@ TELEMETRY_PRIVATE_METHODS, try_add_telemetry_to_attribute, ) +from snowflake.snowpark.modin.plugin.extensions.general import ( + bdate_range, + concat, + crosstab, + cut, + date_range, + get_dummies, + isna, + isnull, + lreshape, + melt, + merge, + merge_asof, + merge_ordered, + notna, + notnull, + pivot, + pivot_table, + qcut, + to_datetime, + to_numeric, + to_timedelta, + unique, + value_counts, + wide_to_long, +) from snowflake.snowpark.modin.plugin.utils.frontend_constants import _ATTRS_NO_LOOKUP # The extensions assigned to this module diff --git a/src/snowflake/snowpark/modin/pandas/general.py b/src/snowflake/snowpark/modin/plugin/extensions/general.py similarity index 98% rename from src/snowflake/snowpark/modin/pandas/general.py rename to src/snowflake/snowpark/modin/plugin/extensions/general.py index 5024d0618ac..58f945e25c0 100644 --- a/src/snowflake/snowpark/modin/pandas/general.py +++ b/src/snowflake/snowpark/modin/plugin/extensions/general.py @@ -31,7 +31,7 @@ import numpy as np import pandas import pandas.core.common as common -from modin.pandas import DataFrame, Series +from modin.pandas import Series from modin.pandas.base import BasePandasDataset from pandas import IntervalIndex, NaT, Timedelta, Timestamp from pandas._libs import NaTType, lib @@ -65,6 +65,7 @@ # add this line to make doctests runnable from snowflake.snowpark.modin import pandas as pd # noqa: F401 +from snowflake.snowpark.modin.pandas.dataframe import DataFrame from snowflake.snowpark.modin.pandas.utils import ( is_scalar, raise_if_native_pandas_objects, @@ -91,9 +92,10 @@ # linking to `snowflake.snowpark.DataFrame`, we need to explicitly # qualify return types in this file with `modin.pandas.DataFrame`. 
# SNOW-1233342: investigate how to fix these links without using absolute paths - import modin from modin.core.storage_formats import BaseQueryCompiler # pragma: no cover + import snowflake # pragma: no cover + _logger = getLogger(__name__) VALID_DATE_TYPE = Union[ @@ -101,513 +103,177 @@ ] +########################################################################### +# Data manipulations +########################################################################### + + @snowpark_pandas_telemetry_standalone_function_decorator -@_inherit_docstrings(pandas.isna, apilink="pandas.isna") -def isna(obj): # noqa: PR01, RT01, D200 - """ - Detect missing values for an array-like object. +def melt( + frame, + id_vars=None, + value_vars=None, + var_name=None, + value_name="value", + col_level=None, + ignore_index: bool = True, +): # noqa: PR01, RT01, D200 """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if isinstance(obj, BasePandasDataset): - return obj.isna() - else: - return pandas.isna(obj) + Unpivot a DataFrame from wide to long format, optionally leaving identifiers set. + Parameters + ---------- + id_vars : list of identifiers to retain in the result + value_vars : list of columns to unpivot on + defaults to all columns, excluding the id_vars columns + var_name : variable name, defaults to "variable" + value_name : value name, defaults to "value" + col_level : int, not implemented + ignore_index : bool, not implemented -isnull = isna + Returns + ------- + :class:`~modin.pandas.DataFrame` + unpivoted on the value columns + Examples + -------- + >>> df = pd.DataFrame({'A': {0: 'a', 1: 'b', 2: 'c'}, + ... 'B': {0: 1, 1: 3, 2: 5}, + ... 'C': {0: 2, 1: 4, 2: 6}}) -@snowpark_pandas_telemetry_standalone_function_decorator -@_inherit_docstrings(pandas.notna, apilink="pandas.notna") -def notna(obj): # noqa: PR01, RT01, D200 - """ - Detect non-missing values for an array-like object. + >>> pd.melt(df) + variable value + 0 A a + 1 A b + 2 A c + 3 B 1 + 4 B 3 + 5 B 5 + 6 C 2 + 7 C 4 + 8 C 6 + + >>> df = pd.DataFrame({'A': {0: 'a', 1: 'b', 2: 'c'}, + ... 'B': {0: 1, 1: 3, 2: 5}, + ... 'C': {0: 2, 1: 4, 2: 6}}) + >>> pd.melt(df, id_vars=['A'], value_vars=['B'], var_name='myVarname', value_name='myValname') + A myVarname myValname + 0 a B 1 + 1 b B 3 + 2 c B 5 """ # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if isinstance(obj, BasePandasDataset): - return obj.notna() - else: - return pandas.notna(obj) - - -notnull = notna + return frame.melt( + id_vars=id_vars, + value_vars=value_vars, + var_name=var_name, + value_name=value_name, + col_level=col_level, + ignore_index=ignore_index, + ) @snowpark_pandas_telemetry_standalone_function_decorator -def merge( - left: modin.pandas.DataFrame | Series, - right: modin.pandas.DataFrame | Series, - how: str | None = "inner", - on: IndexLabel | None = None, - left_on: None - | (Hashable | AnyArrayLike | Sequence[Hashable | AnyArrayLike]) = None, - right_on: None - | (Hashable | AnyArrayLike | Sequence[Hashable | AnyArrayLike]) = None, - left_index: bool | None = False, - right_index: bool | None = False, - sort: bool | None = False, - suffixes: Suffixes | None = ("_x", "_y"), - copy: bool | None = True, - indicator: bool | str | None = False, - validate: str | None = None, -): +def pivot(data, index=None, columns=None, values=None): # noqa: PR01, RT01, D200 """ - Merge DataFrame or named Series objects with a database-style join. - - A named Series object is treated as a DataFrame with a single named column. 
- - The join is done on columns or indexes. If joining columns on - columns, the DataFrame indexes *will be ignored*. Otherwise if joining indexes - on indexes or indexes on a column or columns, the index will be passed on. - When performing a cross merge, no column specifications to merge on are - allowed. - - .. warning:: + Return reshaped DataFrame organized by given index / column values. - If both key columns contain rows where the key is a null value, those - rows will be matched against each other. This is different from usual SQL - join behaviour and can lead to unexpected results. + Reshape data (produce a “pivot” table) based on column values. Uses unique values from + specified index / columns to form axes of the resulting DataFrame. This function does not + support data aggregation, multiple values will result in a MultiIndex in the columns. Parameters ---------- - left : :class:`~modin.pandas.DataFrame` or named Series - right : :class:`~modin.pandas.DataFrame` or named Series - Object to merge with. - how : {'left', 'right', 'outer', 'inner', 'cross'}, default 'inner' - Type of merge to be performed. - - * left: use only keys from left frame, similar to a SQL left outer join; - preserve key order. - * right: use only keys from right frame, similar to a SQL right outer join; - preserve key order. - * outer: use union of keys from both frames, similar to a SQL full outer - join; sort keys lexicographically. - * inner: use intersection of keys from both frames, similar to a SQL inner - join; preserve the order of the left keys. - * cross: creates the cartesian product from both frames, preserves the order - of the left keys. - - on : label or list - Column or index level names to join on. These must be found in both - DataFrames. If `on` is None and not merging on indexes then this defaults - to the intersection of the columns in both DataFrames. - left_on : label or list, or array-like - Column or index level names to join on in the left DataFrame. Can also - be an array or list of arrays of the length of the left DataFrame. - These arrays are treated as if they are columns. - right_on : label or list, or array-like - Column or index level names to join on in the right DataFrame. Can also - be an array or list of arrays of the length of the right DataFrame. - These arrays are treated as if they are columns. - left_index : bool, default False - Use the index from the left DataFrame as the join key(s). If it is a - MultiIndex, the number of keys in the other DataFrame (either the index - or a number of columns) must match the number of levels. - right_index : bool, default False - Use the index from the right DataFrame as the join key. Same caveats as - left_index. - sort : bool, default False - Sort the join keys lexicographically in the result DataFrame. If False, - the order of the join keys depends on the join type (how keyword). - suffixes : list-like, default is ("_x", "_y") - A length-2 sequence where each element is optionally a string - indicating the suffix to add to overlapping column names in - `left` and `right` respectively. Pass a value of `None` instead - of a string to indicate that the column name from `left` or - `right` should be left as-is, with no suffix. At least one of the - values must not be None. - copy : bool, default True - This argument is ignored in Snowpark pandas API. - indicator : bool or str, default False - If True, adds a column to the output DataFrame called "_merge" with - information on the source of each row. 
The column can be given a different - name by providing a string argument. The column will have a Categorical - type with the value of "left_only" for observations whose merge key only - appears in the left DataFrame, "right_only" for observations - whose merge key only appears in the right DataFrame, and "both" - if the observation's merge key is found in both DataFrames. - - validate : str, optional - This is not yet supported. + data : :class:`~modin.pandas.DataFrame` + columns : str or object or a list of str + Column to use to make new frame’s columns. + index : str or object or a list of str, optional + Column to use to make new frame’s index. If not given, uses existing index. + values : str, object or a list of the previous, optional + Column(s) to use for populating new frame’s values. If not specified, all remaining columns + will be used and the result will have hierarchically indexed columns. Returns ------- :class:`~modin.pandas.DataFrame` - A DataFrame of the two merged objects. + + Notes + ----- + Calls pivot_table with columns, values, index and aggregation "min". See Also -------- - merge_ordered : Merge with optional filling/interpolation. - merge_asof : Merge on nearest keys. - DataFrame.join : Similar method using indices. + DataFrame.pivot_table : Generalization of pivot that can handle + duplicate values for one index/column pair. + DataFrame.unstack: Pivot based on the index values instead + of a column. + wide_to_long : Wide panel to long format. Less flexible but more + user-friendly than melt. Examples -------- - >>> df1 = pd.DataFrame({'lkey': ['foo', 'bar', 'baz', 'foo'], - ... 'value': [1, 2, 3, 5]}) - >>> df2 = pd.DataFrame({'rkey': ['foo', 'bar', 'baz', 'foo'], - ... 'value': [5, 6, 7, 8]}) - >>> df1 - lkey value - 0 foo 1 - 1 bar 2 - 2 baz 3 - 3 foo 5 - >>> df2 - rkey value - 0 foo 5 - 1 bar 6 - 2 baz 7 - 3 foo 8 - - Merge df1 and df2 on the lkey and rkey columns. The value columns have - the default suffixes, _x and _y, appended. - - >>> df1.merge(df2, left_on='lkey', right_on='rkey') - lkey value_x rkey value_y - 0 foo 1 foo 5 - 1 foo 1 foo 8 - 2 bar 2 bar 6 - 3 baz 3 baz 7 - 4 foo 5 foo 5 - 5 foo 5 foo 8 - - Merge DataFrames df1 and df2 with specified left and right suffixes - appended to any overlapping columns. - - >>> df1.merge(df2, left_on='lkey', right_on='rkey', - ... suffixes=('_left', '_right')) - lkey value_left rkey value_right - 0 foo 1 foo 5 - 1 foo 1 foo 8 - 2 bar 2 bar 6 - 3 baz 3 baz 7 - 4 foo 5 foo 5 - 5 foo 5 foo 8 - - - >>> df1 = pd.DataFrame({'a': ['foo', 'bar'], 'b': [1, 2]}) - >>> df2 = pd.DataFrame({'a': ['foo', 'baz'], 'c': [3, 4]}) - >>> df1 - a b - 0 foo 1 - 1 bar 2 - >>> df2 - a c - 0 foo 3 - 1 baz 4 - - >>> df1.merge(df2, how='inner', on='a') - a b c - 0 foo 1 3 - - >>> df1.merge(df2, how='left', on='a') - a b c - 0 foo 1 3.0 - 1 bar 2 NaN - - >>> df1 = pd.DataFrame({'left': ['foo', 'bar']}) - >>> df2 = pd.DataFrame({'right': [7, 8]}) - >>> df1 - left - 0 foo - 1 bar - >>> df2 - right - 0 7 - 1 8 - - >>> df1.merge(df2, how='cross') - left right - 0 foo 7 - 1 foo 8 - 2 bar 7 - 3 bar 8 - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - # Raise error if 'left' or 'right' is native pandas object. 
- raise_if_native_pandas_objects(left) - raise_if_native_pandas_objects(right) - - if isinstance(left, Series): - if left.name is None: - raise ValueError("Cannot merge a Series without a name") - else: - left = left.to_frame() - - if not isinstance(left, DataFrame): - raise TypeError( - f"Can only merge Series or DataFrame objects, a {type(left)} was passed" - ) - - return left.merge( - right, - how=how, - on=on, - left_on=left_on, - right_on=right_on, - left_index=left_index, - right_index=right_index, - sort=sort, - suffixes=suffixes, - copy=copy, - indicator=indicator, - validate=validate, - ) - - -@snowpark_pandas_telemetry_standalone_function_decorator -@pandas_module_level_function_not_implemented() -@_inherit_docstrings(pandas.merge_ordered, apilink="pandas.merge_ordered") -def merge_ordered( - left, - right, - on=None, - left_on=None, - right_on=None, - left_by=None, - right_by=None, - fill_method=None, - suffixes=("_x", "_y"), - how: str = "outer", -) -> DataFrame: # noqa: PR01, RT01, D200 - """ - Perform a merge for ordered data with optional filling/interpolation. - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if not isinstance(left, DataFrame): - raise ValueError(f"can not merge DataFrame with instance of type {type(right)}") - if isinstance(right, DataFrame): - right = to_pandas(right) - return DataFrame( - pandas.merge_ordered( - to_pandas(left), - right, - on=on, - left_on=left_on, - right_on=right_on, - left_by=left_by, - right_by=right_by, - fill_method=fill_method, - suffixes=suffixes, - how=how, - ) - ) - - -@snowpark_pandas_telemetry_standalone_function_decorator -@_inherit_docstrings(pandas.merge_asof, apilink="pandas.merge_asof") -def merge_asof( - left, - right, - on: str | None = None, - left_on: str | None = None, - right_on: str | None = None, - left_index: bool = False, - right_index: bool = False, - by: str | list[str] | None = None, - left_by: str | None = None, - right_by: str | None = None, - suffixes: Suffixes = ("_x", "_y"), - tolerance: int | Timedelta | None = None, - allow_exact_matches: bool = True, - direction: str = "backward", -) -> modin.pandas.DataFrame: - """ - Perform a merge by key distance. - - This is similar to a left-join except that we match on nearest key rather than equal keys. - Both DataFrames must be sorted by the key. For each row in the left DataFrame: - - A “backward” search selects the last row in the right DataFrame whose ‘on’ key is less than or equal to the left’s key. - A “forward” search selects the first row in the right DataFrame whose ‘on’ key is greater than or equal to the left’s key. - A “nearest” search selects the row in the right DataFrame whose ‘on’ key is closest in absolute distance to the left’s key. - - Optionally match on equivalent keys with ‘by’ before searching with ‘on’. - - Parameters - ---------- - left : :class:`~modin.pandas.DataFrame` or named :class:`~modin.pandas.Series`. - right : :class:`~modin.pandas.DataFrame` or named :class:`~modin.pandas.Series`. - on : label - Field name to join on. Must be found in both DataFrames. The data MUST be ordered. - Furthermore, this must be a numeric column such as datetimelike, integer, or float. - On or left_on/right_on must be given. - left_on : label - Field name to join on in left DataFrame. - right_on : label - Field name to join on in right DataFrame. - left_index : bool - Use the index of the left DataFrame as the join key. - right_index : bool - Use the index of the right DataFrame as the join key. 
- by : column name or list of column names - Match on these columns before performing merge operation. - left_by : column name - Field names to match on in the left DataFrame. - right_by : column name - Field names to match on in the right DataFrame. - suffixes : 2-length sequence (tuple, list, …) - Suffix to apply to overlapping column names in the left and right side, respectively. - tolerance: int or Timedelta, optional, default None - Select asof tolerance within this range; must be compatible with the merge index. - allow_exact_matches : bool, default True - If True, allow matching with the same ‘on’ value (i.e. less-than-or-equal-to / greater-than-or-equal-to) - If False, don’t match the same ‘on’ value (i.e., strictly less-than / strictly greater-than). - direction : ‘backward’ (default), ‘forward’, or ‘nearest’ - Whether to search for prior, subsequent, or closest matches. - - Returns - ------- - Snowpark pandas :class:`~modin.pandas.DataFrame` - - Examples - -------- - >>> left = pd.DataFrame({"a": [1, 5, 10], "left_val": ["a", "b", "c"]}) - >>> left - a left_val - 0 1 a - 1 5 b - 2 10 c - >>> right = pd.DataFrame({"a": [1, 2, 3, 6, 7], "right_val": [1, 2, 3, 6, 7]}) - >>> right - a right_val - 0 1 1 - 1 2 2 - 2 3 3 - 3 6 6 - 4 7 7 - >>> pd.merge_asof(left, right, on="a") - a left_val right_val - 0 1 a 1 - 1 5 b 3 - 2 10 c 7 - >>> pd.merge_asof(left, right, on="a", allow_exact_matches=False) - a left_val right_val - 0 1 a NaN - 1 5 b 3.0 - 2 10 c 7.0 - >>> pd.merge_asof(left, right, on="a", direction="forward") - a left_val right_val - 0 1 a 1.0 - 1 5 b 6.0 - 2 10 c NaN - - Here is a real-world times-series example: - - >>> quotes = pd.DataFrame( - ... { - ... "time": [ - ... pd.Timestamp("2016-05-25 13:30:00.023"), - ... pd.Timestamp("2016-05-25 13:30:00.023"), - ... pd.Timestamp("2016-05-25 13:30:00.030"), - ... pd.Timestamp("2016-05-25 13:30:00.041"), - ... pd.Timestamp("2016-05-25 13:30:00.048"), - ... pd.Timestamp("2016-05-25 13:30:00.049"), - ... pd.Timestamp("2016-05-25 13:30:00.072"), - ... pd.Timestamp("2016-05-25 13:30:00.075") - ... ], - ... "bid": [720.50, 51.95, 51.97, 51.99, 720.50, 97.99, 720.50, 52.01], - ... "ask": [720.93, 51.96, 51.98, 52.00, 720.93, 98.01, 720.88, 52.03] - ... } - ... ) - >>> quotes - time bid ask - 0 2016-05-25 13:30:00.023 720.50 720.93 - 1 2016-05-25 13:30:00.023 51.95 51.96 - 2 2016-05-25 13:30:00.030 51.97 51.98 - 3 2016-05-25 13:30:00.041 51.99 52.00 - 4 2016-05-25 13:30:00.048 720.50 720.93 - 5 2016-05-25 13:30:00.049 97.99 98.01 - 6 2016-05-25 13:30:00.072 720.50 720.88 - 7 2016-05-25 13:30:00.075 52.01 52.03 - >>> trades = pd.DataFrame( - ... { - ... "time": [ - ... pd.Timestamp("2016-05-25 13:30:00.023"), - ... pd.Timestamp("2016-05-25 13:30:00.038"), - ... pd.Timestamp("2016-05-25 13:30:00.048"), - ... pd.Timestamp("2016-05-25 13:30:00.048"), - ... pd.Timestamp("2016-05-25 13:30:00.048") - ... ], - ... "price": [51.95, 51.95, 720.77, 720.92, 98.0], - ... "quantity": [75, 155, 100, 100, 100] - ... } - ... 
) - >>> trades - time price quantity - 0 2016-05-25 13:30:00.023 51.95 75 - 1 2016-05-25 13:30:00.038 51.95 155 - 2 2016-05-25 13:30:00.048 720.77 100 - 3 2016-05-25 13:30:00.048 720.92 100 - 4 2016-05-25 13:30:00.048 98.00 100 - >>> pd.merge_asof(trades, quotes, on="time") - time price quantity bid ask - 0 2016-05-25 13:30:00.023 51.95 75 51.95 51.96 - 1 2016-05-25 13:30:00.038 51.95 155 51.97 51.98 - 2 2016-05-25 13:30:00.048 720.77 100 720.50 720.93 - 3 2016-05-25 13:30:00.048 720.92 100 720.50 720.93 - 4 2016-05-25 13:30:00.048 98.00 100 720.50 720.93 - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if not isinstance(left, DataFrame): - raise ValueError(f"can not merge DataFrame with instance of type {type(left)}") - if not isinstance(right, DataFrame): - raise ValueError(f"can not merge DataFrame with instance of type {type(right)}") - - # As of pandas 1.2 these should raise an error; before that it did - # something likely random: - if ( - (on and (left_index or right_index)) - or (left_on and left_index) - or (right_on and right_index) - ): - raise ValueError("Can't combine left/right_index with left/right_on or on.") - - if on is not None: - if left_on is not None or right_on is not None: - raise ValueError("If 'on' is set, 'left_on' and 'right_on' can't be set.") - if is_list_like(on) and len(on) > 1: - raise MergeError("can only asof on a key for left") - left_on = on - right_on = on - - if by is not None: - if left_by is not None or right_by is not None: - raise ValueError("Can't have both 'by' and 'left_by' or 'right_by'") - left_by = right_by = by - - if left_on is None and not left_index: - raise ValueError("Must pass on, left_on, or left_index=True") - - if right_on is None and not right_index: - raise ValueError("Must pass on, right_on, or right_index=True") - - if not left_index and not right_index: - left_on_length = len(left_on) if is_list_like(left_on) else 1 - right_on_length = len(right_on) if is_list_like(right_on) else 1 - if left_on_length != right_on_length: - raise ValueError("len(right_on) must equal len(left_on)") - if left_on_length > 1: - raise MergeError("can only asof on a key for left") - - return DataFrame( - query_compiler=left._query_compiler.merge_asof( - right._query_compiler, - on, - left_on, - right_on, - left_index, - right_index, - by, - left_by, - right_by, - suffixes, - tolerance, - allow_exact_matches, - direction, - ) - ) + >>> df = pd.DataFrame({'foo': ['one', 'one', 'one', 'two', 'two', + ... 'two'], + ... 'bar': ['A', 'B', 'C', 'A', 'B', 'C'], + ... 'baz': [1, 2, 3, 4, 5, 6], + ... 'zoo': ['x', 'y', 'z', 'q', 'w', 't']}) + >>> df + foo bar baz zoo + 0 one A 1 x + 1 one B 2 y + 2 one C 3 z + 3 two A 4 q + 4 two B 5 w + 5 two C 6 t + >>> pd.pivot(data=df, index='foo', columns='bar', values='baz') # doctest: +NORMALIZE_WHITESPACE + bar A B C + foo + one 1 2 3 + two 4 5 6 + >>> pd.pivot(data=df, index='foo', columns='bar')['baz'] # doctest: +NORMALIZE_WHITESPACE + bar A B C + foo + one 1 2 3 + two 4 5 6 + >>> pd.pivot(data=df, index='foo', columns='bar', values=['baz', 'zoo']) # doctest: +NORMALIZE_WHITESPACE + baz zoo + bar A B C A B C + foo + one 1 2 3 x y z + two 4 5 6 q w t + >>> df = pd.DataFrame({ + ... "lev1": [1, 1, 1, 2, 2, 2], + ... "lev2": [1, 1, 2, 1, 1, 2], + ... "lev3": [1, 2, 1, 2, 1, 2], + ... "lev4": [1, 2, 3, 4, 5, 6], + ... 
"values": [0, 1, 2, 3, 4, 5]}) + >>> df + lev1 lev2 lev3 lev4 values + 0 1 1 1 1 0 + 1 1 1 2 2 1 + 2 1 2 1 3 2 + 3 2 1 2 4 3 + 4 2 1 1 5 4 + 5 2 2 2 6 5 + >>> pd.pivot(data=df, index="lev1", columns=["lev2", "lev3"], values="values") # doctest: +NORMALIZE_WHITESPACE + lev2 1 2 + lev3 1 2 1 2 + lev1 + 1 0 1 2.0 NaN + 2 4 3 NaN 5.0 + >>> pd.pivot(data=df, index=["lev1", "lev2"], columns=["lev3"], values="values") # doctest: +NORMALIZE_WHITESPACE + lev3 1 2 + lev1 lev2 + 1 1 0.0 1.0 + 2 2.0 NaN + 2 1 4.0 3.0 + 2 NaN 5.0 + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + if not isinstance(data, DataFrame): + raise ValueError(f"can not pivot with instance of type {type(data)}") + return data.pivot(index=index, columns=columns, values=values) @snowpark_pandas_telemetry_standalone_function_decorator @@ -789,1041 +455,1472 @@ def pivot_table( aggfunc=aggfunc, fill_value=fill_value, margins=margins, - dropna=dropna, + dropna=dropna, + margins_name=margins_name, + sort=sort, + ) + + +@snowpark_pandas_telemetry_standalone_function_decorator +def crosstab( + index, + columns, + values=None, + rownames=None, + colnames=None, + aggfunc=None, + margins=False, + margins_name: str = "All", + dropna: bool = True, + normalize=False, +) -> DataFrame: # noqa: PR01, RT01, D200 + """ + Compute a simple cross tabulation of two (or more) factors. + + By default, computes a frequency table of the factors unless an array + of values and an aggregation function are passed. + + Parameters + ---------- + index : array-like, Series, or list of arrays/Series + Values to group by in the rows. + columns : array-like, Series, or list of arrays/Series + Values to group by in the columns. + values : array-like, optional + Array of values to aggregate according to the factors. + Requires aggfunc be specified. + rownames : sequence, default None + If passed, must match number of row arrays passed. + colnames : sequence, default None + If passed, must match number of column arrays passed. + aggfunc : function, optional + If specified, requires values be specified as well. + margins : bool, default False + Add row/column margins (subtotals). + margins_name : str, default 'All' + Name of the row/column that will contain the totals when margins is True. + dropna : bool, default True + Do not include columns whose entries are all NaN. + + normalize : bool, {'all', 'index', 'columns'}, or {0,1}, default False + Normalize by dividing all values by the sum of values. + + * If passed 'all' or True, will normalize over all values. + * If passed 'index' will normalize over each row. + * If passed 'columns' will normalize over each column. + * If margins is True, will also normalize margin values. + + Returns + ------- + Snowpark pandas :class:`~modin.pandas.DataFrame` + Cross tabulation of the data. + + Notes + ----- + + Raises NotImplementedError if aggfunc is not one of "count", "mean", "min", "max", or "sum", or + margins is True, normalize is True or all, and values is passed. + + Examples + -------- + >>> a = np.array(["foo", "foo", "foo", "foo", "bar", "bar", + ... "bar", "bar", "foo", "foo", "foo"], dtype=object) + >>> b = np.array(["one", "one", "one", "two", "one", "one", + ... "one", "two", "two", "two", "one"], dtype=object) + >>> c = np.array(["dull", "dull", "shiny", "dull", "dull", "shiny", + ... "shiny", "dull", "shiny", "shiny", "shiny"], + ... 
dtype=object) + >>> pd.crosstab(a, [b, c], rownames=['a'], colnames=['b', 'c']) # doctest: +NORMALIZE_WHITESPACE + b one two + c dull shiny dull shiny + a + bar 1 2 1 0 + foo 2 2 1 2 + """ + if values is None and aggfunc is not None: + raise ValueError("aggfunc cannot be used without values.") + + if values is not None and aggfunc is None: + raise ValueError("values cannot be used without an aggfunc.") + + if not is_nested_list_like(index): + index = [index] + if not is_nested_list_like(columns): + columns = [columns] + + if ( + values is not None + and margins is True + and (normalize is True or normalize == "all") + ): + raise NotImplementedError( + 'Snowpark pandas does not yet support passing in margins=True, normalize="all", and values.' + ) + + user_passed_rownames = rownames is not None + user_passed_colnames = colnames is not None + + from pandas.core.reshape.pivot import _build_names_mapper, _get_names + + def _get_names_wrapper(list_of_objs, names, prefix): + """ + Helper method to expand DataFrame objects containing + multiple columns into Series, since `_get_names` expects + one column per entry. + """ + expanded_list_of_objs = [] + for obj in list_of_objs: + if isinstance(obj, DataFrame): + for col in obj.columns: + expanded_list_of_objs.append(obj[col]) + else: + expanded_list_of_objs.append(obj) + return _get_names(expanded_list_of_objs, names, prefix) + + rownames = _get_names_wrapper(index, rownames, prefix="row") + colnames = _get_names_wrapper(columns, colnames, prefix="col") + + ( + rownames_mapper, + unique_rownames, + colnames_mapper, + unique_colnames, + ) = _build_names_mapper(rownames, colnames) + + pass_objs = [x for x in index + columns if isinstance(x, (Series, DataFrame))] + row_idx_names = None + col_idx_names = None + if pass_objs: + # If we have any Snowpark pandas objects in the index or columns, then we + # need to find the intersection of their indices, and only pick rows from + # the objects that have indices in the intersection of their indices. + # After we do that, we then need to append the non Snowpark pandas objects + # using the intersection of indices as the final index for the DataFrame object. + # First, we separate the objects into Snowpark pandas objects, and non-Snowpark + # pandas objects (while renaming them so that they have unique names). 
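+        # For intuition, a hypothetical example (not taken from the tests): given
+        #   a = pd.Series(["x", "y", "z"], index=[0, 1, 2])
+        #   b = pd.Series(["p", "q", "r"], index=[1, 2, 3])
+        # only the rows whose index labels appear in both objects (1 and 2)
+        # would contribute to the resulting frequency table.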
+ rownames_idx = 0 + row_idx_names = [] + dfs = [] + arrays = [] + array_lengths = [] + for obj in index: + if isinstance(obj, Series): + row_idx_names.append(obj.name) + df = pd.DataFrame(obj) + df.columns = [unique_rownames[rownames_idx]] + rownames_idx += 1 + dfs.append(df) + elif isinstance(obj, DataFrame): + row_idx_names.extend(obj.columns) + obj.columns = unique_rownames[ + rownames_idx : rownames_idx + len(obj.columns) + ] + rownames_idx += len(obj.columns) + dfs.append(obj) + else: + row_idx_names.append(None) + array_lengths.append(len(obj)) + df = pd.DataFrame(obj) + df.columns = unique_rownames[ + rownames_idx : rownames_idx + len(df.columns) + ] + rownames_idx += len(df.columns) + arrays.append(df) + + colnames_idx = 0 + col_idx_names = [] + for obj in columns: + if isinstance(obj, Series): + col_idx_names.append(obj.name) + df = pd.DataFrame(obj) + df.columns = [unique_colnames[colnames_idx]] + colnames_idx += 1 + dfs.append(df) + elif isinstance(obj, DataFrame): + col_idx_names.extend(obj.columns) + obj.columns = unique_colnames[ + colnames_idx : colnames_idx + len(obj.columns) + ] + colnames_idx += len(obj.columns) + dfs.append(obj) + else: + col_idx_names.append(None) + array_lengths.append(len(obj)) + df = pd.DataFrame(obj) + df.columns = unique_colnames[ + colnames_idx : colnames_idx + len(df.columns) + ] + colnames_idx += len(df.columns) + arrays.append(df) + + if len(set(array_lengths)) > 1: + raise ValueError("All arrays must be of the same length") + + # Now, we have two lists - a list of Snowpark pandas objects, and a list of objects + # that were not passed in as Snowpark pandas objects, but that we have converted + # to Snowpark pandas objects to give them column names. We can perform inner joins + # on the dfs list to get a DataFrame with the final index (that is only an intersection + # of indices.) + df = dfs[0] + for right in dfs[1:]: + df = df.merge(right, left_index=True, right_index=True) + if len(arrays) > 0: + index = df.index + right_df = pd.concat(arrays, axis=1) + # Increases query count by 1, but necessary for error checking. + index_length = len(df) + if index_length != array_lengths[0]: + raise ValueError( + f"Length mismatch: Expected {array_lengths[0]} rows, received array of length {index_length}" + ) + right_df.index = index + df = df.merge(right_df, left_index=True, right_index=True) + else: + data = { + **dict(zip(unique_rownames, index)), + **dict(zip(unique_colnames, columns)), + } + df = DataFrame(data) + + if values is None: + df["__dummy__"] = 0 + kwargs = {"aggfunc": "count"} + else: + df["__dummy__"] = values + kwargs = {"aggfunc": aggfunc} + + table = df.pivot_table( + "__dummy__", + index=unique_rownames, + columns=unique_colnames, + margins=margins, margins_name=margins_name, - sort=sort, + dropna=dropna, + **kwargs, # type: ignore[arg-type] ) + if row_idx_names is not None and not user_passed_rownames: + table.index = table.index.set_names(row_idx_names) -@snowpark_pandas_telemetry_standalone_function_decorator -def pivot(data, index=None, columns=None, values=None): # noqa: PR01, RT01, D200 - """ - Return reshaped DataFrame organized by given index / column values. - - Reshape data (produce a “pivot” table) based on column values. Uses unique values from - specified index / columns to form axes of the resulting DataFrame. This function does not - support data aggregation, multiple values will result in a MultiIndex in the columns. 
- - Parameters - ---------- - data : :class:`~modin.pandas.DataFrame` - columns : str or object or a list of str - Column to use to make new frame’s columns. - index : str or object or a list of str, optional - Column to use to make new frame’s index. If not given, uses existing index. - values : str, object or a list of the previous, optional - Column(s) to use for populating new frame’s values. If not specified, all remaining columns - will be used and the result will have hierarchically indexed columns. - - Returns - ------- - :class:`~modin.pandas.DataFrame` - - Notes - ----- - Calls pivot_table with columns, values, index and aggregation "min". + if col_idx_names is not None and not user_passed_colnames: + table.columns = table.columns.set_names(col_idx_names) - See Also - -------- - DataFrame.pivot_table : Generalization of pivot that can handle - duplicate values for one index/column pair. - DataFrame.unstack: Pivot based on the index values instead - of a column. - wide_to_long : Wide panel to long format. Less flexible but more - user-friendly than melt. + if aggfunc is None: + # If no aggfunc is provided, we are computing frequencies. Since we use + # pivot_table above, pairs that are not observed will get a NaN value, + # so we need to fill all NaN values with 0. + table = table.fillna(0) - Examples - -------- - >>> df = pd.DataFrame({'foo': ['one', 'one', 'one', 'two', 'two', - ... 'two'], - ... 'bar': ['A', 'B', 'C', 'A', 'B', 'C'], - ... 'baz': [1, 2, 3, 4, 5, 6], - ... 'zoo': ['x', 'y', 'z', 'q', 'w', 't']}) - >>> df - foo bar baz zoo - 0 one A 1 x - 1 one B 2 y - 2 one C 3 z - 3 two A 4 q - 4 two B 5 w - 5 two C 6 t - >>> pd.pivot(data=df, index='foo', columns='bar', values='baz') # doctest: +NORMALIZE_WHITESPACE - bar A B C - foo - one 1 2 3 - two 4 5 6 - >>> pd.pivot(data=df, index='foo', columns='bar')['baz'] # doctest: +NORMALIZE_WHITESPACE - bar A B C - foo - one 1 2 3 - two 4 5 6 - >>> pd.pivot(data=df, index='foo', columns='bar', values=['baz', 'zoo']) # doctest: +NORMALIZE_WHITESPACE - baz zoo - bar A B C A B C - foo - one 1 2 3 x y z - two 4 5 6 q w t - >>> df = pd.DataFrame({ - ... "lev1": [1, 1, 1, 2, 2, 2], - ... "lev2": [1, 1, 2, 1, 1, 2], - ... "lev3": [1, 2, 1, 2, 1, 2], - ... "lev4": [1, 2, 3, 4, 5, 6], - ... "values": [0, 1, 2, 3, 4, 5]}) - >>> df - lev1 lev2 lev3 lev4 values - 0 1 1 1 1 0 - 1 1 1 2 2 1 - 2 1 2 1 3 2 - 3 2 1 2 4 3 - 4 2 1 1 5 4 - 5 2 2 2 6 5 - >>> pd.pivot(data=df, index="lev1", columns=["lev2", "lev3"], values="values") # doctest: +NORMALIZE_WHITESPACE - lev2 1 2 - lev3 1 2 1 2 - lev1 - 1 0 1 2.0 NaN - 2 4 3 NaN 5.0 - >>> pd.pivot(data=df, index=["lev1", "lev2"], columns=["lev3"], values="values") # doctest: +NORMALIZE_WHITESPACE - lev3 1 2 - lev1 lev2 - 1 1 0.0 1.0 - 2 2.0 NaN - 2 1 4.0 3.0 - 2 NaN 5.0 - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if not isinstance(data, DataFrame): - raise ValueError(f"can not pivot with instance of type {type(data)}") - return data.pivot(index=index, columns=columns, values=values) + # We must explicitly check that the value of normalize is not False here, + # as a valid value of normalize is `0` (for normalizing index). 
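+    # As a sketch of what each option does (using the normalizers defined below
+    # on a hypothetical frequency table [[1, 1], [1, 2]]):
+    #   normalize="all"     -> every cell is divided by the grand total (5)
+    #   normalize="index"   -> each row is divided by its row sum
+    #   normalize="columns" -> each column is divided by its column sum
+    # 0 and 1 are accepted as aliases for "index" and "columns" respectively.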
+ if normalize is not False: + if normalize not in [0, 1, "index", "columns", "all", True]: + raise ValueError("Not a valid normalize argument") + if normalize is True: + normalize = "all" + normalize = {0: "index", 1: "columns"}.get(normalize, normalize) + # Actual Normalizations + normalizers: dict[bool | str, Callable] = { + "all": lambda x: x / x.sum(axis=0).sum(), + "columns": lambda x: x / x.sum(), + "index": lambda x: x.div(x.sum(axis=1), axis="index"), + } -@snowpark_pandas_telemetry_standalone_function_decorator -def to_numeric( - arg: Scalar | Series | ArrayConvertible, - errors: Literal["ignore", "raise", "coerce"] = "raise", - downcast: Literal["integer", "signed", "unsigned", "float"] | None = None, -) -> Series | Scalar | None: - """ - Convert argument to a numeric type. + if margins is False: - If the input arg type is already a numeric type, the return dtype - will be the original type; otherwise, the return dtype is float. + f = normalizers[normalize] + names = table.columns.names + table = f(table) + table.columns.names = names + table = table.fillna(0) + else: + # keep index and column of pivoted table + table_index = table.index + table_columns = table.columns - Parameters - ---------- - arg : scalar, list, tuple, 1-d array, or Series - Argument to be converted. - errors : {'ignore', 'raise', 'coerce'}, default 'raise' - - If 'raise', then invalid parsing will raise an exception. - - If 'coerce', then invalid parsing will be set as NaN. - - If 'ignore', then invalid parsing will return the input. - downcast : str, default None - downcast is ignored in Snowflake backend. + column_margin = table.iloc[:-1, -1] - Returns - ------- - ret - Numeric if parsing succeeded. - Return type depends on input. Series if `arg` is not scalar. + if normalize == "columns": + # keep the core table + table = table.iloc[:-1, :-1] - See Also - -------- - DataFrame.astype : Cast argument to a specified dtype. - to_datetime : Convert argument to datetime. - to_timedelta : Convert argument to timedelta. - numpy.ndarray.astype : Cast a numpy array to a specified type. - DataFrame.convert_dtypes : Convert dtypes. 
+ # Normalize core + f = normalizers[normalize] + table = f(table) + table = table.fillna(0) + # Fix Margins + column_margin = column_margin / column_margin.sum() + table = pd.concat([table, column_margin], axis=1) + table = table.fillna(0) + table.columns = table_columns - Examples - -------- - Take separate series and convert to numeric, coercing when told to + elif normalize == "index": + table = table.iloc[:, :-1] - >>> s = pd.Series(['1.0', '2', -3]) - >>> pd.to_numeric(s) - 0 1.0 - 1 2.0 - 2 -3.0 - dtype: float64 + # Normalize core + f = normalizers[normalize] + table = f(table) + table = table.fillna(0).reindex(index=table_index) - Note: to_numeric always converts non-numeric values to floats - >>> s = pd.Series(['1', '2', '-3']) - >>> pd.to_numeric(s) - 0 1.0 - 1 2.0 - 2 -3.0 - dtype: float64 - >>> pd.to_numeric(s, downcast='float') # downcast is ignored - 0 1.0 - 1 2.0 - 2 -3.0 - dtype: float64 - >>> pd.to_numeric(s, downcast='signed') # downcast is ignored - 0 1.0 - 1 2.0 - 2 -3.0 - dtype: float64 - >>> s = pd.Series(['apple', '1.0', '2', -3]) - >>> pd.to_numeric(s, errors='coerce') - 0 NaN - 1 1.0 - 2 2.0 - 3 -3.0 - dtype: float64 - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - raise_if_native_pandas_objects(arg) - if errors not in ("ignore", "raise", "coerce"): - raise ValueError("invalid error value specified") - if downcast is not None: - WarningMessage.ignored_argument( - operation="to_numeric", - argument="downcast", - message="downcast is ignored in Snowflake backend", - ) - # convert arg to series - arg_is_scalar = is_scalar(arg) + elif normalize == "all": + # Normalize core + f = normalizers[normalize] - if ( - not arg_is_scalar - and not isinstance(arg, (list, tuple, Series)) - and not (is_array_like(arg) and arg.ndim == 1) - ): - raise TypeError("arg must be a list, tuple, 1-d array, or Series") + # When we perform the normalization function, we take the sum over + # the rows, and divide every value by the sum. Since margins is included + # though, the result of the sum is actually 2 * the sum of the original + # values (since the margin itself is the sum of the original values), + # so we need to multiply by 2 here to account for that. + # The alternative would be to apply normalization to the main table + # and the index margins separately, but that would require additional joins + # to get the final table, which we want to avoid. 
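+            # Worked example with hypothetical numbers: if the core cells are
+            # [[1, 1], [1, 2]] (total 5), the included margin row [2, 3] brings
+            # the grand total seen by f up to 10, so multiplying by 2.0 restores
+            # the intended division by 5.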
+ table = f(table.iloc[:, :-1]) * 2.0 - if arg_is_scalar: - arg = Series([arg]) + column_margin = column_margin / column_margin.sum() + table = pd.concat([table, column_margin], axis=1) + table.iloc[-1, -1] = 1 - if not isinstance(arg, Series): - name = None - # keep index name - if isinstance(arg, pandas.Index): - name = arg.name - arg = Series(arg, name=name) + table = table.fillna(0) + table.index = table_index + table.columns = table_columns - ret = arg._to_numeric(errors=errors) - if arg_is_scalar: - # use squeeze to turn the series result into a scalar - ret = ret.squeeze() - return ret + table = table.rename_axis(index=rownames_mapper, axis=0) + table = table.rename_axis(columns=colnames_mapper, axis=1) + + return table @snowpark_pandas_telemetry_standalone_function_decorator -def unique(values) -> np.ndarray: +def cut( + x: AnyArrayLike, + bins: int | Sequence[Scalar] | IntervalIndex, + right: bool = True, + labels=None, + retbins: bool = False, + precision: int = 3, + include_lowest: bool = False, + duplicates: str = "raise", + ordered: bool = True, +): """ - Return unique values based on a hash table. Unique values are - returned in the order of appearance. This does NOT sort. + Bin values into discrete intervals. + + Use `cut` when you need to segment and sort data values into bins. This + function is also useful for going from a continuous variable to a + categorical variable. For example, `cut` could convert ages to groups of + age ranges. Supports binning into an equal number of bins, or a + pre-specified array of bins. Parameters ---------- - values : ndarray (1-d), list, bytearray, tuple, Series, Index, list-like - Non-hashable objects like set, dict, and user defined classes are - invalid input. - Values to perform computation. + x : array-like + The input array to be binned. Must be 1-dimensional. + bins : int, sequence of scalars + The criteria to bin by. + + * int : Defines the number of equal-width bins in the range of `x`. The + range of `x` is extended by .1% on each side to include the minimum + and maximum values of `x`. + * sequence of scalars : Defines the bin edges allowing for non-uniform + width. No extension of the range of `x` is done. + + right : bool, default True + Indicates whether `bins` includes the rightmost edge or not. If + ``right == True`` (the default), then the `bins` ``[1, 2, 3, 4]`` + indicate (1,2], (2,3], (3,4]. This argument is ignored when + `bins` is an IntervalIndex. + labels : array or False, default None + Specifies the labels for the returned bins. Must be the same length as + the resulting bins. If False, returns only integer indicators of the + bins. This affects the type of the output container (see below). + This argument is ignored when `bins` is an IntervalIndex. If True, + raises an error. When `ordered=False`, labels must be provided. + + Snowpark pandas API does not support labels=None. + Labels must be of a Snowpark pandas API supported dtype. + + retbins : bool, default False + Snowpark pandas API does not support this parameter yet. + precision : int, default 3 + The precision at which to store and display the bins labels. + include_lowest : bool, default False + Whether the first interval should be left-inclusive or not. + duplicates : {default 'raise', 'drop'}, optional + If bin edges are not unique, raise ValueError or drop non-uniques. + ordered : bool, default True + Whether the labels are ordered or not. Applies to returned types + Categorical and Series (with Categorical dtype). 
If True, + the resulting categorical will be ordered. If False, the resulting + categorical will be unordered (labels must be provided). Returns ------- - ndarray - The unique values returned as a NumPy array. See Notes. + out : Categorical, Series, or ndarray + An array-like object representing the respective bin for each value + of `x`. The type depends on the value of `labels`. - See Also - -------- - Series.unique() + * None (default) : returns a Series for Series `x` or a + Categorical for all other inputs. The values stored within + are Interval dtype. + + * sequence of scalars : returns a Series for Series `x` or a + Categorical for all other inputs. The values stored within + are whatever the type in the sequence is. + + * False : returns an ndarray of integers. + + bins : numpy.ndarray + The computed or specified bins. Only returned when `retbins=True`. + For scalar or sequence `bins`, this is an ndarray with the computed + bins. If set `duplicates=drop`, `bins` will drop non-unique bin. Notes ----- - Returns the unique values as a NumPy array. This includes - - * Datetime with Timezone - * IntegerNA + Any NA values will be NA in the result. Out of bounds values will be NA in + the resulting Series or Categorical object. - See Examples section. + Snowpark pandas API does not natively support Categorical and categorical types. When calling `cut` with a + Snowpark pandas Series and using `labels=False`, a Snowpark pandas Series object is returned. However, + for `labels != False` an error is raised. Examples -------- - >>> pd.unique([2, 1, 3, 3]) - array([2, 1, 3]) - - >>> pd.unique([pd.Timestamp('2016-01-01', tz='US/Eastern') - ... for _ in range(3)]) - array([Timestamp('2016-01-01 00:00:00-0500', tz='UTC-05:00')], - dtype=object) - - >>> pd.unique([("a", "b"), ("b", "a"), ("a", "c"), ("b", "a")]) - array([list(['a', 'b']), list(['b', 'a']), list(['a', 'c'])], dtype=object) - - >>> pd.unique([None, np.nan, 2]) - array([nan, 2.]) - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if is_list_like(values) and not isinstance(values, dict): - return Series(values).unique() - else: - raise TypeError("Only list-like objects can be used with unique()") - + Discretize into three equal-sized bins. -# Adding docstring since pandas docs don't have web section for this function. -@snowpark_pandas_telemetry_standalone_function_decorator -@pandas_module_level_function_not_implemented() -def value_counts( - values, sort=True, ascending=False, normalize=False, bins=None, dropna=True -): - """ - Compute a histogram of the counts of non-null values. + >>> pd.cut(np.array([1, 7, 5, 4, 6, 3]), 3, labels=False) + ... # doctest: +ELLIPSIS + array([0, 2, 1, 1, 2, 0]) - Parameters - ---------- - values : ndarray (1-d) - Values to perform computation. - sort : bool, default: True - Sort by values. - ascending : bool, default: False - Sort in ascending order. - normalize : bool, default: False - If True then compute a relative histogram. - bins : integer, optional - Rather than count values, group them into half-open bins, - convenience for pd.cut, only works with numeric data. - dropna : bool, default: True - Don't include counts of NaN. + ``labels=False`` implies you just want the bins back. 
- Returns - ------- - Series - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - return Series(values).value_counts( - sort=sort, - ascending=ascending, - normalize=normalize, - bins=bins, - dropna=dropna, - ) + >>> pd.cut([0, 1, 1, 2], bins=4, labels=False) + array([0, 1, 1, 3]) + Passing a Series as an input returns a Series with labels=False: -@snowpark_pandas_telemetry_standalone_function_decorator -def concat( - objs: ( - Iterable[modin.pandas.DataFrame | Series] - | Mapping[Hashable, modin.pandas.DataFrame | Series] - ), - axis: Axis = 0, - join: str = "outer", - ignore_index: bool = False, - keys: Sequence[Hashable] = None, - levels: list[Sequence[Hashable]] = None, - names: list[Hashable] = None, - verify_integrity: bool = False, - sort: bool = False, - copy: bool = True, -) -> modin.pandas.DataFrame | Series: + >>> s = pd.Series(np.array([2, 4, 6, 8, 10]), + ... index=['a', 'b', 'c', 'd', 'e']) + >>> pd.cut(s, 3, labels=False) + ... # doctest: +ELLIPSIS + a 0 + b 0 + c 1 + d 2 + e 2 + dtype: int64 """ - Concatenate pandas objects along a particular axis. - Allows optional set logic along the other axes. + if retbins is True: + ErrorMessage.not_implemented("retbins not supported.") - Can also add a layer of hierarchical indexing on the concatenation axis, - which may be useful if the labels are the same (or overlapping) on - the passed axis number. + # Execute other supported objects via native pandas. + if not isinstance(x, Series): + return pandas.cut( + x, + bins, + right=right, + labels=labels, + retbins=retbins, + precision=precision, + include_lowest=include_lowest, + duplicates=duplicates, + ordered=ordered, + ) - Parameters - ---------- - objs : a sequence or mapping of Series or DataFrame objects - If a mapping is passed, the sorted keys will be used as the `keys` - argument, unless it is passed, in which case the values will be - selected (see below). Any None objects will be dropped silently unless - they are all None in which case a ValueError will be raised. - axis : {0/'index', 1/'columns'}, default 0 - The axis to concatenate along. - join : {'inner', 'outer'}, default 'outer' - How to handle indexes on other axis (or axes). - ignore_index : bool, default False - If True, do not use the index values along the concatenation axis. The - resulting axis will be labeled 0, ..., n - 1. This is useful if you are - concatenating objects where the concatenation axis does not have - meaningful indexing information. Note the index values on the other - axes are still respected in the join. - keys : sequence, default None - If multiple levels passed, should contain tuples. Construct - hierarchical index using the passed keys as the outermost level. - levels : list of sequences, default None - Specific levels (unique values) to use for constructing a - MultiIndex. Otherwise they will be inferred from the keys. - Snowpark pandas does not support 'levels' argument. - names : list, default None - Names for the levels in the resulting hierarchical index. - verify_integrity : bool, default False - Check whether the new concatenated axis contains duplicates. - Snowpark pandas does not support distributed computation of concat when - 'verify_integrity' is True. - sort : bool, default False - Sort non-concatenation axis if it is not already aligned. - copy : bool, default True - If False, do not copy data unnecessarily. - This argument is ignored in Snowpark pandas. + # Produce pandas-compatible error if ordered=False and labels are not specified. 
+ # No error is raised when labels are not desired (labels=False). + if ordered is False and labels is None: + raise ValueError("'labels' must be provided if 'ordered = False'") - Returns - ------- - object, type of objs - When concatenating all Snowpark pandas :class:`~modin.pandas.Series` along the index (axis=0), - a Snowpark pandas :class:`~modin.pandas.Series` is returned. When ``objs`` contains at least - one Snowpark pandas :class:`~modin.pandas.DataFrame`, - a Snowpark pandas :class:`~modin.pandas.DataFrame` is returned. When concatenating along - the columns (axis=1), a Snowpark pandas :class:`~modin.pandas.DataFrame` is returned. + bins, qc = x._query_compiler.cut( + bins, + right=right, + labels=labels, + precision=precision, + include_lowest=include_lowest, + duplicates=duplicates, + ) - See Also - -------- - DataFrame.join : Join DataFrames using indexes. - DataFrame.merge : Merge DataFrames by indexes or columns. + # Depending on setting, reconstruct bins and convert qc to the correct result. + if labels is False: + return pd.Series(query_compiler=qc) + else: + # Raise NotImplemented Error as categorical is not supported. + ErrorMessage.not_implemented("categorical not supported in Snowpark pandas API") - Notes - ----- - The keys, levels, and names arguments are all optional. + # Following code would produce correct result, uncomment once categorical is supported. + # Convert to pandas categorical and return as Series. + # Note: In the future, once we support CategoricalType we could keep this lazily around. For now, + # match what pandas does here. In the future, change pandas -> pd and everything should work out-of-the box. + # arr = qc.to_numpy().ravel() + # return pandas.Series( + # pandas.Categorical(values=arr, categories=labels, ordered=ordered) + # ) - It is not recommended to build DataFrames by adding single rows in a - for loop. Build a list of rows and make a DataFrame in a single concat. - Examples - -------- - Combine two ``Series``. +@snowpark_pandas_telemetry_standalone_function_decorator +def qcut( + x: np.ndarray | Series, + q: int | ListLikeOfFloats, + labels: ListLike | bool | None = None, + retbins: bool = False, + precision: int = 3, + duplicates: Literal["raise"] | Literal["drop"] = "raise", +) -> Series: + """ + Quantile-based discretization function. - >>> s1 = pd.Series(['a', 'b']) - >>> s2 = pd.Series(['c', 'd']) - >>> pd.concat([s1, s2]) - 0 a - 1 b - 0 c - 1 d - dtype: object + Discretize variable into equal-sized buckets based on rank or based + on sample quantiles. - Clear the existing index and reset it in the result - by setting the ``ignore_index`` option to ``True``. + Parameters + ---------- + x : 1-D ndarray or Series + The data across which to compute buckets. If a Snowpark pandas Series is passed, the computation + is distributed. Otherwise, if a numpy array or list is provided, the computation is performed + client-side instead. - >>> pd.concat([s1, s2], ignore_index=True) - 0 a - 1 b - 2 c - 3 d - dtype: object + q : int or list-like of float + Number of quantiles. 10 for deciles, 4 for quartiles, etc. Alternately array of quantiles, + e.g. [0, .25, .5, .75, 1.] for quartiles. - Add a hierarchical index at the outermost level of - the data with the ``keys`` option. + labels : array or False, default None + Used as labels for the resulting bin. Must be of the same length as the resulting bins. If False, + return only integer indicators of the bins. If True, raise an error. 
- >>> pd.concat([s1, s2], keys=['s1', 's2']) - s1 0 a - 1 b - s2 0 c - 1 d - dtype: object + ``labels=False`` will run binning computation in Snowflake; other values are not yet supported + in Snowpark pandas. - Label the index keys you create with the ``names`` option. + retbins : bool, default False + Whether to return the (bins, labels) or not. Can be useful if bins is given as a scalar. + ``retbins=True`` is not yet supported in Snowpark pandas. - >>> pd.concat([s1, s2], keys=['s1', 's2'], - ... names=['Series name', 'Row ID']) - Series name Row ID - s1 0 a - 1 b - s2 0 c - 1 d - dtype: object + precision : int, optional + The precision at which to store and display the bins labels. - Combine two ``DataFrame`` objects with identical columns. + duplicates : {default 'raise', 'drop'}, optional + If bin edges are not unique, raise ValueError or drop non-uniques. - >>> df1 = pd.DataFrame([['a', 1], ['b', 2]], - ... columns=['letter', 'number']) - >>> df1 - letter number - 0 a 1 - 1 b 2 - >>> df2 = pd.DataFrame([['c', 3], ['d', 4]], - ... columns=['letter', 'number']) - >>> df2 - letter number - 0 c 3 - 1 d 4 - >>> pd.concat([df1, df2]) - letter number - 0 a 1 - 1 b 2 - 0 c 3 - 1 d 4 + Returns + ------- + Series + Since Snowpark pandas does not yet support the ``pd.Categorical`` type, unlike native pandas, the + return value is always a Series. + """ - Combine ``DataFrame`` objects with overlapping columns - and return everything. Columns outside the intersection will - be filled with ``NaN`` values. + kwargs = { + "labels": labels, + "retbins": retbins, + "precision": precision, + "duplicates": duplicates, + } - >>> df3 = pd.DataFrame([['c', 3, 'cat'], ['d', 4, 'dog']], - ... columns=['letter', 'number', 'animal']) - >>> df3 - letter number animal - 0 c 3 cat - 1 d 4 dog - >>> pd.concat([df1, df3], sort=False) - letter number animal - 0 a 1 None - 1 b 2 None - 0 c 3 cat - 1 d 4 dog + # For numpy or list, call to native pandas. + if not isinstance(x, Series): + return pandas.qcut(x, q, **kwargs) - Combine ``DataFrame`` objects with overlapping columns - and return only those that are shared by passing ``inner`` to - the ``join`` keyword argument. + # Check that labels is supported as in pandas. + if not (labels is None or labels is False or is_list_like(labels)): + raise ValueError( + "Bin labels must either be False, None or passed in as a list-like argument" + ) - >>> pd.concat([df1, df3], join="inner") - letter number - 0 a 1 - 1 b 2 - 0 c 3 - 1 d 4 + # Carry out check that for the list-like case quantiles are (monotonically) increasing, + # if not the case throw pandas compatible error. + if not isinstance(q, int) and np.all(np.diff(q) < 0): + # Note: Pandas 2.x changed the error message here, using Pandas 2.x behavior here. + raise ValueError("left side of interval must be <= right side") - Combine ``DataFrame`` objects horizontally along the x axis by - passing in ``axis=1``. + # remove duplicates (input like [0.5, 0.5] is ok) + q = sorted(list(set(q))) - >>> df4 = pd.DataFrame([['bird', 'polly'], ['monkey', 'george']], - ... columns=['animal', 'name']) - >>> pd.concat([df1, df4], axis=1) - letter number animal name - 0 a 1 bird polly - 1 b 2 monkey george + if labels is not False: + # Labels require categorical, not yet supported. Use native pandas conversion here to compute result. 
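+        # A hypothetical client-side fallback for callers who do need labels,
+        # as suggested by the error message below:
+        #   pandas.qcut(x.to_pandas(), q, labels=labels, duplicates=duplicates)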
+ ErrorMessage.not_implemented( + "Snowpark pandas API qcut method supports only labels=False, if you need support" + " for labels consider calling pandas.qcut(x.to_pandas(), q, ...)" + ) - Combining series horizontally creates a DataFrame. Missing names are replaced with - numeric values. + ans = x._qcut(q, retbins, duplicates) - >>> pd.concat([s1, s2], axis=1) - 0 1 - 0 a c - 1 b d + if isinstance(q, int) and q != 1 and len(ans) == 1: + if duplicates == "raise": + # We issue a count query since if q !=1 and x is a Series/list-like containing + # a single element, an error will be produced ValueError: Bin edges must be unique: array([0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.]). + # You can drop duplicate edges by setting the 'duplicates' kwarg. + # With qcut being an API that requires conversion, we can mimick this behavior here. - When combining objects horizoantally ``ignore_index=True`` will clear the existing - column names and reset it in the result. + # Produce raising error. + raise ValueError( + f"Bin edges must be unique: {repr(np.array([0.] * q))}.\nYou can drop duplicate edges by setting the 'duplicates' kwarg." + ) + else: + # The result will always be NaN because no unique bin could be found. + return pd.Series([np.nan]) - >>> pd.concat([df1, df4], axis=1, ignore_index=True) - 0 1 2 3 - 0 a 1 bird polly - 1 b 2 monkey george + return ans - When combining objects horizontally, add a hierarchical column index at the - outermost level of the column labels with the ``keys`` option. - >>> pd.concat([df1, df4], axis=1, keys=['x', 'y']) # doctest: +NORMALIZE_WHITESPACE - x y - letter number animal name - 0 a 1 bird polly - 1 b 2 monkey george +@snowpark_pandas_telemetry_standalone_function_decorator +def merge( + left: snowflake.snowpark.modin.pandas.DataFrame | Series, + right: snowflake.snowpark.modin.pandas.DataFrame | Series, + how: str | None = "inner", + on: IndexLabel | None = None, + left_on: None + | (Hashable | AnyArrayLike | Sequence[Hashable | AnyArrayLike]) = None, + right_on: None + | (Hashable | AnyArrayLike | Sequence[Hashable | AnyArrayLike]) = None, + left_index: bool | None = False, + right_index: bool | None = False, + sort: bool | None = False, + suffixes: Suffixes | None = ("_x", "_y"), + copy: bool | None = True, + indicator: bool | str | None = False, + validate: str | None = None, +): + """ + Merge DataFrame or named Series objects with a database-style join. - Concatenatiing series horizontally with ``keys``. + A named Series object is treated as a DataFrame with a single named column. + + The join is done on columns or indexes. If joining columns on + columns, the DataFrame indexes *will be ignored*. Otherwise if joining indexes + on indexes or indexes on a column or columns, the index will be passed on. + When performing a cross merge, no column specifications to merge on are + allowed. - >>> pd.concat([s1, s2], axis=1, keys=['x', 'y']) - x y - 0 a c - 1 b d + .. warning:: - When combining objects horizontally, ``how='inner'`` to keep only overalpping - index values. + If both key columns contain rows where the key is a null value, those + rows will be matched against each other. This is different from usual SQL + join behaviour and can lead to unexpected results. - >>> df5 = pd.DataFrame([['a', 1], ['b', 2]], - ... columns=['letter', 'number'], - ... 
index=[1, 2]) - >>> df5 - letter number - 1 a 1 - 2 b 2 - >>> pd.concat([df1, df5], axis=1, join='inner') - letter number letter number - 1 b 2 a 1 + Parameters + ---------- + left : :class:`~modin.pandas.DataFrame` or named Series + right : :class:`~modin.pandas.DataFrame` or named Series + Object to merge with. + how : {'left', 'right', 'outer', 'inner', 'cross'}, default 'inner' + Type of merge to be performed. - Prevent the result from including duplicate index values with the - ``verify_integrity`` option. + * left: use only keys from left frame, similar to a SQL left outer join; + preserve key order. + * right: use only keys from right frame, similar to a SQL right outer join; + preserve key order. + * outer: use union of keys from both frames, similar to a SQL full outer + join; sort keys lexicographically. + * inner: use intersection of keys from both frames, similar to a SQL inner + join; preserve the order of the left keys. + * cross: creates the cartesian product from both frames, preserves the order + of the left keys. - >>> df5 = pd.DataFrame([1], index=['a']) - >>> df5 - 0 - a 1 - >>> df6 = pd.DataFrame([2], index=['a']) - >>> df6 - 0 - a 2 - >>> pd.concat([df5, df6], verify_integrity=True) - Traceback (most recent call last): - ... - ValueError: Indexes have overlapping values: Index(['a'], dtype='object') + on : label or list + Column or index level names to join on. These must be found in both + DataFrames. If `on` is None and not merging on indexes then this defaults + to the intersection of the columns in both DataFrames. + left_on : label or list, or array-like + Column or index level names to join on in the left DataFrame. Can also + be an array or list of arrays of the length of the left DataFrame. + These arrays are treated as if they are columns. + right_on : label or list, or array-like + Column or index level names to join on in the right DataFrame. Can also + be an array or list of arrays of the length of the right DataFrame. + These arrays are treated as if they are columns. + left_index : bool, default False + Use the index from the left DataFrame as the join key(s). If it is a + MultiIndex, the number of keys in the other DataFrame (either the index + or a number of columns) must match the number of levels. + right_index : bool, default False + Use the index from the right DataFrame as the join key. Same caveats as + left_index. + sort : bool, default False + Sort the join keys lexicographically in the result DataFrame. If False, + the order of the join keys depends on the join type (how keyword). + suffixes : list-like, default is ("_x", "_y") + A length-2 sequence where each element is optionally a string + indicating the suffix to add to overlapping column names in + `left` and `right` respectively. Pass a value of `None` instead + of a string to indicate that the column name from `left` or + `right` should be left as-is, with no suffix. At least one of the + values must not be None. + copy : bool, default True + This argument is ignored in Snowpark pandas API. + indicator : bool or str, default False + If True, adds a column to the output DataFrame called "_merge" with + information on the source of each row. The column can be given a different + name by providing a string argument. 
The column will have a Categorical + type with the value of "left_only" for observations whose merge key only + appears in the left DataFrame, "right_only" for observations + whose merge key only appears in the right DataFrame, and "both" + if the observation's merge key is found in both DataFrames. - Append a single row to the end of a ``DataFrame`` object. + validate : str, optional + This is not yet supported. - >>> df7 = pd.DataFrame({'a': 1, 'b': 2}, index=[0]) - >>> df7 - a b - 0 1 2 - >>> new_row = pd.DataFrame({'a': 3, 'b': 4}, index=[0]) - >>> new_row - a b - 0 3 4 - >>> pd.concat([df7, new_row], ignore_index=True) - a b - 0 1 2 - 1 3 4 - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - # Raise error if native pandas objects are passed. - raise_if_native_pandas_objects(objs) + Returns + ------- + :class:`~modin.pandas.DataFrame` + A DataFrame of the two merged objects. - # In native pandas 'concat' API is expected to work with all types of iterables like - # tuples, list, generators, custom iterators, deque etc. - # Few exceptions are 'DataFrame', 'Series', 'str', these are also technically - # iterables, but they are not iterables of pandas objects. - # Note other iterables can also have non pandas objects as element in them, but it's - # not possible to know that in advance without iterating over all objects, so we - # also individual element later. + See Also + -------- + merge_ordered : Merge with optional filling/interpolation. + merge_asof : Merge on nearest keys. + DataFrame.join : Similar method using indices. - # Raise error if 'objs' is not an iterable or an iterable of non-pandas objects. - if not isinstance(objs, Iterable) or isinstance( - objs, (pd.DataFrame, pd.Series, str) - ): - # Same error as native pandas. - raise TypeError( - "first argument must be an iterable of pandas " - f'objects, you passed an object of type "{type(objs).__name__}"' - ) + Examples + -------- + >>> df1 = pd.DataFrame({'lkey': ['foo', 'bar', 'baz', 'foo'], + ... 'value': [1, 2, 3, 5]}) + >>> df2 = pd.DataFrame({'rkey': ['foo', 'bar', 'baz', 'foo'], + ... 'value': [5, 6, 7, 8]}) + >>> df1 + lkey value + 0 foo 1 + 1 bar 2 + 2 baz 3 + 3 foo 5 + >>> df2 + rkey value + 0 foo 5 + 1 bar 6 + 2 baz 7 + 3 foo 8 - if isinstance(objs, dict): - if keys is None: - keys = list(objs.keys()) - # if 'keys' is not none, filter out additional objects from mapping. - objs = [objs[k] for k in keys] - else: - # Native pandas also supports generators as input, that can only be iterated - # only once so first create a list from 'objs'. - objs = list(objs) + Merge df1 and df2 on the lkey and rkey columns. The value columns have + the default suffixes, _x and _y, appended. - for obj in objs: - # Raise error if native pandas objects are passed. - raise_if_native_pandas_objects(obj) + >>> df1.merge(df2, left_on='lkey', right_on='rkey') + lkey value_x rkey value_y + 0 foo 1 foo 5 + 1 foo 1 foo 8 + 2 bar 2 bar 6 + 3 baz 3 baz 7 + 4 foo 5 foo 5 + 5 foo 5 foo 8 - if join not in ("inner", "outer"): - # Same error as native pandas. - raise ValueError( - "Only can inner (intersect) or outer (union) join the other axis" - ) + Merge DataFrames df1 and df2 with specified left and right suffixes + appended to any overlapping columns. - axis = pandas.DataFrame()._get_axis_number(axis) + >>> df1.merge(df2, left_on='lkey', right_on='rkey', + ... 
suffixes=('_left', '_right')) + lkey value_left rkey value_right + 0 foo 1 foo 5 + 1 foo 1 foo 8 + 2 bar 2 bar 6 + 3 baz 3 baz 7 + 4 foo 5 foo 5 + 5 foo 5 foo 8 - if len(objs) == 0: - # Same error as native pandas. - raise ValueError("No objects to concatenate") - # Filter out None objects - if keys is None: - objs = [o for o in objs if o is not None] - else: - tuples = [(k, v) for k, v in zip(keys, objs) if v is not None] - # convert list of tuples to tuples of list. - keys, objs = list(map(list, zip(*tuples))) if tuples else ([], []) + >>> df1 = pd.DataFrame({'a': ['foo', 'bar'], 'b': [1, 2]}) + >>> df2 = pd.DataFrame({'a': ['foo', 'baz'], 'c': [3, 4]}) + >>> df1 + a b + 0 foo 1 + 1 bar 2 + >>> df2 + a c + 0 foo 3 + 1 baz 4 - if len(objs) == 0: - # Same error as native pandas. - raise ValueError("All objects passed were None") + >>> df1.merge(df2, how='inner', on='a') + a b c + 0 foo 1 3 - for obj in objs: - # Same error as native pandas. - if not isinstance(obj, (Series, DataFrame)): - raise TypeError( - f"cannot concatenate object of type '{type(obj)}'; " - "only Series and DataFrame objs are valid" - ) + >>> df1.merge(df2, how='left', on='a') + a b c + 0 foo 1 3.0 + 1 bar 2 NaN - # Assign names to unnamed series - the names function as column labels for Series. - # If all Series have no name, use the keys as names. - if ( - axis == 1 - and keys is not None - and all(isinstance(obj, Series) and obj.name is None for obj in objs) - ): - for i, obj in enumerate(objs): - objs[i] = obj.rename(keys[i]) + >>> df1 = pd.DataFrame({'left': ['foo', 'bar']}) + >>> df2 = pd.DataFrame({'right': [7, 8]}) + >>> df1 + left + 0 foo + 1 bar + >>> df2 + right + 0 7 + 1 8 - # If only some Series have names, give them temporary names. - series_name = 0 - for i, obj in enumerate(objs): - if isinstance(obj, pd.Series) and obj.name is None: - objs[i] = obj.rename(series_name) - series_name = series_name + 1 + >>> df1.merge(df2, how='cross') + left right + 0 foo 7 + 1 foo 8 + 2 bar 7 + 3 bar 8 + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + # Raise error if 'left' or 'right' is native pandas object. + raise_if_native_pandas_objects(left) + raise_if_native_pandas_objects(right) - # Check if all objects are of Series types. - all_series = all([isinstance(obj, pd.Series) for obj in objs]) - # When concatenating Series objects on axis 0, pandas tries to preserve name from - # input if all have same name otherwise set it to None. - if all_series and axis == 0: - unique_names = {obj.name for obj in objs} - name = objs[0].name if len(unique_names) == 1 else None - objs = [obj.rename(name) for obj in objs] + if isinstance(left, Series): + if left.name is None: + raise ValueError("Cannot merge a Series without a name") + else: + left = left.to_frame() - if not copy: - WarningMessage.ignored_argument( - operation="concat", - argument="copy", - message="copy parameter has been ignored with Snowflake execution engine", + if not isinstance(left, DataFrame): + raise TypeError( + f"Can only merge Series or DataFrame objects, a {type(left)} was passed" ) - # For the edge case where concatenation is done on the columns where all the objects are series, - # need to prevent a second column level from being created - therefore, keys is None. 
- keys = None if axis == 1 and all(isinstance(obj, Series) for obj in objs) else keys - - result = objs[0]._query_compiler.concat( - axis, - [o._query_compiler for o in objs[1:]], - join=join, - ignore_index=ignore_index, - keys=keys, - levels=levels, - names=names, - verify_integrity=verify_integrity, + return left.merge( + right, + how=how, + on=on, + left_on=left_on, + right_on=right_on, + left_index=left_index, + right_index=right_index, sort=sort, + suffixes=suffixes, + copy=copy, + indicator=indicator, + validate=validate, ) - # If all objects are series and concat axis=0, return Series else return DataFrame. - if all_series and axis == 0: - return Series(query_compiler=result) - return DataFrame(query_compiler=result) @snowpark_pandas_telemetry_standalone_function_decorator -def to_datetime( - arg: DatetimeScalarOrArrayConvertible - | DictConvertible - | modin.pandas.DataFrame - | Series, - errors: DateTimeErrorChoices = "raise", - dayfirst: bool = False, - yearfirst: bool = False, - utc: bool = False, - format: str | None = None, - exact: bool | lib.NoDefault = lib.no_default, - unit: str | None = None, - infer_datetime_format: lib.NoDefault | bool = lib.no_default, - origin: Any = "unix", - cache: bool = True, -) -> pd.DatetimeIndex | Series | DatetimeScalar | NaTType | None: +@pandas_module_level_function_not_implemented() +@_inherit_docstrings(pandas.merge_ordered, apilink="pandas.merge_ordered") +def merge_ordered( + left, + right, + on=None, + left_on=None, + right_on=None, + left_by=None, + right_by=None, + fill_method=None, + suffixes=("_x", "_y"), + how: str = "outer", +) -> DataFrame: # noqa: PR01, RT01, D200 """ - Convert argument to datetime. + Perform a merge for ordered data with optional filling/interpolation. + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + if not isinstance(left, DataFrame): + raise ValueError(f"can not merge DataFrame with instance of type {type(right)}") + if isinstance(right, DataFrame): + right = to_pandas(right) + return DataFrame( + pandas.merge_ordered( + to_pandas(left), + right, + on=on, + left_on=left_on, + right_on=right_on, + left_by=left_by, + right_by=right_by, + fill_method=fill_method, + suffixes=suffixes, + how=how, + ) + ) - This function converts a scalar, array-like, :class:`~modin.pandas.Series` or - :class:`~modin.pandas.DataFrame`/dict-like to a pandas datetime object. + +@snowpark_pandas_telemetry_standalone_function_decorator +@_inherit_docstrings(pandas.merge_asof, apilink="pandas.merge_asof") +def merge_asof( + left, + right, + on: str | None = None, + left_on: str | None = None, + right_on: str | None = None, + left_index: bool = False, + right_index: bool = False, + by: str | list[str] | None = None, + left_by: str | None = None, + right_by: str | None = None, + suffixes: Suffixes = ("_x", "_y"), + tolerance: int | Timedelta | None = None, + allow_exact_matches: bool = True, + direction: str = "backward", +) -> snowflake.snowpark.modin.pandas.DataFrame: + """ + Perform a merge by key distance. + + This is similar to a left-join except that we match on nearest key rather than equal keys. + Both DataFrames must be sorted by the key. For each row in the left DataFrame: + + A “backward” search selects the last row in the right DataFrame whose ‘on’ key is less than or equal to the left’s key. + A “forward” search selects the first row in the right DataFrame whose ‘on’ key is greater than or equal to the left’s key. 
+ A “nearest” search selects the row in the right DataFrame whose ‘on’ key is closest in absolute distance to the left’s key. + + Optionally match on equivalent keys with ‘by’ before searching with ‘on’. Parameters ---------- - arg : int, float, str, datetime, list, tuple, 1-d array, Series, :class:`~modin.pandas.DataFrame`/dict-like - The object to convert to a datetime. If a :class:`~modin.pandas.DataFrame` is provided, the - method expects minimally the following columns: :const:`"year"`, - :const:`"month"`, :const:`"day"`. - errors : {'ignore', 'raise', 'coerce'}, default 'raise' - - If :const:`'raise'`, then invalid parsing will raise an exception. - - If :const:`'coerce'`, then invalid parsing will be set as :const:`NaT`. - - If :const:`'ignore'`, then invalid parsing will return the input. - dayfirst : bool, default False - Specify a date parse order if `arg` is str or is list-like. - If :const:`True`, parses dates with the day first, e.g. :const:`"10/11/12"` - is parsed as :const:`2012-11-10`. + left : :class:`~modin.pandas.DataFrame` or named :class:`~modin.pandas.Series`. + right : :class:`~modin.pandas.DataFrame` or named :class:`~modin.pandas.Series`. + on : label + Field name to join on. Must be found in both DataFrames. The data MUST be ordered. + Furthermore, this must be a numeric column such as datetimelike, integer, or float. + On or left_on/right_on must be given. + left_on : label + Field name to join on in left DataFrame. + right_on : label + Field name to join on in right DataFrame. + left_index : bool + Use the index of the left DataFrame as the join key. + right_index : bool + Use the index of the right DataFrame as the join key. + by : column name or list of column names + Match on these columns before performing merge operation. + left_by : column name + Field names to match on in the left DataFrame. + right_by : column name + Field names to match on in the right DataFrame. + suffixes : 2-length sequence (tuple, list, …) + Suffix to apply to overlapping column names in the left and right side, respectively. + tolerance: int or Timedelta, optional, default None + Select asof tolerance within this range; must be compatible with the merge index. + allow_exact_matches : bool, default True + If True, allow matching with the same ‘on’ value (i.e. less-than-or-equal-to / greater-than-or-equal-to) + If False, don’t match the same ‘on’ value (i.e., strictly less-than / strictly greater-than). + direction : ‘backward’ (default), ‘forward’, or ‘nearest’ + Whether to search for prior, subsequent, or closest matches. - .. warning:: + Returns + ------- + Snowpark pandas :class:`~modin.pandas.DataFrame` - ``dayfirst=True`` is not strict, but will prefer to parse - with day first. If a delimited date string cannot be parsed in - accordance with the given `dayfirst` option, e.g. - ``to_datetime(['31-12-2021'])``, then a warning will be shown. 
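As a brief illustration of the ``tolerance`` and ``allow_exact_matches`` parameters described above (an editorial sketch with made-up frames; whether the Snowflake backend accepts an integer tolerance here is an assumption, not something the patch states):

    # Hypothetical sketch: restrict backward asof matches to keys at most 1 apart.
    left = pd.DataFrame({"a": [1, 5, 10], "left_val": ["a", "b", "c"]})
    right = pd.DataFrame({"a": [1, 2, 3, 6, 7], "right_val": [1, 2, 3, 6, 7]})
    # Per pandas semantics, a=1 still matches the right row with a=1, while a=5 and a=10
    # get no match (NaN) because the nearest earlier keys (3 and 7) are more than 1 away.
    pd.merge_asof(left, right, on="a", tolerance=1)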
+ Examples + -------- + >>> left = pd.DataFrame({"a": [1, 5, 10], "left_val": ["a", "b", "c"]}) + >>> left + a left_val + 0 1 a + 1 5 b + 2 10 c + >>> right = pd.DataFrame({"a": [1, 2, 3, 6, 7], "right_val": [1, 2, 3, 6, 7]}) + >>> right + a right_val + 0 1 1 + 1 2 2 + 2 3 3 + 3 6 6 + 4 7 7 + >>> pd.merge_asof(left, right, on="a") + a left_val right_val + 0 1 a 1 + 1 5 b 3 + 2 10 c 7 + >>> pd.merge_asof(left, right, on="a", allow_exact_matches=False) + a left_val right_val + 0 1 a NaN + 1 5 b 3.0 + 2 10 c 7.0 + >>> pd.merge_asof(left, right, on="a", direction="forward") + a left_val right_val + 0 1 a 1.0 + 1 5 b 6.0 + 2 10 c NaN + + Here is a real-world times-series example: + + >>> quotes = pd.DataFrame( + ... { + ... "time": [ + ... pd.Timestamp("2016-05-25 13:30:00.023"), + ... pd.Timestamp("2016-05-25 13:30:00.023"), + ... pd.Timestamp("2016-05-25 13:30:00.030"), + ... pd.Timestamp("2016-05-25 13:30:00.041"), + ... pd.Timestamp("2016-05-25 13:30:00.048"), + ... pd.Timestamp("2016-05-25 13:30:00.049"), + ... pd.Timestamp("2016-05-25 13:30:00.072"), + ... pd.Timestamp("2016-05-25 13:30:00.075") + ... ], + ... "bid": [720.50, 51.95, 51.97, 51.99, 720.50, 97.99, 720.50, 52.01], + ... "ask": [720.93, 51.96, 51.98, 52.00, 720.93, 98.01, 720.88, 52.03] + ... } + ... ) + >>> quotes + time bid ask + 0 2016-05-25 13:30:00.023 720.50 720.93 + 1 2016-05-25 13:30:00.023 51.95 51.96 + 2 2016-05-25 13:30:00.030 51.97 51.98 + 3 2016-05-25 13:30:00.041 51.99 52.00 + 4 2016-05-25 13:30:00.048 720.50 720.93 + 5 2016-05-25 13:30:00.049 97.99 98.01 + 6 2016-05-25 13:30:00.072 720.50 720.88 + 7 2016-05-25 13:30:00.075 52.01 52.03 + >>> trades = pd.DataFrame( + ... { + ... "time": [ + ... pd.Timestamp("2016-05-25 13:30:00.023"), + ... pd.Timestamp("2016-05-25 13:30:00.038"), + ... pd.Timestamp("2016-05-25 13:30:00.048"), + ... pd.Timestamp("2016-05-25 13:30:00.048"), + ... pd.Timestamp("2016-05-25 13:30:00.048") + ... ], + ... "price": [51.95, 51.95, 720.77, 720.92, 98.0], + ... "quantity": [75, 155, 100, 100, 100] + ... } + ... ) + >>> trades + time price quantity + 0 2016-05-25 13:30:00.023 51.95 75 + 1 2016-05-25 13:30:00.038 51.95 155 + 2 2016-05-25 13:30:00.048 720.77 100 + 3 2016-05-25 13:30:00.048 720.92 100 + 4 2016-05-25 13:30:00.048 98.00 100 + >>> pd.merge_asof(trades, quotes, on="time") + time price quantity bid ask + 0 2016-05-25 13:30:00.023 51.95 75 51.95 51.96 + 1 2016-05-25 13:30:00.038 51.95 155 51.97 51.98 + 2 2016-05-25 13:30:00.048 720.77 100 720.50 720.93 + 3 2016-05-25 13:30:00.048 720.92 100 720.50 720.93 + 4 2016-05-25 13:30:00.048 98.00 100 720.50 720.93 + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + if not isinstance(left, DataFrame): + raise ValueError(f"can not merge DataFrame with instance of type {type(left)}") + if not isinstance(right, DataFrame): + raise ValueError(f"can not merge DataFrame with instance of type {type(right)}") - yearfirst : bool, default False - Specify a date parse order if `arg` is str or is list-like. + # As of pandas 1.2 these should raise an error; before that it did + # something likely random: + if ( + (on and (left_index or right_index)) + or (left_on and left_index) + or (right_on and right_index) + ): + raise ValueError("Can't combine left/right_index with left/right_on or on.") - - If :const:`True` parses dates with the year first, e.g. - :const:`"10/11/12"` is parsed as :const:`2010-11-12`. - - If both `dayfirst` and `yearfirst` are :const:`True`, `yearfirst` is - preceded (same as :mod:`dateutil`). 
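    # Editorial note (illustrative, not part of the patched function): the argument
    # checks above and below mirror native pandas' merge_asof validation, e.g.
    #     pd.merge_asof(left, right, on="a", left_index=True)   # ValueError: index keys mixed with 'on'
    #     pd.merge_asof(left, right, on="a", left_on="a")       # ValueError: 'on' together with 'left_on'
    #     pd.merge_asof(left, right, by="g", left_by="g")       # ValueError: 'by' together with 'left_by'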
+ if on is not None: + if left_on is not None or right_on is not None: + raise ValueError("If 'on' is set, 'left_on' and 'right_on' can't be set.") + if is_list_like(on) and len(on) > 1: + raise MergeError("can only asof on a key for left") + left_on = on + right_on = on - .. warning:: + if by is not None: + if left_by is not None or right_by is not None: + raise ValueError("Can't have both 'by' and 'left_by' or 'right_by'") + left_by = right_by = by - ``yearfirst=True`` is not strict, but will prefer to parse - with year first. + if left_on is None and not left_index: + raise ValueError("Must pass on, left_on, or left_index=True") - utc : bool, default None - Control timezone-related parsing, localization and conversion. + if right_on is None and not right_index: + raise ValueError("Must pass on, right_on, or right_index=True") - - If :const:`True`, the function *always* returns a timezone-aware - UTC-localized :class:`Timestamp`, :class:`~modin.pandas.Series` or - :class:`DatetimeIndex`. To do this, timezone-naive inputs are - *localized* as UTC, while timezone-aware inputs are *converted* to UTC. + if not left_index and not right_index: + left_on_length = len(left_on) if is_list_like(left_on) else 1 + right_on_length = len(right_on) if is_list_like(right_on) else 1 + if left_on_length != right_on_length: + raise ValueError("len(right_on) must equal len(left_on)") + if left_on_length > 1: + raise MergeError("can only asof on a key for left") - - If :const:`False` (default), inputs will not be coerced to UTC. - Timezone-naive inputs will remain naive, while timezone-aware ones - will keep their time offsets. Limitations exist for mixed - offsets (typically, daylight savings), see :ref:`Examples - ` section for details. + return DataFrame( + query_compiler=left._query_compiler.merge_asof( + right._query_compiler, + on, + left_on, + right_on, + left_index, + right_index, + by, + left_by, + right_by, + suffixes, + tolerance, + allow_exact_matches, + direction, + ) + ) - See also: pandas general documentation about `timezone conversion and - localization - `_. - format : str, default None - The strftime to parse time, e.g. :const:`"%d/%m/%Y"`. Note that - :const:`"%f"` will parse all the way up to nanoseconds. See - `strftime documentation - `_ for more information on choices. - exact : bool, default True - Control how `format` is used: +@snowpark_pandas_telemetry_standalone_function_decorator +def concat( + objs: ( + Iterable[snowflake.snowpark.modin.pandas.DataFrame | Series] + | Mapping[Hashable, snowflake.snowpark.modin.pandas.DataFrame | Series] + ), + axis: Axis = 0, + join: str = "outer", + ignore_index: bool = False, + keys: Sequence[Hashable] = None, + levels: list[Sequence[Hashable]] = None, + names: list[Hashable] = None, + verify_integrity: bool = False, + sort: bool = False, + copy: bool = True, +) -> snowflake.snowpark.modin.pandas.DataFrame | Series: + """ + Concatenate pandas objects along a particular axis. - - If :const:`True`, require an exact `format` match. - - If :const:`False`, allow the `format` to match anywhere in the target - string. + Allows optional set logic along the other axes. - unit : str, default 'ns' - The unit of the arg (D,s,ms,us,ns) denote the unit, which is an - integer or float number. This will be based off the origin. - Example, with ``unit='ms'`` and ``origin='unix'``, this would calculate - the number of milliseconds to the unix epoch start. 
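One input form accepted by the ``concat`` signature above but not shown in its examples is a mapping, whose keys become the outer concatenation keys; a minimal editorial sketch (the frames and names are illustrative only):

    df_a = pd.DataFrame({"x": [1, 2]})
    df_b = pd.DataFrame({"x": [3, 4]})
    # Passing a dict uses its keys for the hierarchical index, so this is
    # equivalent to pd.concat([df_a, df_b], keys=["first", "second"]).
    pd.concat({"first": df_a, "second": df_b})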
- infer_datetime_format : bool, default False - If :const:`True` and no `format` is given, attempt to infer the format - of the datetime strings based on the first non-NaN element, - and if it can be inferred, switch to a faster method of parsing them. - In some cases this can increase the parsing speed by ~5-10x. - origin : scalar, default 'unix' - Define the reference date. The numeric values would be parsed as number - of units (defined by `unit`) since this reference date. + Can also add a layer of hierarchical indexing on the concatenation axis, + which may be useful if the labels are the same (or overlapping) on + the passed axis number. - - If :const:`'unix'` (or POSIX) time; origin is set to 1970-01-01. - - If :const:`'julian'`, unit must be :const:`'D'`, and origin is set to - beginning of Julian Calendar. Julian day number :const:`0` is assigned - to the day starting at noon on January 1, 4713 BC. - - If Timestamp convertible, origin is set to Timestamp identified by - origin. - cache : bool, default True - cache parameter is ignored with Snowflake backend, i.e., no caching will be - applied + Parameters + ---------- + objs : a sequence or mapping of Series or DataFrame objects + If a mapping is passed, the sorted keys will be used as the `keys` + argument, unless it is passed, in which case the values will be + selected (see below). Any None objects will be dropped silently unless + they are all None in which case a ValueError will be raised. + axis : {0/'index', 1/'columns'}, default 0 + The axis to concatenate along. + join : {'inner', 'outer'}, default 'outer' + How to handle indexes on other axis (or axes). + ignore_index : bool, default False + If True, do not use the index values along the concatenation axis. The + resulting axis will be labeled 0, ..., n - 1. This is useful if you are + concatenating objects where the concatenation axis does not have + meaningful indexing information. Note the index values on the other + axes are still respected in the join. + keys : sequence, default None + If multiple levels passed, should contain tuples. Construct + hierarchical index using the passed keys as the outermost level. + levels : list of sequences, default None + Specific levels (unique values) to use for constructing a + MultiIndex. Otherwise they will be inferred from the keys. + Snowpark pandas does not support 'levels' argument. + names : list, default None + Names for the levels in the resulting hierarchical index. + verify_integrity : bool, default False + Check whether the new concatenated axis contains duplicates. + Snowpark pandas does not support distributed computation of concat when + 'verify_integrity' is True. + sort : bool, default False + Sort non-concatenation axis if it is not already aligned. + copy : bool, default True + If False, do not copy data unnecessarily. + This argument is ignored in Snowpark pandas. Returns ------- - datetime - If parsing succeeded. 
- Return type depends on input (types in parenthesis correspond to - fallback in case of unsuccessful timezone or out-of-range timestamp - parsing): - - - scalar: :class:`Timestamp` (or :class:`datetime.datetime`) - - array-like: :class:`~modin.pandas.DatetimeIndex` (or - :class: :class:`~modin.pandas.Series` of :class:`object` dtype containing - :class:`datetime.datetime`) - - Series: :class:`~modin.pandas.Series` of :class:`datetime64` dtype (or - :class: :class:`~modin.pandas.Series` of :class:`object` dtype containing - :class:`datetime.datetime`) - - DataFrame: :class:`~modin.pandas.Series` of :class:`datetime64` dtype (or - :class:`~modin.pandas.Series` of :class:`object` dtype containing - :class:`datetime.datetime`) - - Raises - ------ - ParserError - When parsing a date from string fails. - ValueError - When another datetime conversion error happens. For example when one - of 'year', 'month', day' columns is missing in a :class:`~modin.pandas.DataFrame`, or - when a Timezone-aware :class:`datetime.datetime` is found in an array-like - of mixed time offsets, and ``utc=False``. + object, type of objs + When concatenating all Snowpark pandas :class:`~modin.pandas.Series` along the index (axis=0), + a Snowpark pandas :class:`~modin.pandas.Series` is returned. When ``objs`` contains at least + one Snowpark pandas :class:`~modin.pandas.DataFrame`, + a Snowpark pandas :class:`~modin.pandas.DataFrame` is returned. When concatenating along + the columns (axis=1), a Snowpark pandas :class:`~modin.pandas.DataFrame` is returned. See Also -------- - DataFrame.astype : Cast argument to a specified dtype. - to_timedelta : Convert argument to timedelta. - convert_dtypes : Convert dtypes. + DataFrame.join : Join DataFrames using indexes. + DataFrame.merge : Merge DataFrames by indexes or columns. Notes ----- + The keys, levels, and names arguments are all optional. - Many input types are supported, and lead to different output types: + It is not recommended to build DataFrames by adding single rows in a + for loop. Build a list of rows and make a DataFrame in a single concat. - - **scalars** can be int, float, str, datetime object (from stdlib :mod:`datetime` - module or :mod:`numpy`). They are converted to :class:`Timestamp` when - possible, otherwise they are converted to :class:`datetime.datetime`. - None/NaN/null scalars are converted to :const:`NaT`. + Examples + -------- + Combine two ``Series``. - - **array-like** can contain int, float, str, datetime objects. They are - converted to :class:`DatetimeIndex` when possible, otherwise they are - converted to :class:`Index` with :class:`object` dtype, containing - :class:`datetime.datetime`. None/NaN/null entries are converted to - :const:`NaT` in both cases. + >>> s1 = pd.Series(['a', 'b']) + >>> s2 = pd.Series(['c', 'd']) + >>> pd.concat([s1, s2]) + 0 a + 1 b + 0 c + 1 d + dtype: object - - **Series** are converted to :class:`~modin.pandas.Series` with :class:`datetime64` - dtype when possible, otherwise they are converted to :class:`~modin.pandas.Series` with - :class:`object` dtype, containing :class:`datetime.datetime`. None/NaN/null - entries are converted to :const:`NaT` in both cases. + Clear the existing index and reset it in the result + by setting the ``ignore_index`` option to ``True``. + + >>> pd.concat([s1, s2], ignore_index=True) + 0 a + 1 b + 2 c + 3 d + dtype: object - - **DataFrame/dict-like** are converted to :class:`~modin.pandas.Series` with - :class:`datetime64` dtype. 
For each row a datetime is created from assembling - the various dataframe columns. Column keys can be common abbreviations - like [‘year’, ‘month’, ‘day’, ‘minute’, ‘second’, ‘ms’, ‘us’, ‘ns’]) or - plurals of the same. + Add a hierarchical index at the outermost level of + the data with the ``keys`` option. - The following causes are responsible for :class:`datetime.datetime` objects - being returned (possibly inside an :class:`Index` or a :class:`~modin.pandas.Series` with - :class:`object` dtype) instead of a proper pandas designated type - (:class:`Timestamp` or :class:`~modin.pandas.Series` with :class:`datetime64` dtype): + >>> pd.concat([s1, s2], keys=['s1', 's2']) + s1 0 a + 1 b + s2 0 c + 1 d + dtype: object - - when any input element is before :const:`Timestamp.min` or after - :const:`Timestamp.max`, see `timestamp limitations - `_. + Label the index keys you create with the ``names`` option. - - when ``utc=False`` (default) and the input is an array-like or - :class:`~modin.pandas.Series` containing mixed naive/aware datetime, or aware with mixed - time offsets. Note that this happens in the (quite frequent) situation when - the timezone has a daylight savings policy. In that case you may wish to - use ``utc=True``. + >>> pd.concat([s1, s2], keys=['s1', 's2'], + ... names=['Series name', 'Row ID']) + Series name Row ID + s1 0 a + 1 b + s2 0 c + 1 d + dtype: object - Examples - -------- + Combine two ``DataFrame`` objects with identical columns. - **Handling various input formats** + >>> df1 = pd.DataFrame([['a', 1], ['b', 2]], + ... columns=['letter', 'number']) + >>> df1 + letter number + 0 a 1 + 1 b 2 + >>> df2 = pd.DataFrame([['c', 3], ['d', 4]], + ... columns=['letter', 'number']) + >>> df2 + letter number + 0 c 3 + 1 d 4 + >>> pd.concat([df1, df2]) + letter number + 0 a 1 + 1 b 2 + 0 c 3 + 1 d 4 - Assembling a datetime from multiple columns of a :class:`~modin.pandas.DataFrame`. The keys - can be common abbreviations like ['year', 'month', 'day', 'minute', 'second', - 'ms', 'us', 'ns']) or plurals of the same + Combine ``DataFrame`` objects with overlapping columns + and return everything. Columns outside the intersection will + be filled with ``NaN`` values. - >>> df = pd.DataFrame({'year': [2015, 2016], - ... 'month': [2, 3], - ... 'day': [4, 5]}) - >>> pd.to_datetime(df) - 0 2015-02-04 - 1 2016-03-05 - dtype: datetime64[ns] + >>> df3 = pd.DataFrame([['c', 3, 'cat'], ['d', 4, 'dog']], + ... columns=['letter', 'number', 'animal']) + >>> df3 + letter number animal + 0 c 3 cat + 1 d 4 dog + >>> pd.concat([df1, df3], sort=False) + letter number animal + 0 a 1 None + 1 b 2 None + 0 c 3 cat + 1 d 4 dog - Passing ``infer_datetime_format=True`` can often-times speedup a parsing - if it's not an ISO8601 format exactly, but in a regular format. + Combine ``DataFrame`` objects with overlapping columns + and return only those that are shared by passing ``inner`` to + the ``join`` keyword argument. - >>> s = pd.Series(['3/11/2000', '3/12/2000', '3/13/2000'] * 1000) - >>> s.head() - 0 3/11/2000 - 1 3/12/2000 - 2 3/13/2000 - 3 3/11/2000 - 4 3/12/2000 - dtype: object + >>> pd.concat([df1, df3], join="inner") + letter number + 0 a 1 + 1 b 2 + 0 c 3 + 1 d 4 - Using a unix epoch time + Combine ``DataFrame`` objects horizontally along the x axis by + passing in ``axis=1``. 
- >>> pd.to_datetime(1490195805, unit='s')
- Timestamp('2017-03-22 15:16:45')
- >>> pd.to_datetime(1490195805433502912, unit='ns')
- Timestamp('2017-03-22 15:16:45.433502912')
+ >>> df4 = pd.DataFrame([['bird', 'polly'], ['monkey', 'george']],
+ ... columns=['animal', 'name'])
+ >>> pd.concat([df1, df4], axis=1)
+ letter number animal name
+ 0 a 1 bird polly
+ 1 b 2 monkey george
- .. warning:: For float arg, precision rounding might happen. To prevent
- unexpected behavior use a fixed-width exact type.
+ Combining series horizontally creates a DataFrame. Missing names are replaced with
+ numeric values.
- Using a non-unix epoch origin
+ >>> pd.concat([s1, s2], axis=1)
+ 0 1
+ 0 a c
+ 1 b d
- >>> pd.to_datetime([1, 2, 3], unit='D',
- ... origin=pd.Timestamp('1960-01-01'))
- DatetimeIndex(['1960-01-02', '1960-01-03', '1960-01-04'], dtype='datetime64[ns]', freq=None)
+ When combining objects horizontally, ``ignore_index=True`` will clear the existing
+ column names and reset them in the result.
+ >>> pd.concat([df1, df4], axis=1, ignore_index=True)
+ 0 1 2 3
+ 0 a 1 bird polly
+ 1 b 2 monkey george
- **Non-convertible date/times**
+ When combining objects horizontally, add a hierarchical column index at the
+ outermost level of the column labels with the ``keys`` option.
- If a date does not meet the `timestamp limitations
- `_, passing ``errors='ignore'``
- will return the original input instead of raising any exception.
+ >>> pd.concat([df1, df4], axis=1, keys=['x', 'y']) # doctest: +NORMALIZE_WHITESPACE
+ x y
+ letter number animal name
+ 0 a 1 bird polly
+ 1 b 2 monkey george
- Passing ``errors='coerce'`` will force an out-of-bounds date to :const:`NaT`,
- in addition to forcing non-dates (or non-parseable dates) to :const:`NaT`.
+ Concatenating series horizontally with ``keys``.
- >>> pd.to_datetime(['13000101', 'abc'], format='%Y%m%d', errors='coerce')
- DatetimeIndex(['NaT', 'NaT'], dtype='datetime64[ns]', freq=None)
+ >>> pd.concat([s1, s2], axis=1, keys=['x', 'y'])
+ x y
+ 0 a c
+ 1 b d
+ When combining objects horizontally, pass ``join='inner'`` to keep only overlapping
+ index values.
- .. _to_datetime_tz_examples:
+ >>> df5 = pd.DataFrame([['a', 1], ['b', 2]],
+ ... columns=['letter', 'number'],
+ ... index=[1, 2])
+ >>> df5
+ letter number
+ 1 a 1
+ 2 b 2
+ >>> pd.concat([df1, df5], axis=1, join='inner')
+ letter number letter number
+ 1 b 2 a 1
- **Timezones and time offsets**
+ Prevent the result from including duplicate index values with the
+ ``verify_integrity`` option.
- The default behaviour (``utc=False``) is as follows:
+ >>> df5 = pd.DataFrame([1], index=['a'])
+ >>> df5
+ 0
+ a 1
+ >>> df6 = pd.DataFrame([2], index=['a'])
+ >>> df6
+ 0
+ a 2
+ >>> pd.concat([df5, df6], verify_integrity=True)
+ Traceback (most recent call last):
+ ...
+ ValueError: Indexes have overlapping values: Index(['a'], dtype='object')
- - Timezone-naive inputs are kept as timezone-naive :class:`~modin.pandas.DatetimeIndex`:
+ Append a single row to the end of a ``DataFrame`` object. 
- >>> pd.to_datetime(['2018-10-26 12:00:00', '2018-10-26 13:00:15']) - DatetimeIndex(['2018-10-26 12:00:00', '2018-10-26 13:00:15'], dtype='datetime64[ns]', freq=None) + >>> df7 = pd.DataFrame({'a': 1, 'b': 2}, index=[0]) + >>> df7 + a b + 0 1 2 + >>> new_row = pd.DataFrame({'a': 3, 'b': 4}, index=[0]) + >>> new_row + a b + 0 3 4 + >>> pd.concat([df7, new_row], ignore_index=True) + a b + 0 1 2 + 1 3 4 + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + # Raise error if native pandas objects are passed. + raise_if_native_pandas_objects(objs) - >>> pd.to_datetime(['2018-10-26 12:00:00 -0500', '2018-10-26 13:00:00 -0500']) - DatetimeIndex(['2018-10-26 12:00:00-05:00', '2018-10-26 13:00:00-05:00'], dtype='datetime64[ns, UTC-05:00]', freq=None) + # In native pandas 'concat' API is expected to work with all types of iterables like + # tuples, list, generators, custom iterators, deque etc. + # Few exceptions are 'DataFrame', 'Series', 'str', these are also technically + # iterables, but they are not iterables of pandas objects. + # Note other iterables can also have non pandas objects as element in them, but it's + # not possible to know that in advance without iterating over all objects, so we + # also individual element later. - - Use right format to convert to timezone-aware type (Note that when call Snowpark - pandas API to_pandas() the timezone-aware output will always be converted to session timezone): + # Raise error if 'objs' is not an iterable or an iterable of non-pandas objects. + if not isinstance(objs, Iterable) or isinstance( + objs, (pd.DataFrame, pd.Series, str) + ): + # Same error as native pandas. + raise TypeError( + "first argument must be an iterable of pandas " + f'objects, you passed an object of type "{type(objs).__name__}"' + ) - >>> pd.to_datetime(['2018-10-26 12:00:00 -0500', '2018-10-26 13:00:00 -0500'], format="%Y-%m-%d %H:%M:%S %z") - DatetimeIndex(['2018-10-26 12:00:00-05:00', '2018-10-26 13:00:00-05:00'], dtype='datetime64[ns, UTC-05:00]', freq=None) + if isinstance(objs, dict): + if keys is None: + keys = list(objs.keys()) + # if 'keys' is not none, filter out additional objects from mapping. + objs = [objs[k] for k in keys] + else: + # Native pandas also supports generators as input, that can only be iterated + # only once so first create a list from 'objs'. + objs = list(objs) - - Timezone-aware inputs *with mixed time offsets* (for example - issued from a timezone with daylight savings, such as Europe/Paris): + for obj in objs: + # Raise error if native pandas objects are passed. + raise_if_native_pandas_objects(obj) - >>> pd.to_datetime(['2020-10-25 02:00:00 +0200', '2020-10-25 04:00:00 +0100']) - DatetimeIndex([2020-10-25 02:00:00+02:00, 2020-10-25 04:00:00+01:00], dtype='object', freq=None) + if join not in ("inner", "outer"): + # Same error as native pandas. + raise ValueError( + "Only can inner (intersect) or outer (union) join the other axis" + ) - >>> pd.to_datetime(['2020-10-25 02:00:00 +0200', '2020-10-25 04:00:00 +0100'], format="%Y-%m-%d %H:%M:%S %z") - DatetimeIndex([2020-10-25 02:00:00+02:00, 2020-10-25 04:00:00+01:00], dtype='object', freq=None) + axis = pandas.DataFrame()._get_axis_number(axis) - Setting ``utc=True`` makes sure always convert to timezone-aware outputs: + if len(objs) == 0: + # Same error as native pandas. 
+ raise ValueError("No objects to concatenate") - - Timezone-naive inputs are *localized* based on the session timezone + # Filter out None objects + if keys is None: + objs = [o for o in objs if o is not None] + else: + tuples = [(k, v) for k, v in zip(keys, objs) if v is not None] + # convert list of tuples to tuples of list. + keys, objs = list(map(list, zip(*tuples))) if tuples else ([], []) - >>> pd.to_datetime(['2018-10-26 12:00', '2018-10-26 13:00'], utc=True) - DatetimeIndex(['2018-10-26 12:00:00+00:00', '2018-10-26 13:00:00+00:00'], dtype='datetime64[ns, UTC]', freq=None) + if len(objs) == 0: + # Same error as native pandas. + raise ValueError("All objects passed were None") - - Timezone-aware inputs are *converted* to session timezone + for obj in objs: + # Same error as native pandas. + if not isinstance(obj, (Series, DataFrame)): + raise TypeError( + f"cannot concatenate object of type '{type(obj)}'; " + "only Series and DataFrame objs are valid" + ) - >>> pd.to_datetime(['2018-10-26 12:00:00 -0530', '2018-10-26 12:00:00 -0500'], - ... utc=True) - DatetimeIndex(['2018-10-26 17:30:00+00:00', '2018-10-26 17:00:00+00:00'], dtype='datetime64[ns, UTC]', freq=None) - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - raise_if_native_pandas_objects(arg) + # Assign names to unnamed series - the names function as column labels for Series. + # If all Series have no name, use the keys as names. + if ( + axis == 1 + and keys is not None + and all(isinstance(obj, Series) and obj.name is None for obj in objs) + ): + for i, obj in enumerate(objs): + objs[i] = obj.rename(keys[i]) - if not isinstance(arg, (DataFrame, Series, pd.Index)): - # use pandas.to_datetime to convert local data to datetime - res = pandas.to_datetime( - arg, - errors, - dayfirst, - yearfirst, - utc, - format, - exact, - unit, - infer_datetime_format, - origin, - cache, - ) - if isinstance(res, pandas.Series): - res = pd.Series(res) - elif not is_scalar(res): - res = pd.Index(res) - return res + # If only some Series have names, give them temporary names. + series_name = 0 + for i, obj in enumerate(objs): + if isinstance(obj, pd.Series) and obj.name is None: + objs[i] = obj.rename(series_name) + series_name = series_name + 1 - # handle modin objs - if unit and unit not in VALID_TO_DATETIME_UNIT: - raise ValueError(f"Unrecognized unit {unit}") + # Check if all objects are of Series types. + all_series = all([isinstance(obj, pd.Series) for obj in objs]) + # When concatenating Series objects on axis 0, pandas tries to preserve name from + # input if all have same name otherwise set it to None. + if all_series and axis == 0: + unique_names = {obj.name for obj in objs} + name = objs[0].name if len(unique_names) == 1 else None + objs = [obj.rename(name) for obj in objs] - if not cache: + if not copy: WarningMessage.ignored_argument( - operation="to_datetime", - argument="cache", - message="cache parameter is ignored with Snowflake backend, i.e., no caching will be applied", + operation="concat", + argument="copy", + message="copy parameter has been ignored with Snowflake execution engine", ) - return arg._to_datetime( - errors=errors, - dayfirst=dayfirst, - yearfirst=yearfirst, - utc=utc, - format=format, - exact=exact, - unit=unit, - infer_datetime_format=infer_datetime_format, - origin=origin, + # For the edge case where concatenation is done on the columns where all the objects are series, + # need to prevent a second column level from being created - therefore, keys is None. 
+ keys = None if axis == 1 and all(isinstance(obj, Series) for obj in objs) else keys + + result = objs[0]._query_compiler.concat( + axis, + [o._query_compiler for o in objs[1:]], + join=join, + ignore_index=ignore_index, + keys=keys, + levels=levels, + names=names, + verify_integrity=verify_integrity, + sort=sort, ) + # If all objects are series and concat axis=0, return Series else return DataFrame. + if all_series and axis == 0: + return Series(query_compiler=result) + return DataFrame(query_compiler=result) @snowpark_pandas_telemetry_standalone_function_decorator @@ -1885,515 +1982,640 @@ def get_dummies( 2 0 0 1 3 1 0 0 - >>> df = pd.DataFrame({'A': ['a', 'b', 'a'], 'B': ['b', 'a', 'c'], - ... 'C': [1, 2, 3]}) + >>> df = pd.DataFrame({'A': ['a', 'b', 'a'], 'B': ['b', 'a', 'c'], + ... 'C': [1, 2, 3]}) + + >>> pd.get_dummies(df, prefix=['col1', 'col2']) + C col1_a col1_b col2_a col2_b col2_c + 0 1 1 0 0 1 0 + 1 2 0 1 1 0 0 + 2 3 1 0 0 0 1 + + >>> pd.get_dummies(pd.Series(list('abcaa'))) + a b c + 0 1 0 0 + 1 0 1 0 + 2 0 0 1 + 3 1 0 0 + 4 1 0 0 + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + new_qc = data._query_compiler.get_dummies( + columns=columns, + prefix=prefix, + prefix_sep=prefix_sep, + dummy_na=dummy_na, + drop_first=drop_first, + dtype=dtype, + is_series=not data._is_dataframe, + ) + return DataFrame(query_compiler=new_qc) + + +@snowpark_pandas_telemetry_standalone_function_decorator +def unique(values) -> np.ndarray: + """ + Return unique values based on a hash table. Unique values are + returned in the order of appearance. This does NOT sort. + + Parameters + ---------- + values : ndarray (1-d), list, bytearray, tuple, Series, Index, list-like + Non-hashable objects like set, dict, and user defined classes are + invalid input. + Values to perform computation. + + Returns + ------- + ndarray + The unique values returned as a NumPy array. See Notes. + + See Also + -------- + Series.unique() + + Notes + ----- + Returns the unique values as a NumPy array. This includes + + * Datetime with Timezone + * IntegerNA + + See Examples section. + + Examples + -------- + >>> pd.unique([2, 1, 3, 3]) + array([2, 1, 3]) + + >>> pd.unique([pd.Timestamp('2016-01-01', tz='US/Eastern') + ... for _ in range(3)]) + array([Timestamp('2016-01-01 00:00:00-0500', tz='UTC-05:00')], + dtype=object) + + >>> pd.unique([("a", "b"), ("b", "a"), ("a", "c"), ("b", "a")]) + array([list(['a', 'b']), list(['b', 'a']), list(['a', 'c'])], dtype=object) + + >>> pd.unique([None, np.nan, 2]) + array([nan, 2.]) + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + if is_list_like(values) and not isinstance(values, dict): + return Series(values).unique() + else: + raise TypeError("Only list-like objects can be used with unique()") + + +# Adding docstring since pandas docs don't have web section for this function. +@snowpark_pandas_telemetry_standalone_function_decorator +@pandas_module_level_function_not_implemented() +def lreshape(data: DataFrame, groups, dropna=True, label=None): + """ + Reshape wide-format data to long. Generalized inverse of ``DataFrame.pivot``. + + Accepts a dictionary, `groups`, in which each key is a new column name + and each value is a list of old column names that will be "melted" under + the new column name as part of the reshape. + + Parameters + ---------- + data : DataFrame + The wide-format DataFrame. + groups : dict + Dictionary in the form: `{new_name : list_of_columns}`. 
+ dropna : bool, default: True + Whether include columns whose entries are all NaN or not. + label : optional + Deprecated parameter. + + Returns + ------- + DataFrame + Reshaped DataFrame. + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + if not isinstance(data, DataFrame): + raise ValueError(f"can not lreshape with instance of type {type(data)}") + return DataFrame( + pandas.lreshape(to_pandas(data), groups, dropna=dropna, label=label) + ) + + +@_inherit_docstrings(pandas.wide_to_long, apilink="pandas.wide_to_long") +@snowpark_pandas_telemetry_standalone_function_decorator +@pandas_module_level_function_not_implemented() +def wide_to_long( + df: DataFrame, stubnames, i, j, sep: str = "", suffix: str = r"\d+" +) -> DataFrame: # noqa: PR01, RT01, D200 + """ + Unpivot a DataFrame from wide to long format. + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + if not isinstance(df, DataFrame): + raise ValueError(f"can not wide_to_long with instance of type {type(df)}") + # ErrorMessage.default_to_pandas("`wide_to_long`") + return DataFrame( + pandas.wide_to_long(to_pandas(df), stubnames, i, j, sep=sep, suffix=suffix) + ) + + +########################################################################### +# Top-level missing data +########################################################################### + + +@snowpark_pandas_telemetry_standalone_function_decorator +@_inherit_docstrings(pandas.isna, apilink="pandas.isna") +def isna(obj): # noqa: PR01, RT01, D200 + """ + Detect missing values for an array-like object. + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + if isinstance(obj, BasePandasDataset): + return obj.isna() + else: + return pandas.isna(obj) + - >>> pd.get_dummies(df, prefix=['col1', 'col2']) - C col1_a col1_b col2_a col2_b col2_c - 0 1 1 0 0 1 0 - 1 2 0 1 1 0 0 - 2 3 1 0 0 0 1 +isnull = isna - >>> pd.get_dummies(pd.Series(list('abcaa'))) - a b c - 0 1 0 0 - 1 0 1 0 - 2 0 0 1 - 3 1 0 0 - 4 1 0 0 + +@snowpark_pandas_telemetry_standalone_function_decorator +@_inherit_docstrings(pandas.notna, apilink="pandas.notna") +def notna(obj): # noqa: PR01, RT01, D200 + """ + Detect non-missing values for an array-like object. """ # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - new_qc = data._query_compiler.get_dummies( - columns=columns, - prefix=prefix, - prefix_sep=prefix_sep, - dummy_na=dummy_na, - drop_first=drop_first, - dtype=dtype, - is_series=not data._is_dataframe, - ) - return DataFrame(query_compiler=new_qc) + if isinstance(obj, BasePandasDataset): + return obj.notna() + else: + return pandas.notna(obj) + + +notnull = notna + + +########################################################################### +# Top-level dealing with numeric data +########################################################################### @snowpark_pandas_telemetry_standalone_function_decorator -def melt( - frame, - id_vars=None, - value_vars=None, - var_name=None, - value_name="value", - col_level=None, - ignore_index: bool = True, -): # noqa: PR01, RT01, D200 +def to_numeric( + arg: Scalar | Series | ArrayConvertible, + errors: Literal["ignore", "raise", "coerce"] = "raise", + downcast: Literal["integer", "signed", "unsigned", "float"] | None = None, +) -> Series | Scalar | None: """ - Unpivot a DataFrame from wide to long format, optionally leaving identifiers set. + Convert argument to a numeric type. 
+ + If the input arg type is already a numeric type, the return dtype + will be the original type; otherwise, the return dtype is float. Parameters ---------- - id_vars : list of identifiers to retain in the result - value_vars : list of columns to unpivot on - defaults to all columns, excluding the id_vars columns - var_name : variable name, defaults to "variable" - value_name : value name, defaults to "value" - col_level : int, not implemented - ignore_index : bool, not implemented + arg : scalar, list, tuple, 1-d array, or Series + Argument to be converted. + errors : {'ignore', 'raise', 'coerce'}, default 'raise' + - If 'raise', then invalid parsing will raise an exception. + - If 'coerce', then invalid parsing will be set as NaN. + - If 'ignore', then invalid parsing will return the input. + downcast : str, default None + downcast is ignored in Snowflake backend. Returns ------- - :class:`~modin.pandas.DataFrame` - unpivoted on the value columns + ret + Numeric if parsing succeeded. + Return type depends on input. Series if `arg` is not scalar. + + See Also + -------- + DataFrame.astype : Cast argument to a specified dtype. + to_datetime : Convert argument to datetime. + to_timedelta : Convert argument to timedelta. + numpy.ndarray.astype : Cast a numpy array to a specified type. + DataFrame.convert_dtypes : Convert dtypes. Examples -------- - >>> df = pd.DataFrame({'A': {0: 'a', 1: 'b', 2: 'c'}, - ... 'B': {0: 1, 1: 3, 2: 5}, - ... 'C': {0: 2, 1: 4, 2: 6}}) + Take separate series and convert to numeric, coercing when told to - >>> pd.melt(df) - variable value - 0 A a - 1 A b - 2 A c - 3 B 1 - 4 B 3 - 5 B 5 - 6 C 2 - 7 C 4 - 8 C 6 + >>> s = pd.Series(['1.0', '2', -3]) + >>> pd.to_numeric(s) + 0 1.0 + 1 2.0 + 2 -3.0 + dtype: float64 - >>> df = pd.DataFrame({'A': {0: 'a', 1: 'b', 2: 'c'}, - ... 'B': {0: 1, 1: 3, 2: 5}, - ... 
'C': {0: 2, 1: 4, 2: 6}}) - >>> pd.melt(df, id_vars=['A'], value_vars=['B'], var_name='myVarname', value_name='myValname') - A myVarname myValname - 0 a B 1 - 1 b B 3 - 2 c B 5 + Note: to_numeric always converts non-numeric values to floats + >>> s = pd.Series(['1', '2', '-3']) + >>> pd.to_numeric(s) + 0 1.0 + 1 2.0 + 2 -3.0 + dtype: float64 + >>> pd.to_numeric(s, downcast='float') # downcast is ignored + 0 1.0 + 1 2.0 + 2 -3.0 + dtype: float64 + >>> pd.to_numeric(s, downcast='signed') # downcast is ignored + 0 1.0 + 1 2.0 + 2 -3.0 + dtype: float64 + >>> s = pd.Series(['apple', '1.0', '2', -3]) + >>> pd.to_numeric(s, errors='coerce') + 0 NaN + 1 1.0 + 2 2.0 + 3 -3.0 + dtype: float64 """ # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - return frame.melt( - id_vars=id_vars, - value_vars=value_vars, - var_name=var_name, - value_name=value_name, - col_level=col_level, - ignore_index=ignore_index, - ) + raise_if_native_pandas_objects(arg) + if errors not in ("ignore", "raise", "coerce"): + raise ValueError("invalid error value specified") + if downcast is not None: + WarningMessage.ignored_argument( + operation="to_numeric", + argument="downcast", + message="downcast is ignored in Snowflake backend", + ) + # convert arg to series + arg_is_scalar = is_scalar(arg) + + if ( + not arg_is_scalar + and not isinstance(arg, (list, tuple, Series)) + and not (is_array_like(arg) and arg.ndim == 1) + ): + raise TypeError("arg must be a list, tuple, 1-d array, or Series") + + if arg_is_scalar: + arg = Series([arg]) + + if not isinstance(arg, Series): + name = None + # keep index name + if isinstance(arg, pandas.Index): + name = arg.name + arg = Series(arg, name=name) + + ret = arg._to_numeric(errors=errors) + if arg_is_scalar: + # use squeeze to turn the series result into a scalar + ret = ret.squeeze() + return ret + + +########################################################################### +# Top-level dealing with datetimelike data +########################################################################### @snowpark_pandas_telemetry_standalone_function_decorator -def crosstab( - index, - columns, - values=None, - rownames=None, - colnames=None, - aggfunc=None, - margins=False, - margins_name: str = "All", - dropna: bool = True, - normalize=False, -) -> DataFrame: # noqa: PR01, RT01, D200 +def to_datetime( + arg: DatetimeScalarOrArrayConvertible + | DictConvertible + | snowflake.snowpark.modin.pandas.DataFrame + | Series, + errors: DateTimeErrorChoices = "raise", + dayfirst: bool = False, + yearfirst: bool = False, + utc: bool = False, + format: str | None = None, + exact: bool | lib.NoDefault = lib.no_default, + unit: str | None = None, + infer_datetime_format: lib.NoDefault | bool = lib.no_default, + origin: Any = "unix", + cache: bool = True, +) -> pd.DatetimeIndex | Series | DatetimeScalar | NaTType | None: """ - Compute a simple cross tabulation of two (or more) factors. + Convert argument to datetime. + + This function converts a scalar, array-like, :class:`~modin.pandas.Series` or + :class:`~modin.pandas.DataFrame`/dict-like to a pandas datetime object. + + Parameters + ---------- + arg : int, float, str, datetime, list, tuple, 1-d array, Series, :class:`~modin.pandas.DataFrame`/dict-like + The object to convert to a datetime. If a :class:`~modin.pandas.DataFrame` is provided, the + method expects minimally the following columns: :const:`"year"`, + :const:`"month"`, :const:`"day"`. 
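A small illustrative note on the scalar path of ``to_numeric`` above (an editorial sketch; the values shown are expectations based on the float-conversion note in its docstring, not outputs taken from the patch):

    # A scalar input is wrapped in a Series internally and squeezed back to a scalar,
    # so a numeric string is expected to come back as a float.
    pd.to_numeric("12")         # expected: 12.0
    pd.to_numeric(["1", "2"])   # expected: a Series of floats [1.0, 2.0]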
+ errors : {'ignore', 'raise', 'coerce'}, default 'raise' + - If :const:`'raise'`, then invalid parsing will raise an exception. + - If :const:`'coerce'`, then invalid parsing will be set as :const:`NaT`. + - If :const:`'ignore'`, then invalid parsing will return the input. + dayfirst : bool, default False + Specify a date parse order if `arg` is str or is list-like. + If :const:`True`, parses dates with the day first, e.g. :const:`"10/11/12"` + is parsed as :const:`2012-11-10`. + + .. warning:: + + ``dayfirst=True`` is not strict, but will prefer to parse + with day first. If a delimited date string cannot be parsed in + accordance with the given `dayfirst` option, e.g. + ``to_datetime(['31-12-2021'])``, then a warning will be shown. + + yearfirst : bool, default False + Specify a date parse order if `arg` is str or is list-like. + + - If :const:`True` parses dates with the year first, e.g. + :const:`"10/11/12"` is parsed as :const:`2010-11-12`. + - If both `dayfirst` and `yearfirst` are :const:`True`, `yearfirst` is + preceded (same as :mod:`dateutil`). + + .. warning:: + + ``yearfirst=True`` is not strict, but will prefer to parse + with year first. + + utc : bool, default None + Control timezone-related parsing, localization and conversion. - By default, computes a frequency table of the factors unless an array - of values and an aggregation function are passed. + - If :const:`True`, the function *always* returns a timezone-aware + UTC-localized :class:`Timestamp`, :class:`~modin.pandas.Series` or + :class:`DatetimeIndex`. To do this, timezone-naive inputs are + *localized* as UTC, while timezone-aware inputs are *converted* to UTC. - Parameters - ---------- - index : array-like, Series, or list of arrays/Series - Values to group by in the rows. - columns : array-like, Series, or list of arrays/Series - Values to group by in the columns. - values : array-like, optional - Array of values to aggregate according to the factors. - Requires aggfunc be specified. - rownames : sequence, default None - If passed, must match number of row arrays passed. - colnames : sequence, default None - If passed, must match number of column arrays passed. - aggfunc : function, optional - If specified, requires values be specified as well. - margins : bool, default False - Add row/column margins (subtotals). - margins_name : str, default 'All' - Name of the row/column that will contain the totals when margins is True. - dropna : bool, default True - Do not include columns whose entries are all NaN. + - If :const:`False` (default), inputs will not be coerced to UTC. + Timezone-naive inputs will remain naive, while timezone-aware ones + will keep their time offsets. Limitations exist for mixed + offsets (typically, daylight savings), see :ref:`Examples + ` section for details. - normalize : bool, {'all', 'index', 'columns'}, or {0,1}, default False - Normalize by dividing all values by the sum of values. + See also: pandas general documentation about `timezone conversion and + localization + `_. - * If passed 'all' or True, will normalize over all values. - * If passed 'index' will normalize over each row. - * If passed 'columns' will normalize over each column. - * If margins is True, will also normalize margin values. + format : str, default None + The strftime to parse time, e.g. :const:`"%d/%m/%Y"`. Note that + :const:`"%f"` will parse all the way up to nanoseconds. See + `strftime documentation + `_ for more information on choices. 
+ exact : bool, default True + Control how `format` is used: - Returns - ------- - Snowpark pandas :class:`~modin.pandas.DataFrame` - Cross tabulation of the data. + - If :const:`True`, require an exact `format` match. + - If :const:`False`, allow the `format` to match anywhere in the target + string. - Notes - ----- + unit : str, default 'ns' + The unit of the arg (D,s,ms,us,ns) denote the unit, which is an + integer or float number. This will be based off the origin. + Example, with ``unit='ms'`` and ``origin='unix'``, this would calculate + the number of milliseconds to the unix epoch start. + infer_datetime_format : bool, default False + If :const:`True` and no `format` is given, attempt to infer the format + of the datetime strings based on the first non-NaN element, + and if it can be inferred, switch to a faster method of parsing them. + In some cases this can increase the parsing speed by ~5-10x. + origin : scalar, default 'unix' + Define the reference date. The numeric values would be parsed as number + of units (defined by `unit`) since this reference date. - Raises NotImplementedError if aggfunc is not one of "count", "mean", "min", "max", or "sum", or - margins is True, normalize is True or all, and values is passed. + - If :const:`'unix'` (or POSIX) time; origin is set to 1970-01-01. + - If :const:`'julian'`, unit must be :const:`'D'`, and origin is set to + beginning of Julian Calendar. Julian day number :const:`0` is assigned + to the day starting at noon on January 1, 4713 BC. + - If Timestamp convertible, origin is set to Timestamp identified by + origin. + cache : bool, default True + cache parameter is ignored with Snowflake backend, i.e., no caching will be + applied - Examples - -------- - >>> a = np.array(["foo", "foo", "foo", "foo", "bar", "bar", - ... "bar", "bar", "foo", "foo", "foo"], dtype=object) - >>> b = np.array(["one", "one", "one", "two", "one", "one", - ... "one", "two", "two", "two", "one"], dtype=object) - >>> c = np.array(["dull", "dull", "shiny", "dull", "dull", "shiny", - ... "shiny", "dull", "shiny", "shiny", "shiny"], - ... dtype=object) - >>> pd.crosstab(a, [b, c], rownames=['a'], colnames=['b', 'c']) # doctest: +NORMALIZE_WHITESPACE - b one two - c dull shiny dull shiny - a - bar 1 2 1 0 - foo 2 2 1 2 - """ - if values is None and aggfunc is not None: - raise ValueError("aggfunc cannot be used without values.") + Returns + ------- + datetime + If parsing succeeded. + Return type depends on input (types in parenthesis correspond to + fallback in case of unsuccessful timezone or out-of-range timestamp + parsing): - if values is not None and aggfunc is None: - raise ValueError("values cannot be used without an aggfunc.") + - scalar: :class:`Timestamp` (or :class:`datetime.datetime`) + - array-like: :class:`~modin.pandas.DatetimeIndex` (or + :class: :class:`~modin.pandas.Series` of :class:`object` dtype containing + :class:`datetime.datetime`) + - Series: :class:`~modin.pandas.Series` of :class:`datetime64` dtype (or + :class: :class:`~modin.pandas.Series` of :class:`object` dtype containing + :class:`datetime.datetime`) + - DataFrame: :class:`~modin.pandas.Series` of :class:`datetime64` dtype (or + :class:`~modin.pandas.Series` of :class:`object` dtype containing + :class:`datetime.datetime`) - if not is_nested_list_like(index): - index = [index] - if not is_nested_list_like(columns): - columns = [columns] + Raises + ------ + ParserError + When parsing a date from string fails. + ValueError + When another datetime conversion error happens. 
For example when one + of 'year', 'month', day' columns is missing in a :class:`~modin.pandas.DataFrame`, or + when a Timezone-aware :class:`datetime.datetime` is found in an array-like + of mixed time offsets, and ``utc=False``. - if ( - values is not None - and margins is True - and (normalize is True or normalize == "all") - ): - raise NotImplementedError( - 'Snowpark pandas does not yet support passing in margins=True, normalize="all", and values.' - ) + See Also + -------- + DataFrame.astype : Cast argument to a specified dtype. + to_timedelta : Convert argument to timedelta. + convert_dtypes : Convert dtypes. - user_passed_rownames = rownames is not None - user_passed_colnames = colnames is not None + Notes + ----- - from pandas.core.reshape.pivot import _build_names_mapper, _get_names + Many input types are supported, and lead to different output types: - def _get_names_wrapper(list_of_objs, names, prefix): - """ - Helper method to expand DataFrame objects containing - multiple columns into Series, since `_get_names` expects - one column per entry. - """ - expanded_list_of_objs = [] - for obj in list_of_objs: - if isinstance(obj, DataFrame): - for col in obj.columns: - expanded_list_of_objs.append(obj[col]) - else: - expanded_list_of_objs.append(obj) - return _get_names(expanded_list_of_objs, names, prefix) + - **scalars** can be int, float, str, datetime object (from stdlib :mod:`datetime` + module or :mod:`numpy`). They are converted to :class:`Timestamp` when + possible, otherwise they are converted to :class:`datetime.datetime`. + None/NaN/null scalars are converted to :const:`NaT`. - rownames = _get_names_wrapper(index, rownames, prefix="row") - colnames = _get_names_wrapper(columns, colnames, prefix="col") + - **array-like** can contain int, float, str, datetime objects. They are + converted to :class:`DatetimeIndex` when possible, otherwise they are + converted to :class:`Index` with :class:`object` dtype, containing + :class:`datetime.datetime`. None/NaN/null entries are converted to + :const:`NaT` in both cases. - ( - rownames_mapper, - unique_rownames, - colnames_mapper, - unique_colnames, - ) = _build_names_mapper(rownames, colnames) + - **Series** are converted to :class:`~modin.pandas.Series` with :class:`datetime64` + dtype when possible, otherwise they are converted to :class:`~modin.pandas.Series` with + :class:`object` dtype, containing :class:`datetime.datetime`. None/NaN/null + entries are converted to :const:`NaT` in both cases. - pass_objs = [x for x in index + columns if isinstance(x, (Series, DataFrame))] - row_idx_names = None - col_idx_names = None - if pass_objs: - # If we have any Snowpark pandas objects in the index or columns, then we - # need to find the intersection of their indices, and only pick rows from - # the objects that have indices in the intersection of their indices. - # After we do that, we then need to append the non Snowpark pandas objects - # using the intersection of indices as the final index for the DataFrame object. - # First, we separate the objects into Snowpark pandas objects, and non-Snowpark - # pandas objects (while renaming them so that they have unique names). 
- rownames_idx = 0 - row_idx_names = [] - dfs = [] - arrays = [] - array_lengths = [] - for obj in index: - if isinstance(obj, Series): - row_idx_names.append(obj.name) - df = pd.DataFrame(obj) - df.columns = [unique_rownames[rownames_idx]] - rownames_idx += 1 - dfs.append(df) - elif isinstance(obj, DataFrame): - row_idx_names.extend(obj.columns) - obj.columns = unique_rownames[ - rownames_idx : rownames_idx + len(obj.columns) - ] - rownames_idx += len(obj.columns) - dfs.append(obj) - else: - row_idx_names.append(None) - array_lengths.append(len(obj)) - df = pd.DataFrame(obj) - df.columns = unique_rownames[ - rownames_idx : rownames_idx + len(df.columns) - ] - rownames_idx += len(df.columns) - arrays.append(df) + - **DataFrame/dict-like** are converted to :class:`~modin.pandas.Series` with + :class:`datetime64` dtype. For each row a datetime is created from assembling + the various dataframe columns. Column keys can be common abbreviations + like [‘year’, ‘month’, ‘day’, ‘minute’, ‘second’, ‘ms’, ‘us’, ‘ns’]) or + plurals of the same. - colnames_idx = 0 - col_idx_names = [] - for obj in columns: - if isinstance(obj, Series): - col_idx_names.append(obj.name) - df = pd.DataFrame(obj) - df.columns = [unique_colnames[colnames_idx]] - colnames_idx += 1 - dfs.append(df) - elif isinstance(obj, DataFrame): - col_idx_names.extend(obj.columns) - obj.columns = unique_colnames[ - colnames_idx : colnames_idx + len(obj.columns) - ] - colnames_idx += len(obj.columns) - dfs.append(obj) - else: - col_idx_names.append(None) - array_lengths.append(len(obj)) - df = pd.DataFrame(obj) - df.columns = unique_colnames[ - colnames_idx : colnames_idx + len(df.columns) - ] - colnames_idx += len(df.columns) - arrays.append(df) + The following causes are responsible for :class:`datetime.datetime` objects + being returned (possibly inside an :class:`Index` or a :class:`~modin.pandas.Series` with + :class:`object` dtype) instead of a proper pandas designated type + (:class:`Timestamp` or :class:`~modin.pandas.Series` with :class:`datetime64` dtype): - if len(set(array_lengths)) > 1: - raise ValueError("All arrays must be of the same length") + - when any input element is before :const:`Timestamp.min` or after + :const:`Timestamp.max`, see `timestamp limitations + `_. - # Now, we have two lists - a list of Snowpark pandas objects, and a list of objects - # that were not passed in as Snowpark pandas objects, but that we have converted - # to Snowpark pandas objects to give them column names. We can perform inner joins - # on the dfs list to get a DataFrame with the final index (that is only an intersection - # of indices.) - df = dfs[0] - for right in dfs[1:]: - df = df.merge(right, left_index=True, right_index=True) - if len(arrays) > 0: - index = df.index - right_df = pd.concat(arrays, axis=1) - # Increases query count by 1, but necessary for error checking. - index_length = len(df) - if index_length != array_lengths[0]: - raise ValueError( - f"Length mismatch: Expected {array_lengths[0]} rows, received array of length {index_length}" - ) - right_df.index = index - df = df.merge(right_df, left_index=True, right_index=True) - else: - data = { - **dict(zip(unique_rownames, index)), - **dict(zip(unique_colnames, columns)), - } - df = DataFrame(data) + - when ``utc=False`` (default) and the input is an array-like or + :class:`~modin.pandas.Series` containing mixed naive/aware datetime, or aware with mixed + time offsets. 
Note that this happens in the (quite frequent) situation when + the timezone has a daylight savings policy. In that case you may wish to + use ``utc=True``. - if values is None: - df["__dummy__"] = 0 - kwargs = {"aggfunc": "count"} - else: - df["__dummy__"] = values - kwargs = {"aggfunc": aggfunc} + Examples + -------- - table = df.pivot_table( - "__dummy__", - index=unique_rownames, - columns=unique_colnames, - margins=margins, - margins_name=margins_name, - dropna=dropna, - **kwargs, # type: ignore[arg-type] - ) + **Handling various input formats** - if row_idx_names is not None and not user_passed_rownames: - table.index = table.index.set_names(row_idx_names) + Assembling a datetime from multiple columns of a :class:`~modin.pandas.DataFrame`. The keys + can be common abbreviations like ['year', 'month', 'day', 'minute', 'second', + 'ms', 'us', 'ns']) or plurals of the same - if col_idx_names is not None and not user_passed_colnames: - table.columns = table.columns.set_names(col_idx_names) + >>> df = pd.DataFrame({'year': [2015, 2016], + ... 'month': [2, 3], + ... 'day': [4, 5]}) + >>> pd.to_datetime(df) + 0 2015-02-04 + 1 2016-03-05 + dtype: datetime64[ns] - if aggfunc is None: - # If no aggfunc is provided, we are computing frequencies. Since we use - # pivot_table above, pairs that are not observed will get a NaN value, - # so we need to fill all NaN values with 0. - table = table.fillna(0) + Passing ``infer_datetime_format=True`` can often-times speedup a parsing + if it's not an ISO8601 format exactly, but in a regular format. - # We must explicitly check that the value of normalize is not False here, - # as a valid value of normalize is `0` (for normalizing index). - if normalize is not False: - if normalize not in [0, 1, "index", "columns", "all", True]: - raise ValueError("Not a valid normalize argument") - if normalize is True: - normalize = "all" - normalize = {0: "index", 1: "columns"}.get(normalize, normalize) + >>> s = pd.Series(['3/11/2000', '3/12/2000', '3/13/2000'] * 1000) + >>> s.head() + 0 3/11/2000 + 1 3/12/2000 + 2 3/13/2000 + 3 3/11/2000 + 4 3/12/2000 + dtype: object - # Actual Normalizations - normalizers: dict[bool | str, Callable] = { - "all": lambda x: x / x.sum(axis=0).sum(), - "columns": lambda x: x / x.sum(), - "index": lambda x: x.div(x.sum(axis=1), axis="index"), - } + Using a unix epoch time - if margins is False: + >>> pd.to_datetime(1490195805, unit='s') + Timestamp('2017-03-22 15:16:45') + >>> pd.to_datetime(1490195805433502912, unit='ns') + Timestamp('2017-03-22 15:16:45.433502912') - f = normalizers[normalize] - names = table.columns.names - table = f(table) - table.columns.names = names - table = table.fillna(0) - else: - # keep index and column of pivoted table - table_index = table.index - table_columns = table.columns + .. warning:: For float arg, precision rounding might happen. To prevent + unexpected behavior use a fixed-width exact type. - column_margin = table.iloc[:-1, -1] + Using a non-unix epoch origin - if normalize == "columns": - # keep the core table - table = table.iloc[:-1, :-1] + >>> pd.to_datetime([1, 2, 3], unit='D', + ... 
origin=pd.Timestamp('1960-01-01')) + DatetimeIndex(['1960-01-02', '1960-01-03', '1960-01-04'], dtype='datetime64[ns]', freq=None) - # Normalize core - f = normalizers[normalize] - table = f(table) - table = table.fillna(0) - # Fix Margins - column_margin = column_margin / column_margin.sum() - table = pd.concat([table, column_margin], axis=1) - table = table.fillna(0) - table.columns = table_columns - elif normalize == "index": - table = table.iloc[:, :-1] + **Non-convertible date/times** - # Normalize core - f = normalizers[normalize] - table = f(table) - table = table.fillna(0).reindex(index=table_index) + If a date does not meet the `timestamp limitations + `_, passing ``errors='ignore'`` + will return the original input instead of raising any exception. - elif normalize == "all": - # Normalize core - f = normalizers[normalize] + Passing ``errors='coerce'`` will force an out-of-bounds date to :const:`NaT`, + in addition to forcing non-dates (or non-parseable dates) to :const:`NaT`. - # When we perform the normalization function, we take the sum over - # the rows, and divide every value by the sum. Since margins is included - # though, the result of the sum is actually 2 * the sum of the original - # values (since the margin itself is the sum of the original values), - # so we need to multiply by 2 here to account for that. - # The alternative would be to apply normalization to the main table - # and the index margins separately, but that would require additional joins - # to get the final table, which we want to avoid. - table = f(table.iloc[:, :-1]) * 2.0 + >>> pd.to_datetime(['13000101', 'abc'], format='%Y%m%d', errors='coerce') + DatetimeIndex(['NaT', 'NaT'], dtype='datetime64[ns]', freq=None) - column_margin = column_margin / column_margin.sum() - table = pd.concat([table, column_margin], axis=1) - table.iloc[-1, -1] = 1 - table = table.fillna(0) - table.index = table_index - table.columns = table_columns + .. _to_datetime_tz_examples: - table = table.rename_axis(index=rownames_mapper, axis=0) - table = table.rename_axis(columns=colnames_mapper, axis=1) + **Timezones and time offsets** - return table + The default behaviour (``utc=False``) is as follows: + - Timezone-naive inputs are kept as timezone-naive :class:`~modin.pandas.DatetimeIndex`: -# Adding docstring since pandas docs don't have web section for this function. -@snowpark_pandas_telemetry_standalone_function_decorator -@pandas_module_level_function_not_implemented() -def lreshape(data: DataFrame, groups, dropna=True, label=None): - """ - Reshape wide-format data to long. Generalized inverse of ``DataFrame.pivot``. + >>> pd.to_datetime(['2018-10-26 12:00:00', '2018-10-26 13:00:15']) + DatetimeIndex(['2018-10-26 12:00:00', '2018-10-26 13:00:15'], dtype='datetime64[ns]', freq=None) - Accepts a dictionary, `groups`, in which each key is a new column name - and each value is a list of old column names that will be "melted" under - the new column name as part of the reshape. + >>> pd.to_datetime(['2018-10-26 12:00:00 -0500', '2018-10-26 13:00:00 -0500']) + DatetimeIndex(['2018-10-26 12:00:00-05:00', '2018-10-26 13:00:00-05:00'], dtype='datetime64[ns, UTC-05:00]', freq=None) - Parameters - ---------- - data : DataFrame - The wide-format DataFrame. - groups : dict - Dictionary in the form: `{new_name : list_of_columns}`. - dropna : bool, default: True - Whether include columns whose entries are all NaN or not. - label : optional - Deprecated parameter. 
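
The crosstab implementation removed above is relocated by this patch rather than dropped; as a reminder of the behaviour its normalization and margins handling covers, a small illustrative sketch follows (the inputs are made up, and only options the Snowpark backend supports are shown):

a = ["foo", "foo", "bar", "bar", "foo"]
b = ["one", "two", "one", "two", "two"]
freq = pd.crosstab(a, b, rownames=["a"], colnames=["b"])      # plain frequency table
by_row = pd.crosstab(a, b, normalize="index")                 # each row sums to 1
totals = pd.crosstab(a, b, margins=True, margins_name="All")  # adds a subtotal row/column
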
+ - Use right format to convert to timezone-aware type (Note that when call Snowpark + pandas API to_pandas() the timezone-aware output will always be converted to session timezone): - Returns - ------- - DataFrame - Reshaped DataFrame. - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if not isinstance(data, DataFrame): - raise ValueError(f"can not lreshape with instance of type {type(data)}") - return DataFrame( - pandas.lreshape(to_pandas(data), groups, dropna=dropna, label=label) - ) + >>> pd.to_datetime(['2018-10-26 12:00:00 -0500', '2018-10-26 13:00:00 -0500'], format="%Y-%m-%d %H:%M:%S %z") + DatetimeIndex(['2018-10-26 12:00:00-05:00', '2018-10-26 13:00:00-05:00'], dtype='datetime64[ns, UTC-05:00]', freq=None) + - Timezone-aware inputs *with mixed time offsets* (for example + issued from a timezone with daylight savings, such as Europe/Paris): -@_inherit_docstrings(pandas.wide_to_long, apilink="pandas.wide_to_long") -@snowpark_pandas_telemetry_standalone_function_decorator -@pandas_module_level_function_not_implemented() -def wide_to_long( - df: DataFrame, stubnames, i, j, sep: str = "", suffix: str = r"\d+" -) -> DataFrame: # noqa: PR01, RT01, D200 - """ - Unpivot a DataFrame from wide to long format. - """ - # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - if not isinstance(df, DataFrame): - raise ValueError(f"can not wide_to_long with instance of type {type(df)}") - # ErrorMessage.default_to_pandas("`wide_to_long`") - return DataFrame( - pandas.wide_to_long(to_pandas(df), stubnames, i, j, sep=sep, suffix=suffix) - ) + >>> pd.to_datetime(['2020-10-25 02:00:00 +0200', '2020-10-25 04:00:00 +0100']) + DatetimeIndex([2020-10-25 02:00:00+02:00, 2020-10-25 04:00:00+01:00], dtype='object', freq=None) + >>> pd.to_datetime(['2020-10-25 02:00:00 +0200', '2020-10-25 04:00:00 +0100'], format="%Y-%m-%d %H:%M:%S %z") + DatetimeIndex([2020-10-25 02:00:00+02:00, 2020-10-25 04:00:00+01:00], dtype='object', freq=None) -def _determine_name(objs: Iterable[BaseQueryCompiler], axis: int | str): - """ - Determine names of index after concatenation along passed axis. + Setting ``utc=True`` makes sure always convert to timezone-aware outputs: - Parameters - ---------- - objs : iterable of QueryCompilers - Objects to concatenate. - axis : int or str - The axis to concatenate along. + - Timezone-naive inputs are *localized* based on the session timezone - Returns - ------- - list with single element - Computed index name, `None` if it could not be determined. + >>> pd.to_datetime(['2018-10-26 12:00', '2018-10-26 13:00'], utc=True) + DatetimeIndex(['2018-10-26 12:00:00+00:00', '2018-10-26 13:00:00+00:00'], dtype='datetime64[ns, UTC]', freq=None) + + - Timezone-aware inputs are *converted* to session timezone + + >>> pd.to_datetime(['2018-10-26 12:00:00 -0530', '2018-10-26 12:00:00 -0500'], + ... 
utc=True) + DatetimeIndex(['2018-10-26 17:30:00+00:00', '2018-10-26 17:00:00+00:00'], dtype='datetime64[ns, UTC]', freq=None) """ # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py - axis = pandas.DataFrame()._get_axis_number(axis) + raise_if_native_pandas_objects(arg) - def get_names(obj): - return obj.columns.names if axis else obj.index.names + if not isinstance(arg, (DataFrame, Series, pd.Index)): + # use pandas.to_datetime to convert local data to datetime + res = pandas.to_datetime( + arg, + errors, + dayfirst, + yearfirst, + utc, + format, + exact, + unit, + infer_datetime_format, + origin, + cache, + ) + if isinstance(res, pandas.Series): + res = pd.Series(res) + elif not is_scalar(res): + res = pd.Index(res) + return res - names = np.array([get_names(obj) for obj in objs]) + # handle modin objs + if unit and unit not in VALID_TO_DATETIME_UNIT: + raise ValueError(f"Unrecognized unit {unit}") - # saving old name, only if index names of all objs are the same - if np.all(names == names[0]): - # we must do this check to avoid this calls `list(str_like_name)` - return list(names[0]) if is_list_like(names[0]) else [names[0]] - else: - return None + if not cache: + WarningMessage.ignored_argument( + operation="to_datetime", + argument="cache", + message="cache parameter is ignored with Snowflake backend, i.e., no caching will be applied", + ) + + return arg._to_datetime( + errors=errors, + dayfirst=dayfirst, + yearfirst=yearfirst, + utc=utc, + format=format, + exact=exact, + unit=unit, + infer_datetime_format=infer_datetime_format, + origin=origin, + ) @snowpark_pandas_telemetry_standalone_function_decorator @@ -2725,359 +2947,159 @@ def bdate_range( weekmask: str | None = None, holidays: ListLike | None = None, inclusive: IntervalClosedType = "both", - **kwargs, -) -> pd.DatetimeIndex: - """ - Return a fixed frequency DatetimeIndex with business day as the default. - - Parameters - ---------- - start : str or datetime-like, default None - Left bound for generating dates. - end : str or datetime-like, default None - Right bound for generating dates. - periods : int, default None - Number of periods to generate. - freq : str, Timedelta, datetime.timedelta, or DateOffset, default 'B' - Frequency strings can have multiples, e.g. '5h'. The default is - business daily ('B'). - tz : str or None - Time zone name for returning localized DatetimeIndex, for example - Asia/Beijing. - normalize : bool, default False - Normalize start/end dates to midnight before generating date range. - name : str, default None - Name of the resulting DatetimeIndex. - weekmask : str or None, default None - Weekmask of valid business days, passed to ``numpy.busdaycalendar``, - only used when custom frequency strings are passed. The default - value None is equivalent to 'Mon Tue Wed Thu Fri'. - holidays : list-like or None, default None - Dates to exclude from the set of valid business days, passed to - ``numpy.busdaycalendar``, only used when custom frequency strings - are passed. - inclusive : {"both", "neither", "left", "right"}, default "both" - Include boundaries; Whether to set each bound as closed or open. - - .. versionadded:: 1.4.0 - **kwargs - For compatibility. Has no effect on the result. - - Returns - ------- - DatetimeIndex - - Notes - ----- - Of the four parameters: ``start``, ``end``, ``periods``, and ``freq``, - exactly three must be specified. Specifying ``freq`` is a requirement - for ``bdate_range``. Use ``date_range`` if specifying ``freq`` is not - desired. 
- - To learn more about the frequency strings, please see `this link - `__. - - Examples - -------- - Note how the two weekend days are skipped in the result. - - >>> pd.bdate_range(start='1/1/2018', end='1/08/2018') # doctest: +NORMALIZE_WHITESPACE - DatetimeIndex(['2018-01-01', '2018-01-02', '2018-01-03', '2018-01-04', - '2018-01-05', '2018-01-08'], - dtype='datetime64[ns]', freq=None) - """ - if freq is None: - msg = "freq must be specified for bdate_range; use date_range instead" - raise TypeError(msg) - - if isinstance(freq, str) and freq.startswith("C"): - ErrorMessage.not_implemented( - "custom frequency is not supported in Snowpark pandas API" - ) - elif holidays or weekmask: - ErrorMessage.not_implemented( - "custom holidays or weekmask are not supported in Snowpark pandas API" - ) - - return date_range( - start=start, - end=end, - periods=periods, - freq=freq, - tz=tz, - normalize=normalize, - name=name, - inclusive=inclusive, - **kwargs, - ) - - -@snowpark_pandas_telemetry_standalone_function_decorator -def qcut( - x: np.ndarray | Series, - q: int | ListLikeOfFloats, - labels: ListLike | bool | None = None, - retbins: bool = False, - precision: int = 3, - duplicates: Literal["raise"] | Literal["drop"] = "raise", -) -> Series: - """ - Quantile-based discretization function. - - Discretize variable into equal-sized buckets based on rank or based - on sample quantiles. - - Parameters - ---------- - x : 1-D ndarray or Series - The data across which to compute buckets. If a Snowpark pandas Series is passed, the computation - is distributed. Otherwise, if a numpy array or list is provided, the computation is performed - client-side instead. - - q : int or list-like of float - Number of quantiles. 10 for deciles, 4 for quartiles, etc. Alternately array of quantiles, - e.g. [0, .25, .5, .75, 1.] for quartiles. - - labels : array or False, default None - Used as labels for the resulting bin. Must be of the same length as the resulting bins. If False, - return only integer indicators of the bins. If True, raise an error. - - ``labels=False`` will run binning computation in Snowflake; other values are not yet supported - in Snowpark pandas. - - retbins : bool, default False - Whether to return the (bins, labels) or not. Can be useful if bins is given as a scalar. - ``retbins=True`` is not yet supported in Snowpark pandas. - - precision : int, optional - The precision at which to store and display the bins labels. - - duplicates : {default 'raise', 'drop'}, optional - If bin edges are not unique, raise ValueError or drop non-uniques. - - Returns - ------- - Series - Since Snowpark pandas does not yet support the ``pd.Categorical`` type, unlike native pandas, the - return value is always a Series. - """ - - kwargs = { - "labels": labels, - "retbins": retbins, - "precision": precision, - "duplicates": duplicates, - } - - # For numpy or list, call to native pandas. - if not isinstance(x, Series): - return pandas.qcut(x, q, **kwargs) - - # Check that labels is supported as in pandas. - if not (labels is None or labels is False or is_list_like(labels)): - raise ValueError( - "Bin labels must either be False, None or passed in as a list-like argument" - ) - - # Carry out check that for the list-like case quantiles are (monotonically) increasing, - # if not the case throw pandas compatible error. - if not isinstance(q, int) and np.all(np.diff(q) < 0): - # Note: Pandas 2.x changed the error message here, using Pandas 2.x behavior here. 
- raise ValueError("left side of interval must be <= right side") - - # remove duplicates (input like [0.5, 0.5] is ok) - q = sorted(list(set(q))) - - if labels is not False: - # Labels require categorical, not yet supported. Use native pandas conversion here to compute result. - ErrorMessage.not_implemented( - "Snowpark pandas API qcut method supports only labels=False, if you need support" - " for labels consider calling pandas.qcut(x.to_pandas(), q, ...)" - ) - - ans = x._qcut(q, retbins, duplicates) - - if isinstance(q, int) and q != 1 and len(ans) == 1: - if duplicates == "raise": - # We issue a count query since if q !=1 and x is a Series/list-like containing - # a single element, an error will be produced ValueError: Bin edges must be unique: array([0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.]). - # You can drop duplicate edges by setting the 'duplicates' kwarg. - # With qcut being an API that requires conversion, we can mimick this behavior here. - - # Produce raising error. - raise ValueError( - f"Bin edges must be unique: {repr(np.array([0.] * q))}.\nYou can drop duplicate edges by setting the 'duplicates' kwarg." - ) - else: - # The result will always be NaN because no unique bin could be found. - return pd.Series([np.nan]) - - return ans - - -@snowpark_pandas_telemetry_standalone_function_decorator -def cut( - x: AnyArrayLike, - bins: int | Sequence[Scalar] | IntervalIndex, - right: bool = True, - labels=None, - retbins: bool = False, - precision: int = 3, - include_lowest: bool = False, - duplicates: str = "raise", - ordered: bool = True, -): + **kwargs, +) -> pd.DatetimeIndex: """ - Bin values into discrete intervals. - - Use `cut` when you need to segment and sort data values into bins. This - function is also useful for going from a continuous variable to a - categorical variable. For example, `cut` could convert ages to groups of - age ranges. Supports binning into an equal number of bins, or a - pre-specified array of bins. + Return a fixed frequency DatetimeIndex with business day as the default. Parameters ---------- - x : array-like - The input array to be binned. Must be 1-dimensional. - bins : int, sequence of scalars - The criteria to bin by. - - * int : Defines the number of equal-width bins in the range of `x`. The - range of `x` is extended by .1% on each side to include the minimum - and maximum values of `x`. - * sequence of scalars : Defines the bin edges allowing for non-uniform - width. No extension of the range of `x` is done. - - right : bool, default True - Indicates whether `bins` includes the rightmost edge or not. If - ``right == True`` (the default), then the `bins` ``[1, 2, 3, 4]`` - indicate (1,2], (2,3], (3,4]. This argument is ignored when - `bins` is an IntervalIndex. - labels : array or False, default None - Specifies the labels for the returned bins. Must be the same length as - the resulting bins. If False, returns only integer indicators of the - bins. This affects the type of the output container (see below). - This argument is ignored when `bins` is an IntervalIndex. If True, - raises an error. When `ordered=False`, labels must be provided. - - Snowpark pandas API does not support labels=None. - Labels must be of a Snowpark pandas API supported dtype. + start : str or datetime-like, default None + Left bound for generating dates. + end : str or datetime-like, default None + Right bound for generating dates. + periods : int, default None + Number of periods to generate. 
+ freq : str, Timedelta, datetime.timedelta, or DateOffset, default 'B' + Frequency strings can have multiples, e.g. '5h'. The default is + business daily ('B'). + tz : str or None + Time zone name for returning localized DatetimeIndex, for example + Asia/Beijing. + normalize : bool, default False + Normalize start/end dates to midnight before generating date range. + name : str, default None + Name of the resulting DatetimeIndex. + weekmask : str or None, default None + Weekmask of valid business days, passed to ``numpy.busdaycalendar``, + only used when custom frequency strings are passed. The default + value None is equivalent to 'Mon Tue Wed Thu Fri'. + holidays : list-like or None, default None + Dates to exclude from the set of valid business days, passed to + ``numpy.busdaycalendar``, only used when custom frequency strings + are passed. + inclusive : {"both", "neither", "left", "right"}, default "both" + Include boundaries; Whether to set each bound as closed or open. - retbins : bool, default False - Snowpark pandas API does not support this parameter yet. - precision : int, default 3 - The precision at which to store and display the bins labels. - include_lowest : bool, default False - Whether the first interval should be left-inclusive or not. - duplicates : {default 'raise', 'drop'}, optional - If bin edges are not unique, raise ValueError or drop non-uniques. - ordered : bool, default True - Whether the labels are ordered or not. Applies to returned types - Categorical and Series (with Categorical dtype). If True, - the resulting categorical will be ordered. If False, the resulting - categorical will be unordered (labels must be provided). + .. versionadded:: 1.4.0 + **kwargs + For compatibility. Has no effect on the result. Returns ------- - out : Categorical, Series, or ndarray - An array-like object representing the respective bin for each value - of `x`. The type depends on the value of `labels`. - - * None (default) : returns a Series for Series `x` or a - Categorical for all other inputs. The values stored within - are Interval dtype. - - * sequence of scalars : returns a Series for Series `x` or a - Categorical for all other inputs. The values stored within - are whatever the type in the sequence is. - - * False : returns an ndarray of integers. - - bins : numpy.ndarray - The computed or specified bins. Only returned when `retbins=True`. - For scalar or sequence `bins`, this is an ndarray with the computed - bins. If set `duplicates=drop`, `bins` will drop non-unique bin. + DatetimeIndex Notes ----- - Any NA values will be NA in the result. Out of bounds values will be NA in - the resulting Series or Categorical object. + Of the four parameters: ``start``, ``end``, ``periods``, and ``freq``, + exactly three must be specified. Specifying ``freq`` is a requirement + for ``bdate_range``. Use ``date_range`` if specifying ``freq`` is not + desired. - Snowpark pandas API does not natively support Categorical and categorical types. When calling `cut` with a - Snowpark pandas Series and using `labels=False`, a Snowpark pandas Series object is returned. However, - for `labels != False` an error is raised. + To learn more about the frequency strings, please see `this link + `__. Examples -------- - Discretize into three equal-sized bins. + Note how the two weekend days are skipped in the result. - >>> pd.cut(np.array([1, 7, 5, 4, 6, 3]), 3, labels=False) - ... 
# doctest: +ELLIPSIS - array([0, 2, 1, 1, 2, 0]) + >>> pd.bdate_range(start='1/1/2018', end='1/08/2018') # doctest: +NORMALIZE_WHITESPACE + DatetimeIndex(['2018-01-01', '2018-01-02', '2018-01-03', '2018-01-04', + '2018-01-05', '2018-01-08'], + dtype='datetime64[ns]', freq=None) + """ + if freq is None: + msg = "freq must be specified for bdate_range; use date_range instead" + raise TypeError(msg) - ``labels=False`` implies you just want the bins back. + if isinstance(freq, str) and freq.startswith("C"): + ErrorMessage.not_implemented( + "custom frequency is not supported in Snowpark pandas API" + ) + elif holidays or weekmask: + ErrorMessage.not_implemented( + "custom holidays or weekmask are not supported in Snowpark pandas API" + ) - >>> pd.cut([0, 1, 1, 2], bins=4, labels=False) - array([0, 1, 1, 3]) + return date_range( + start=start, + end=end, + periods=periods, + freq=freq, + tz=tz, + normalize=normalize, + name=name, + inclusive=inclusive, + **kwargs, + ) - Passing a Series as an input returns a Series with labels=False: - >>> s = pd.Series(np.array([2, 4, 6, 8, 10]), - ... index=['a', 'b', 'c', 'd', 'e']) - >>> pd.cut(s, 3, labels=False) - ... # doctest: +ELLIPSIS - a 0 - b 0 - c 1 - d 2 - e 2 - dtype: int64 +# Adding docstring since pandas docs don't have web section for this function. +@snowpark_pandas_telemetry_standalone_function_decorator +@pandas_module_level_function_not_implemented() +def value_counts( + values, sort=True, ascending=False, normalize=False, bins=None, dropna=True +): """ + Compute a histogram of the counts of non-null values. - if retbins is True: - ErrorMessage.not_implemented("retbins not supported.") + Parameters + ---------- + values : ndarray (1-d) + Values to perform computation. + sort : bool, default: True + Sort by values. + ascending : bool, default: False + Sort in ascending order. + normalize : bool, default: False + If True then compute a relative histogram. + bins : integer, optional + Rather than count values, group them into half-open bins, + convenience for pd.cut, only works with numeric data. + dropna : bool, default: True + Don't include counts of NaN. - # Execute other supported objects via native pandas. - if not isinstance(x, Series): - return pandas.cut( - x, - bins, - right=right, - labels=labels, - retbins=retbins, - precision=precision, - include_lowest=include_lowest, - duplicates=duplicates, - ordered=ordered, - ) + Returns + ------- + Series + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + return Series(values).value_counts( + sort=sort, + ascending=ascending, + normalize=normalize, + bins=bins, + dropna=dropna, + ) - # Produce pandas-compatible error if ordered=False and labels are not specified. - # No error is raised when labels are not desired (labels=False). - if ordered is False and labels is None: - raise ValueError("'labels' must be provided if 'ordered = False'") - bins, qc = x._query_compiler.cut( - bins, - right=right, - labels=labels, - precision=precision, - include_lowest=include_lowest, - duplicates=duplicates, - ) +def _determine_name(objs: Iterable[BaseQueryCompiler], axis: int | str): + """ + Determine names of index after concatenation along passed axis. - # Depending on setting, reconstruct bins and convert qc to the correct result. - if labels is False: - return pd.Series(query_compiler=qc) - else: - # Raise NotImplemented Error as categorical is not supported. 
- ErrorMessage.not_implemented("categorical not supported in Snowpark pandas API") + Parameters + ---------- + objs : iterable of QueryCompilers + Objects to concatenate. + axis : int or str + The axis to concatenate along. - # Following code would produce correct result, uncomment once categorical is supported. - # Convert to pandas categorical and return as Series. - # Note: In the future, once we support CategoricalType we could keep this lazily around. For now, - # match what pandas does here. In the future, change pandas -> pd and everything should work out-of-the box. - # arr = qc.to_numpy().ravel() - # return pandas.Series( - # pandas.Categorical(values=arr, categories=labels, ordered=ordered) - # ) + Returns + ------- + list with single element + Computed index name, `None` if it could not be determined. + """ + # TODO: SNOW-1063345: Modin upgrade - modin.pandas functions in general.py + axis = pandas.DataFrame()._get_axis_number(axis) + + def get_names(obj): + return obj.columns.names if axis else obj.index.names + + names = np.array([get_names(obj) for obj in objs]) + + # saving old name, only if index names of all objs are the same + if np.all(names == names[0]): + # we must do this check to avoid this calls `list(str_like_name)` + return list(names[0]) if is_list_like(names[0]) else [names[0]] + else: + return None
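
To close out the hunk, a hedged sketch covering `bdate_range` and the module-level `value_counts`, which this hunk adds in their new location. The dates and values are made up; the note on `value_counts` is inferred from its `pandas_module_level_function_not_implemented()` decorator.

bdays = pd.bdate_range(start="1/1/2018", end="1/08/2018")  # freq defaults to 'B'; weekend days are skipped
# Custom frequencies ('C...'), weekmask, or holidays raise NotImplementedError on this backend.
# The module-level value_counts is decorated as not implemented, so the supported path is the
# Series method instead:
counts = pd.Series([1, 1, 2]).value_counts()
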