diff --git a/python/pyspark/pandas/generic.py b/python/pyspark/pandas/generic.py index c60097e952..c1009b0c62 100644 --- a/python/pyspark/pandas/generic.py +++ b/python/pyspark/pandas/generic.py @@ -860,6 +860,11 @@ class Frame(object, metaclass=ABCMeta): ) if num_files is not None: + warnings.warn( + "`num_files` has been deprecated and might be removed in a future version. " + "Use `DataFrame.spark.repartition` instead.", + FutureWarning, + ) sdf = sdf.repartition(num_files) builder = sdf.write.mode(mode) @@ -998,6 +1003,11 @@ class Frame(object, metaclass=ABCMeta): sdf = psdf.to_spark(index_col=index_col) # type: ignore if num_files is not None: + warnings.warn( + "`num_files` has been deprecated and might be removed in a future version. " + "Use `DataFrame.spark.repartition` instead.", + FutureWarning, + ) sdf = sdf.repartition(num_files) builder = sdf.write.mode(mode) diff --git a/python/pyspark/pandas/namespace.py b/python/pyspark/pandas/namespace.py index a46926d102..9af91cb48b 100644 --- a/python/pyspark/pandas/namespace.py +++ b/python/pyspark/pandas/namespace.py @@ -39,6 +39,7 @@ from distutils.version import LooseVersion from functools import reduce from io import BytesIO import json +import warnings import numpy as np import pandas as pd @@ -2822,6 +2823,8 @@ def broadcast(obj: DataFrame) -> DataFrame: """ Marks a DataFrame as small enough for use in broadcast joins. + .. deprecated:: 3.2.0 + Use :func:`DataFrame.spark.hint` instead. Parameters ---------- obj : DataFrame @@ -2852,6 +2855,11 @@ def broadcast(obj: DataFrame) -> DataFrame: ...BroadcastHashJoin... ... """ + warnings.warn( + "`broadcast` has been deprecated and might be removed in a future version. " + "Use `DataFrame.spark.hint` with 'broadcast' for `name` parameter instead.", + FutureWarning, + ) if not isinstance(obj, DataFrame): raise TypeError("Invalid type : expected DataFrame got {}".format(type(obj).__name__)) return DataFrame(