diff --git a/python/tests/stats/test_dbscan.py b/python/tests/stats/test_dbscan.py index 70f236291d..f387ee8a9c 100644 --- a/python/tests/stats/test_dbscan.py +++ b/python/tests/stats/test_dbscan.py @@ -93,6 +93,8 @@ def test_dbscan_valid_parameters(self): self.spark.conf.set( "sedona.join.autoBroadcastJoinThreshold", -1 ) + self.spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1) + df = self.create_sample_dataframe() for epsilon in [0.6, 0.7, 0.8]: for min_pts in [3, 4, 5]: @@ -105,6 +107,8 @@ def test_dbscan_valid_parameters_default_column_name(self): self.spark.conf.set( "sedona.join.autoBroadcastJoinThreshold", -1 ) + self.spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1) + df = self.create_sample_dataframe().select( "id", f.col("arealandmark").alias("geometryFieldName") ) @@ -120,6 +124,8 @@ def test_dbscan_valid_parameters_polygons(self): self.spark.conf.set( "sedona.join.autoBroadcastJoinThreshold", -1 ) + self.spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1) + df = self.create_sample_dataframe().select( "id", ST_Buffer(f.col("arealandmark"), 0.000001).alias("geometryFieldName") ) @@ -135,6 +141,8 @@ def test_dbscan_supports_other_distance_function(self): self.spark.conf.set( "sedona.join.autoBroadcastJoinThreshold", -1 ) + self.spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1) + df = self.create_sample_dataframe().select( "id", ST_Buffer(f.col("arealandmark"), 0.000001).alias("geometryFieldName") ) @@ -181,6 +189,8 @@ def test_return_empty_df_when_no_clusters(self): self.spark.conf.set( "sedona.join.autoBroadcastJoinThreshold", -1 ) + self.spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1) + df = self.create_sample_dataframe() epsilon = 0.1 min_pts = 10000 @@ -197,6 +207,8 @@ def test_dbscan_doesnt_duplicate_border_points_in_two_clusters(self): self.spark.conf.set( "sedona.join.autoBroadcastJoinThreshold", -1 ) + self.spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1) + input_df = self.spark.createDataFrame( [ {"id": 10, "x": 1.0, "y": 1.8}, @@ -222,6 +234,8 @@ def test_return_outliers_false_doesnt_return_outliers(self): self.spark.conf.set( "sedona.join.autoBroadcastJoinThreshold", -1 ) + self.spark.conf.set("spark.sql.autoBroadcastJoinThreshold", -1) + df = self.create_sample_dataframe() for epsilon in [0.6, 0.7, 0.8]: for min_pts in [3, 4, 5]: