Skip to content

Commit

Permalink
Merge pull request #272 from moj-analytical-services/dbrix_fix
Browse files: browse the repository at this point in the history
possible fix for databricks issue
  • Loading branch information
mamonu authored Feb 4, 2022
2 parents eb72e8a + b95902e commit 563473c
Show file tree
Hide file tree
Showing 2 changed files with 8 additions and 2 deletions.
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
[tool.poetry]
name = "splink"
-version = "2.1.4"
+version = "2.1.5"
description = "Implementation of Fellegi-Sunter's canonical model of record linkage in Apache Spark, including EM algorithm to estimate parameters"
authors = ["Robin Linacre <[email protected]>", "Sam Lindsay", "Theodore Manassis"]
license = "MIT"
Expand Down
8 changes: 7 additions & 1 deletion splink/cluster.py
Original file line number Diff line number Diff line change
Expand Up @@ -82,9 +82,15 @@ def _check_graphframes_installation(spark):
if key in config_keys:
if "graphframes" in value:
graphframe_jar_registered = True

databricks_backend = False
for key, value in all_config:
if "databricks" in key:
databricks_backend = True

if not graphframe_jar_registered:
raise Exception(graphframes_jar_missing_message)
if not databricks_backend:
raise Exception(graphframes_jar_missing_message)

from pyspark.sql import Row

Expand Down

0 comments on commit 563473c

Please sign in to comment.