{
  lib,
  buildPythonPackage,
  fetchPypi,
  py4j,
}:

# Python package definition for pyspark, built from the release that
# fetchPypi retrieves for the pname/version declared below.
buildPythonPackage rec {
  pname = "pyspark";
  version = "3.2.0";

  src = fetchPypi {
    inherit pname version;
    sha256 = "bfea06179edbfb4bc76a0f470bd3c38e12f00e1023e3ad0373558d07cff102ab";
  };

  # Two edits to setup.py before building:
  #  1. Strip the 'pypandoc' entry. pypandoc is broken with pandoc2, so the
  #     docs it would generate are simply given up.
  #  2. Replace the exact py4j==0.10.9.2 pin with the range >=0.10.9,<0.11 so
  #     the py4j passed in as an argument can satisfy the requirement.
  postPatch = ''
    sed -i "s/'pypandoc'//" setup.py

    substituteInPlace setup.py \
    --replace py4j==0.10.9.2 'py4j>=0.10.9,<0.11'
  '';

  propagatedBuildInputs = [ py4j ];

  # The upstream tests assume a running Spark instance, so they are not run.
  doCheck = false;

  # With the tests disabled, at least confirm the top-level module imports.
  pythonImportsCheck = [ "pyspark" ];

  meta = {
    description = "Python bindings for Apache Spark";
    homepage = "https://github.com/apache/spark/tree/master/python";
    license = lib.licenses.asl20;
    maintainers = [ lib.maintainers.shlevy ];
  };
}