nixpkgs/pkgs/applications/networking/cluster/spark/default.nix

73 lines
2.2 KiB
Nix
Raw Normal View History

2015-12-26 18:29:08 +01:00
# Apache Spark, installed from the upstream "-bin-" release tarball.
#
# Arguments:
#   version       - must be one of the keys of `versionMap` below; it selects
#                   the tarball's Hadoop flavour and its expected sha256.
#   RSupport      - when true, R is added to the inputs and spark-env.sh
#                   exports SPARKR_R_SHELL and appends R's bin directory to PATH.
#   mesosSupport  - when true, mesos is added to the inputs and spark-env.sh
#                   exports MESOS_NATIVE_LIBRARY.
{ stdenv, fetchzip, makeWrapper, jre, pythonPackages
, RSupport ? true, R
, mesosSupport ? true, mesos
, version
}:

let
  # Per-version data: the Hadoop suffix used in the tarball name and the
  # hash handed to fetchzip.
  versionMap = {
    "1.6.3" = {
      hadoopVersion = "cdh4";
      sparkSha256 = "00il083cjb9xqzsma2ifphq9ggichwndrj6skh2z5z9jk3z0lgyn";
    };
    "2.1.0" = {
      hadoopVersion = "hadoop2.4";
      sparkSha256 = "0pbsmbjwijsfgbnm56kgwnmnlqkz3w010ma0d7vzlkdklj40vqn2";
    };
  };
in

# Brings `hadoopVersion` and `sparkSha256` of the selected version into scope.
with versionMap.${version};

with stdenv.lib;

stdenv.mkDerivation rec {
  name = "spark-${version}";

  src = fetchzip {
    url = "mirror://apache/spark/${name}/${name}-bin-${hadoopVersion}.tgz";
    sha256 = sparkSha256;
  };

  # makeWrapper is only needed while building, so it is a native input.
  nativeBuildInputs = [ makeWrapper ];

  buildInputs = [ jre pythonPackages.python pythonPackages.numpy ]
    ++ optional RSupport R
    ++ optional mesosSupport mesos;

  # Directory name under $out/lib that holds the unpacked distribution.
  untarDir = "${name}-bin-${hadoopVersion}";

  installPhase = ''
    mkdir -p $out/{lib/${untarDir}/conf,bin,share/java}
    mv * $out/lib/${untarDir}

    # Default log4j configuration: the shipped template with the console
    # level lowered from INFO to WARN.
    sed -e 's/INFO, console/WARN, console/' < \
      $out/lib/${untarDir}/conf/log4j.properties.template > \
      $out/lib/${untarDir}/conf/log4j.properties

    # The heredoc delimiter is unquoted, so plain $VAR references are expanded
    # now (at build time) and only \$VAR survives as a reference that is
    # resolved when spark-env.sh is sourced.
    # NOTE(review): the build-time $PYTHONPATH and $MESOS_NATIVE_LIBRARY are
    # presumably set by the python/numpy and mesos inputs - confirm.
    cat > $out/lib/${untarDir}/conf/spark-env.sh <<- EOF
    export JAVA_HOME="${jre}"
    export SPARK_HOME="$out/lib/${untarDir}"
    export PYSPARK_PYTHON="${pythonPackages.python}/bin/${pythonPackages.python.executable}"
    export PYTHONPATH="\$PYTHONPATH:$PYTHONPATH"
    ${optionalString RSupport ''
      export SPARKR_R_SHELL="${R}/bin/R"
      export PATH="\$PATH:${R}/bin"''}
    ${optionalString mesosSupport ''
      export MESOS_NATIVE_LIBRARY="$MESOS_NATIVE_LIBRARY"''}
    EOF

    # Wrap every extension-less file in the distribution's bin/ into $out/bin.
    for n in $(find $out/lib/${untarDir}/bin -type f ! -name "*.*"); do
      makeWrapper "$n" "$out/bin/$(basename $n)"
    done

    # Link the assembly jar only if one exists: an unmatched glob is passed on
    # literally and would otherwise produce a dangling symlink.
    for jar in $out/lib/${untarDir}/lib/spark-assembly-*.jar; do
      if [ -e "$jar" ]; then
        ln -s "$jar" $out/share/java
      fi
    done
  '';

  meta = {
    description = "Apache Spark is a fast and general engine for large-scale data processing";
    homepage = "http://spark.apache.org";
    license = stdenv.lib.licenses.asl20;
    platforms = stdenv.lib.platforms.all;
    maintainers = with maintainers; [ thoughtpolice offline ];
    # Quoted: bare URL literals are deprecated Nix syntax.
    repositories.git = "git://git.apache.org/spark.git";
  };
}