# Summary of this patch:
#   * Dockerfile: the InfluxDB yum repo definition is no longer generated by an
#     inline `cat <<EOF | tee` heredoc; a static repo file is COPY'd instead.
#   * Dockerfile: python3-cython is added to the yum package list.
#   * Dockerfile: pip installs pyspark[sql]==2.3.2 and pins pyarrow==0.8.0.
#   * influxdb.centos7.repo: new file with the release/arch hard-coded
#     (rhel/7/x86_64) instead of the \$releasever/\$basearch placeholders.
# NOTE(review): line breaks were restored from a whitespace-collapsed copy.
# Blank context lines are placed according to the hunk line counts; the
# indentation width of continuation lines is assumed (4 spaces) - confirm
# against the repository before applying.
diff --git a/Dockerfile b/Dockerfile
index 7efd40c281dc86a76024579d5540dcf5694636d6..4e4ed064152bbcec8ff66cebd74d42e65383eb34 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -3,16 +3,9 @@ FROM $FROM
 
 ARG SPARK_NXCALS_URL=http://photons-resources.cern.ch/downloads/nxcals_pro/spark/spark-nxcals.zip
 
-RUN cat <<EOF | tee /etc/yum.repos.d/influxdb.repo \
-[influxdb] \
-name = InfluxDB Repository - RHEL \$releasever \
-baseurl = https://repos.influxdata.com/rhel/\$releasever/\$basearch/stable \
-enabled = 1 \
-gpgcheck = 1 \
-gpgkey = https://repos.influxdata.com/influxdb.key \
-EOF
-
-RUN yum update -y && yum install -y python3 python3-pip python3-virtualenv git unzip bsdtar rsync CERN-CA-certs which influxdb && \
+COPY influxdb.centos7.repo /etc/yum.repos.d/influxdb.repo
+
+RUN yum update -y && yum install -y python3 python3-cython python3-pip python3-virtualenv git unzip bsdtar rsync CERN-CA-certs which influxdb && \
     yum clean all
 
 ENV SPARK_HOME=/opt/nxcals-spark
@@ -34,7 +27,7 @@ USER etlworker
 RUN cd $SPARK_HOME && \
     yes | source $SPARK_HOME/source-me.sh && \
     source $SPARK_HOME/nxcals-python3-env/bin/activate && \
-    pip3 list && pip3 install pyspark==2.3.2 pandas scipy influxdb pyarrow
+    pip3 list && pip3 install pyspark[sql]==2.3.2 pandas scipy influxdb pyarrow==0.8.0
 
 RUN source $SPARK_HOME/nxcals-python3-env/bin/activate && \
     pip3 install git+https://gitlab.cern.ch/industrial-controls/services/dash/dash-etl.git@develop
diff --git a/influxdb.centos7.repo b/influxdb.centos7.repo
new file mode 100644
index 0000000000000000000000000000000000000000..e57289e6d25e83bd386822ddd41fa94ed7c8d896
--- /dev/null
+++ b/influxdb.centos7.repo
@@ -0,0 +1,6 @@
+[influxdb]
+name = InfluxDB Repository - RHEL 7
+baseurl = https://repos.influxdata.com/rhel/7/x86_64/stable
+enabled = 1
+gpgcheck = 1
+gpgkey = https://repos.influxdata.com/influxdb.key