-
Notifications
You must be signed in to change notification settings - Fork 20
/
Copy pathDockerfile
125 lines (102 loc) · 4.44 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
# Use Ubuntu 18.04 as the base image
FROM ubuntu:18.04
ARG enable_spark
ARG enable_postgresql
ENV enable_spark=${enable_spark}
ENV enable_postgresql=${enable_postgresql}
# Set environment variables for PostgreSQL
ARG USER_HOME=/home/pilotscope
ENV PG_PATH ${USER_HOME}/pgsql/
ENV PG_DATA ${USER_HOME}/pg_data
ENV CONDA_DIR ${USER_HOME}/miniconda3
ENV LD_LIBRARY_PATH $PG_PATH/lib:$LD_LIBRARY_PATH
ENV JAVA_HOME ${USER_HOME}/jdk1.8.0_202
ENV PATH $JAVA_HOME/bin:$PG_PATH/bin:$CONDA_DIR/bin:$PATH
# Set non-interactive installation
ENV DEBIAN_FRONTEND=noninteractive
SHELL ["/bin/bash", "-c"]
# Install dependencies
RUN apt-get update && apt-get install -y sudo wget git bzip2 vim openssh-server gcc build-essential libreadline-dev zlib1g-dev bison flex gdb libssl-dev libbz2-dev libsqlite3-dev llvm libncurses5-dev libncursesw5-dev xz-utils libffi-dev liblzma-dev
# Create a pilotscope user
RUN echo 'root:root' | chpasswd && \
useradd -m -s /bin/bash pilotscope && \
echo "pilotscope:pilotscope" | chpasswd && \
usermod -aG sudo pilotscope
RUN git config --global http.postBuffer 524288000
# Set ssh
RUN sed -i 's/#PermitRootLogin prohibit-password/PermitRootLogin yes/' /etc/ssh/sshd_config
USER pilotscope
WORKDIR ${USER_HOME}
####### Install PilotScope Core #######
RUN git -c http.sslVerify=false clone --depth 1 --branch master https://github.com/alibaba/pilotscope.git PilotScopeCore
# Install Miniconda
RUN mkdir -p ${CONDA_DIR} && \
wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh -O ${CONDA_DIR}/miniconda.sh && \
bash ${CONDA_DIR}/miniconda.sh -b -u -p ${CONDA_DIR} && \
rm -rf ${CONDA_DIR}/miniconda.sh
RUN conda create --name pilotscope python=3.8
RUN conda init
# Install libraries
RUN source ${CONDA_DIR}/bin/activate pilotscope && \
cd ./PilotScopeCore && \
pip install -e . -i https://mirrors.aliyun.com/pypi/simple/ && \
pip install -e '.[dev]' -i https://mirrors.aliyun.com/pypi/simple/
####### Install PostgreSQL #######
RUN if [ "$enable_postgresql" = "true" ]; then \
git -c http.sslVerify=false clone --depth 1 --branch pilotscope-postgresql https://github.com/alibaba/pilotscope.git PilotScopePostgreSQL && \
cd ./PilotScopePostgreSQL && \
./configure --prefix=$PG_PATH --enable-depend --enable-cassert --enable-debug CFLAGS="-ggdb -O0" && \
make && make install && \
sh install_extension.sh && \
make && make install ; \
fi
RUN if [ "$enable_postgresql" = "true" ]; then \
# Initialize the database
${PG_PATH}/bin/initdb -D $PG_DATA && \
# Configure PostgreSQL to allow connections
echo "listen_addresses = '*'" >> $PG_DATA/postgresql.conf && \
echo "host all all all md5" >> $PG_DATA/pg_hba.conf && \
echo "shared_preload_libraries = 'pg_hint_plan'" >> $PG_DATA/postgresql.conf && \
${PG_PATH}/bin/pg_ctl start -D $PG_DATA && \
${PG_PATH}/bin/psql -d template1 -c "create database pilotscope;" && \
${PG_PATH}/bin/psql -c "ALTER USER pilotscope PASSWORD 'pilotscope';" \
; else \
echo "PostgreSQL installation skipped"; \
fi
######## Install Spark #######
RUN if [ "$enable_spark" = "true" ]; then \
# Download and install PilotScope patch for Spark
git -c http.sslVerify=false clone --depth 1 --branch pilotscope-spark https://github.com/alibaba/pilotscope.git PilotScopeSpark && \
cd ./PilotScopeSpark && \
# Download Spark
wget https://archive.apache.org/dist/spark/spark-3.3.2/spark-3.3.2.tgz && \
tar -xzvf spark-3.3.2.tgz && \
rm spark-3.3.2.tgz; \
fi
RUN if [ "$enable_spark" = "true" ]; then \
# Apply patch
cd ./PilotScopeSpark && \
git config --global user.email "[email protected]" && \
git config --global user.name "pilotscope" && \
bash apply_patch.sh /pilotscope_spark.patch; \
fi
RUN if [ "$enable_spark" = "true" ]; then \
# Install JDK
wget https://github.com/WoodyBryant/JDK/releases/download/v2/jdk-8u202-linux-x64.tar.gz && \
tar -xzf jdk-8u202-linux-x64.tar.gz -C ${USER_HOME} && \
rm jdk-8u202-linux-x64.tar.gz; \
fi
RUN if [ "$enable_spark" = "true" ]; then \
# Compile Spark
cd ./PilotScopeSpark/spark-3.3.2 && \
./build/mvn -DskipTests clean package;\
fi
RUN if [ "$enable_spark" = "true" ]; then \
# Install PySpark
cd ./PilotScopeSpark/spark-3.3.2/python && \
source ${CONDA_DIR}/bin/activate pilotscope && \
python setup.py install \
; else \
echo "Spark installation skipped"; \
fi
CMD ["/bin/bash"]