# Image for a Streamlit application that needs Java 8 and Python 3.8
# (PYSPARK_* variables are set for a PySpark driver/worker interpreter).
# Build context must contain: requirements.txt and streamlit.py.
# The container runs as the unprivileged user "jovyan" and serves on port 7860.

# Base image: Ubuntu 18.04
FROM ubuntu:18.04

# User identity used for the runtime account.
# Kept in its own ENV instruction: variables defined in an ENV instruction are
# only visible to substitutions in *later* instructions.
ENV NB_USER=jovyan \
    NB_UID=1000

# Home directory of the runtime user and location of the Java 8 JDK.
ENV HOME=/home/${NB_USER} \
    JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/

# System packages: build tooling, Python 3, graphviz, and the Java 8 toolchain.
# DEBIAN_FRONTEND is set inline (not via ENV) so it does not leak into the
# running container; it prevents debconf prompts from stalling the build.
# The apt package index is removed in the same layer to keep the image small.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        tar \
        wget \
        bash \
        rsync \
        gcc \
        libfreetype6-dev \
        libhdf5-serial-dev \
        libpng-dev \
        libzmq3-dev \
        python3 \
        python3-dev \
        python3-pip \
        unzip \
        pkg-config \
        software-properties-common \
        graphviz \
        openjdk-8-jdk \
        ant \
        ca-certificates-java \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/* \
    && update-ca-certificates -f

# Python 3.8 from the deadsnakes PPA (add-apt-repository comes from
# software-properties-common, installed above).
RUN add-apt-repository ppa:deadsnakes/ppa \
    && apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y python3.8 python3-pip \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Also export JAVA_HOME and its bin directory through /etc/profile.
# The ENV instruction above already covers processes started by Docker;
# /etc/profile is appended to as well, as in the original recipe.
RUN echo "export JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/" >> /etc/profile \
    && echo "export PATH=\$JAVA_HOME/bin:\$PATH" >> /etc/profile

# Create the unprivileged runtime user (with a home directory) and switch to it.
RUN useradd -m -u ${NB_UID} ${NB_USER}
USER ${NB_USER}

# pip runs as the non-root user from here on; put the per-user script
# directory on PATH so the "streamlit" executable named in ENTRYPOINT resolves.
ENV PATH=/home/${NB_USER}/.local/bin:${PATH}

# Make PySpark use Python 3.8 for both driver and workers.
ENV PYSPARK_PYTHON=/usr/bin/python3.8 \
    PYSPARK_DRIVER_PYTHON=/usr/bin/python3.8

# Work from the user's home directory.
WORKDIR ${HOME}

# Upgrade pip for Python 3.8 (no download cache kept in the image).
RUN python3.8 -m pip install --no-cache-dir --upgrade pip

# Install Python dependencies. requirements.txt is copied on its own so this
# layer is only rebuilt when the dependency list changes.
COPY requirements.txt /tmp/requirements.txt
RUN python3.8 -m pip install --no-cache-dir -r /tmp/requirements.txt

# Application script.
COPY streamlit.py /home/jovyan/streamlit.py

# Port Streamlit listens on (must match --server.port below).
EXPOSE 7860

# Start the Streamlit app, listening on all interfaces.
ENTRYPOINT ["streamlit", "run", "/home/jovyan/streamlit.py", "--server.port=7860", "--server.address=0.0.0.0"]