Skip to content

Commit f4b504a

Browse files
committed
Add Docker build and push workflows, and update README and deployment configurations
1 parent 86657ee commit f4b504a

File tree

6 files changed

+51
-12
lines changed

6 files changed

+51
-12
lines changed

.github/workflows/build-docker.yml

Lines changed: 36 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,36 @@
1+
name: Build Docker
2+
3+
on:
4+
push:
5+
branches:
6+
- master
7+
pull_request:
8+
paths:
9+
- 'docker/**'
10+
jobs:
11+
build:
12+
runs-on: ubuntu-latest
13+
steps:
14+
- uses: actions/checkout@v3
15+
16+
- name: Log in to Docker Hub
17+
uses: docker/login-action@v1
18+
with:
19+
username: ${{ secrets.DOCKERHUB_USERNAME }}
20+
password: ${{ secrets.DOCKERHUB_PASSWORD }}
21+
22+
- name: Docker Build & Push
23+
run: |
24+
timestamp=$(date +"%Y%m%d%H%M%S")
25+
26+
docker build -t ${{ secrets.DOCKERHUB_USERNAME }}/all-spark-notebook:$timestamp -f docker/jupyter-notebook/Dockerfile.notebook ./docker/jupyter-notebook
27+
docker tag ${{ secrets.DOCKERHUB_USERNAME }}/all-spark-notebook:$timestamp ${{ secrets.DOCKERHUB_USERNAME }}/all-spark-notebook:latest
28+
29+
docker push ${{ secrets.DOCKERHUB_USERNAME }}/all-spark-notebook:$timestamp
30+
docker push ${{ secrets.DOCKERHUB_USERNAME }}/all-spark-notebook:latest
31+
32+
docker build -t ${{ secrets.DOCKERHUB_USERNAME }}/spark-history-server:$timestamp -f docker/spark-history-server/Dockerfile ./docker/spark-history-server
33+
docker tag ${{ secrets.DOCKERHUB_USERNAME }}/spark-history-server:$timestamp ${{ secrets.DOCKERHUB_USERNAME }}/spark-history-server:latest
34+
35+
docker push ${{ secrets.DOCKERHUB_USERNAME }}/spark-history-server:$timestamp
36+
docker push ${{ secrets.DOCKERHUB_USERNAME }}/spark-history-server:latest

.github/workflows/build-deploy-examples.yml renamed to .github/workflows/build-examples.yml

Lines changed: 1 addition & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
name: Build & Deploy Examples
1+
name: Build Examples
22

33
# Controls when the workflow will run
44
on:
@@ -54,13 +54,4 @@ jobs:
5454
docker build -t ${{ secrets.DOCKERHUB_USERNAME }}/word-count:$VERSION_WITH_TIMESTAMP --build-arg VERSION=$VERSION .
5555
docker push ${{ secrets.DOCKERHUB_USERNAME }}/word-count:$VERSION_WITH_TIMESTAMP
5656
57-
deploy-examples:
58-
needs: build-examples
59-
runs-on: ubuntu-latest
60-
if: ${{ github.event.inputs.deploy-example != 'None' }}
61-
62-
steps:
63-
- name: Deploy to GKE
64-
run: |
65-
echo "Deploy ${{ github.event.inputs.deploy-example }} to GKE!"
6657

README.md

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,9 +7,21 @@
77
<img alt="GitHub License" src="https://img.shields.io/github/license/xuwenyihust/Data-Platform?link=https%3A%2F%2Fgithub.com%2Fxuwenyihust%2FData-Platform%2Fblob%2Fmain%2FLICENSE">
88
</p>
99

10+
> ⚠️ Currently in Development: Expect breaking changes and bugs!
11+
1012
## Overview
1113
A big data platform for data processing and machine learning based on Kubernetes and Spark.
1214

15+
## Features
16+
- Spark Application Deployment
17+
- Jar Application Submission
18+
- PySpark Application Submission
19+
- Jupyter Notebook
20+
- Customized Integration with PySpark
21+
- Monitoring
22+
- Spark UI
23+
- History Server
24+
1325
## Supported Versions
1426
- Spark: 3.5.0
1527
- Scala: 2.12

helm/data-platform/templates/notebook-deployment.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ spec:
1515
serviceAccountName: spark
1616
containers:
1717
- name: notebook
18-
image: wenyixu101/all-spark-notebook:spark-3.5.0_26
18+
image: wenyixu101/all-spark-notebook:latest
1919
imagePullPolicy: Always
2020
command: ["/bin/bash", "-c", "start-notebook.sh"]
2121
ports:

helm/data-platform/templates/spark-history-server-deployment.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ spec:
1414
spec:
1515
containers:
1616
- name: spark-history-server
17-
image: wenyixu101/spark-history-server:3.5.0
17+
image: wenyixu101/spark-history-server:latest
1818
command: ["/bin/sh", "-c"]
1919
args: ["/opt/spark/bin/spark-class org.apache.spark.deploy.history.HistoryServer"]
2020
env:

0 commit comments

Comments
 (0)