Merge pull request #23 from luoziqing99/milestone6

Merge milestone6 to main
luoziqing99 · Dec 12, 2023 · 1030790 · 1030790
2 parents 39f99ff + 42b6acd
commit 1030790
Show file tree

Hide file tree

Showing 119 changed files with 11,172 additions and 1 deletion.
diff --git a/.dvc/.gitignore b/.dvc/.gitignore
@@ -0,0 +1,3 @@
+/config.local
+/tmp
+/cache
diff --git a/.dvc/config b/.dvc/config
@@ -0,0 +1,4 @@
+[core]
+    remote = gcs
+['remote "gcs"']
+    url = gs://ac215-sciencetutor/dvc
diff --git a/.dvcignore b/.dvcignore
@@ -0,0 +1,3 @@
+# Add patterns of files dvc should ignore, which could improve
+# the performance. Learn more at
+# https://dvc.org/doc/user-guide/dvcignore
diff --git a/.github/workflows/ci-cd.yml b/.github/workflows/ci-cd.yml
@@ -0,0 +1,51 @@
+# CI/CD workflow: on pushes to the listed branches, builds the app deployment
+# container and, when requested in the commit message, runs the deployment.
+name: Continuous Integration and Continuous Deployment
+run-name: ${{ github.actor }} submitted a CI CD Action
+on:
+  push:
+    branches: [ "main", "milestone6", "milestone6-yp"]
+
+jobs:
+  Explore-GitHub-Actions:
+    # Only run when the head commit message contains a '/run-' command.
+    if: contains(github.event.head_commit.message, '/run-')
+    runs-on: ubuntu-latest
+    steps:
+      # Pass the commit message through an environment variable instead of
+      # expanding it inside the script: the message is free-form text written
+      # by the committer, and inline expansion would let it inject shell code.
+      - run: echo "Comment $COMMIT_MESSAGE"
+        env:
+          COMMIT_MESSAGE: ${{ github.event.head_commit.message }}
+      - run: echo "Job was automatically triggered by a ${{ github.event_name }} event."
+      - run: echo "Job is now running on a ${{ runner.os }} server hosted by GitHub!"
+      - run: echo "Branch is ${{ github.ref }} and your repository is ${{ github.repository }}."
+      - name: Check out repository code
+        uses: actions/checkout@v4
+      # Authenticate to Google Cloud with the key stored in repository secrets.
+      - id: 'auth'
+        uses: google-github-actions/auth@v1
+        with:
+          credentials_json: '${{ secrets.GOOGLE_APPLICATION_CREDENTIALS }}'
+      - name: Configure Google Cloud SDK
+        uses: google-github-actions/setup-gcloud@v1
+      - name: Configure Docker Client
+        run: |-
+          gcloud auth configure-docker # --quiet #authenticate to gcr
+      - run: echo "💡 The ${{ github.repository }} repository has been cloned to the runner."
+      - run: echo "🖥️ The workflow is now ready to test your code on the runner."
+      - name: List files in the repository
+        run: |
+          ls ${{ github.workspace }}
+      - name: Build App Deploy Container
+        run: |-
+          cd ${{ github.workspace }}/src/app_deploy/
+          docker build -t app_deployment --platform=linux/amd64 -f Dockerfile .
+      # Deploy only when the commit message asks for it with '/run-deploy-app'.
+      # The container gets the Docker socket, the SSH directory, the frontend
+      # and api-service sources, the workspace, and the credentials file.
+      # NOTE(review): $GOOGLE_APPLICATION_CREDENTIALS is presumably exported by
+      # the 'auth' step above -- confirm.
+      - name: Run Deploy App
+        if: contains(github.event.head_commit.message, '/run-deploy-app')
+        run: |-
+          docker run --rm --name app_deployment \
+            -v /var/run/docker.sock:/var/run/docker.sock \
+            -v $HOME/.ssh:/home/app/.ssh \
+            -v ${{ github.workspace }}/src/frontend:/frontend-react \
+            -v ${{ github.workspace }}/src/api-service:/api-service \
+            --volume $GITHUB_WORKSPACE:/workspace \
+            --mount type=bind,source=$GOOGLE_APPLICATION_CREDENTIALS,target=/secrets/deployment.json \
+            --env GOOGLE_APPLICATION_CREDENTIALS=/secrets/deployment.json \
+            -e USE_GKE_GCLOUD_AUTH_PLUGIN=True \
+            -e GCP_PROJECT=ac215project-398401 \
+            -e GCP_ZONE=us-west3-b \
+            app_deployment ./deploy-app.sh
+      - run: echo "Job's status is ${{ job.status }}."
diff --git a/.gitignore b/.gitignore
@@ -127,3 +127,18 @@ dmypy.json
 
 # Pyre type checker
 .pyre/
+
+src/data_processing/ScienceQA
+src/data_processing/ScienceQA-LLAVA
+# GCS creds
+src/data_processing/*.json
+.idea
+
+# DS_Store files
+*.DS_Store
+.vscode
+scienceqa-*.json*
+
+**/text-generation-webui
+
+src/api-service/api/LLaVA
diff --git a/README.md b/README.md
@@ -1 +1,305 @@
-# AC215_ScienceTutor
+# AC215 - ScienceTutor: An Educational Application For Children
+
+### Presentation Video
+* https://drive.google.com/file/d/1y41Zua5000fInmUBlQKhANr39Wn5bQJf/view?usp=sharing
+
+### Blog Post Link
+* https://medium.com/@lsjnancy/94a5af6b1b74
+
+------------
+
+## Project Organization
+```
+.
+├── .github
+│   └── workflows
+│       └── ci-cd.yml
+├── LICENSE
+├── README.md
+├── notebooks
+│   └── AC215_milestone3_model_training.ipynb
+├── pictures
+│   ├── apidoc.png
+│   ├── chatbot-v2.png
+│   ├── chatbot.png
+│   ├── compute_engine.png
+│   ├── gcs_model_bucket.png
+│   ├── k8s-v2.jpg
+│   ├── k8s.png
+│   ├── ml_workflow.png
+│   ├── ml_workflow_pipeline_run.png
+│   ├── postman.png
+│   ├── science_tutor_app_pipeline.png
+│   ├── science_tutor_app_pipeline2.png
+│   ├── ScienceQA1.png
+│   ├── ScienceQA2.png
+│   ├── solution_architecture.png
+│   ├── technical_architecture.png
+│   ├── vertex_ai_model_training.png
+│   ├── wandb_system.png
+│   ├── wandb_train.png
+│   └── web_server_demo.png
+├── presentations
+│   ├── AC215-final-presentation.mp4
+│   ├── AC215-final-presentation.pdf
+│   ├── AC215-midterm-demo.mp4
+│   └── AC215-midterm.pdf
+├── references
+│   ├── Learn to Explain-Multimodal Reasoning via ThoughtChainsforScienceQuestion Answering.pdf
+│   ├── Visual Instruction Tuning.pdf
+│   ├── Visual_Questions_Answering_Developments_Applications_Datasets_and_Opportunities_A_State-of-the-Art_Survey.pdf
+│   └── VQA-Visual Question Answering.pdf
+├── reports
+│   ├── milestone2.md
+│   ├── milestone3.md
+│   ├── milestone4.md
+│   └── milestone5.md
+└── src
+    ├── api-service                 <-- Code for app backend APIs
+    │   ├── Dockerfile
+    │   ├── api
+    │   │   └── model_backend.py
+    │   ├── docker-shell.sh
+    │   └── requirements.txt
+    ├── app_deploy                  <-- Code for app deployment to GCP
+    │   ├── Dockerfile
+    │   ├── deploy-create-instance.yml
+    │   ├── deploy-docker-images.yml
+    │   ├── deploy-k8s-cluster.yml
+    │   ├── deploy-provision-instance.yml
+    │   ├── deploy-setup-containers.yml
+    │   ├── deploy-setup-webserver.yml
+    │   ├── update-k8s-cluster.yml
+    │   ├── deploy-app-init.sh
+    │   ├── deploy-app.sh
+    │   ├── docker-entrypoint.sh
+    │   ├── docker-shell.sh
+    │   ├── update-deploy-app.sh
+    │   ├── inventory.yml
+    │   ├── inventory-prod.yml
+    │   └── nginx-conf
+    │       └── nginx
+    │           └── nginx.conf
+    ├── data_processing             <-- Code for data processing
+    │   ├── Dockerfile
+    │   ├── ScienceQA-LLAVA.dvc
+    │   ├── convert_scienceqa_to_llava.py
+    │   ├── docker-shell.sh
+    │   ├── requirements.txt
+    │   ├── upload_to_gcs.py
+    │   ├── upload_to_hf.py
+    │   └── utils.py
+    ├── frontend                    <-- Code for app frontend
+    │   ├── Dockerfile
+    │   ├── Dockerfile.dev
+    │   ├── docker-shell.sh
+    │   ├── index.html
+    │   ├── node_modules
+    │   ├── package-lock.json
+    │   ├── package.json
+    │   ├── public
+    │   │   ├── send.png
+    │   │   ├── student.png
+    │   │   └── teacher.png
+    │   ├── src
+    │   │   ├── App.css
+    │   │   ├── App.jsx
+    │   │   ├── index.css
+    │   │   └── main.jsx
+    │   └── vite.config.js
+    ├── ml_workflow                 <-- Scripts for automating data processing and modeling
+    │   ├── Dockerfile
+    │   ├── Pipfile
+    │   ├── Pipfile.lock
+    │   ├── cli.py
+    │   ├── docker-entrypoint.sh
+    │   ├── docker-shell.sh
+    │   ├── model.py
+    │   ├── model_training.yaml
+    │   └── pipeline.yaml
+    ├── model_deploy                <-- Model deployment
+    │   ├── Dockerfile
+    │   ├── api_example
+    │   │   ├── req.json
+    │   │   └── websocket_streaming.py
+    │   ├── docker-shell.sh
+    │   └── failed_vertex_ai_script.py
+    ├── model_inference             <-- Model inference
+    │   ├── compute_metric.py
+    │   └── model_vqa_science.py
+    └── model_training              <-- Model training
+        ├── Dockerfile
+        ├── Pipfile
+        ├── Pipfile.lock
+        ├── cli.sh
+        ├── docker-entrypoint.sh
+        ├── docker-shell.sh
+        ├── download_from_gcs.py
+        ├── download_from_hf.py
+        ├── package
+        │   ├── PKG-INFO
+        │   ├── setup.cfg
+        │   ├── setup.py
+        │   └── trainer
+        │       ├── __init__.py
+        │       ├── task.py
+        │       └── wandb_api.py
+        ├── package-trainer.sh
+        ├── trainer-yp.tar.gz
+        ├── upload_model_to_gcs.py
+        └── upload_trainer_to_gcs.py
+```
+------------
+
+## AC215 - Final Project
+
+**Team Members** Sijia (Nancy) Li, Ziqing Luo, Yuqing Pan, Jiashu Xu, Xiaohan Zhao
+
+**Group Name** Science Tutor
+
+**Project - Problem Definition** In this project we aim to develop an educational application that provides instant and expert answers to science questions that children have in different domains such as natural, social and language science.
+
+### Data Description
+------------
+We will use [ScienceQA](https://scienceqa.github.io/#dataset), which is a public dataset that consists of ~21k multimodal multiple choice questions covering a diverse set of science topics (3 subjects, 26 topics, 127 categories, and 379 skills), as shown below. The dataset is available at [Hugging Face](https://huggingface.co/datasets/derek-thomas/ScienceQA). 
+
+#### Visual Question Answering:
+<img width="1362" alt="image" src="pictures/ScienceQA1.png">
+
+#### ScienceQA Topics:
+<img width="1362" alt="image" src="pictures/ScienceQA2.png">
+
+We train on the training subset of ScienceQA, which consists of 12,726 instances. After training, we evaluate our model on the test set of 4,241 instances. To ease development, we have also preprocessed and uploaded the reformatted dataset (LLaVA format) to:
+* Hugging Face: [cnut1648/ScienceQA-LLAVA](https://huggingface.co/datasets/cnut1648/ScienceQA-LLAVA/)
+* GCS: [gs://ac215-sciencetutor/ScienceQA-LLAVA](gs://ac215-sciencetutor/ScienceQA-LLAVA)
+
+In addition, ScienceQA contains the following data attributes:
+* **Question (and optionally image)** contains the actual science-related question
+* **Choices** are the possible choices
+* **Answer** is the integer index of the ground truth choice
+* **Subject, topic, category** contains the domain of the question
+* **Lecture** contains the context in which the question appears. We do not end up using this column because in practice, users might not give such detailed information. Our design goal is to train a model that can solve the question without accessing this information.
+
+We use DVC to version control two versions of the ScienceQA dataset, one for the original version which is multi-choice, another for the reformatted version where multi-choice is formatted as prompts and responses. 
+
+
+### Proposed Solution
+------------
+After building a robust ML pipeline in our previous milestone, we have built a back-end API service using Flask and a front-end web app using React. This is our user-facing application, which ties together the various components built in previous milestones.
+
+Here are our Solution Architecture and Technical Architecture to ensure all our components work together.
+
+#### Solution Architecture
+<img width="1362" alt="image" src="pictures/solution_architecture.png">
+
+#### Technical Architecture
+<img width="1362" alt="image" src="pictures/technical_architecture.png">
+
+#### ScienceTutor App
+A user-friendly React app was built to interact with the Science Tutor chatbot in the web browser using the LLaVA-7b model finetuned on ScienceQA. Using the app, a user can type a question, optionally upload an image, and send the message to the chatbot. The app sends the text and the image (if one is uploaded) to the backend API to get the model's answer to the given question (and image). Once the app receives the response from the backend API, it replies to the user in the chat.
+
+Here is a screenshot of our app:
+<img width="1362" alt="image" src="pictures/chatbot-v2.png">
+
+
+#### Kubernetes Deployment
+We deployed our frontend and backend to a Kubernetes cluster to take care of load balancing and failover. We used Ansible scripts to manage creating and updating the k8s cluster. Ansible lets us manage our app infrastructure as code and keep track of it in GitHub. It helps us set up deployments in a highly automated way.
+
+Here is our deployed app on a K8s cluster in GCP:
+
+<img width="1362" alt="image" src="pictures/k8s-v2.jpg">
+
+
+### Code Structure
+------------
+The following are the folders from the previous milestones:
+```
+- data_processing
+- model_training
+- model_inference
+- model_deploy
+- ml_workflow
+- api-service
+- frontend
+- app_deploy
+```
+
+#### API Service Container
+
+This container has the python file `api/model_backend.py` to run and expose the backend apis.
+
+To run the container locally:
+* Open a terminal and go to `src/api-service`
+* Run `sh docker-shell.sh`
+* The backend server is launched at `http://localhost:5000/` and `http://127.0.0.1:5000`
+* Go to `http://127.0.0.1:5000/chat` to interact with the endpoint
+* Go to `http://127.0.0.1:5000/apidocs` to view the APIs
+
+#### Frontend Container
+This container contains all the files to develop and build a react app. There are dockerfiles for both development and production. 
+
+To run the container locally:
+* Open a terminal and go to `src/frontend`
+* Run `sh docker-shell.sh`
+* Once inside the docker container, run `npm install`
+* Once the dependencies are installed, run `npm start`
+* Go to `http://localhost:8080` to access the app locally
+
+#### Deployment Container
+This container helps manage building and deploying all our app containers. This can be achieved with Ansible, with or without Kubernetes.
+
+To run the container locally:
+* Open a terminal and go to the location `AC215_ScienceTutor/src/app_deploy`
+* Run `sh docker-shell.sh`
+
+**Deploy with Ansible and Kubernetes**
+
+* Build and Push Docker Containers to GCR (Google Container Registry)
+```
+ansible-playbook deploy-docker-images.yml -i inventory.yml
+```
+
+* Create and Deploy Cluster
+```
+ansible-playbook deploy-k8s-cluster.yml -i inventory.yml --extra-vars cluster_state=present
+```
+Once the command runs go to `http://<YOUR INGRESS IP>.sslip.io`
+
+**Deploy with Ansible**
+
+* Build and Push Docker Containers to GCR
+```
+ansible-playbook deploy-docker-images.yml -i inventory.yml
+```
+
+* Create Compute Instance (VM) Server in GCP
+```
+ansible-playbook deploy-create-instance.yml -i inventory.yml --extra-vars cluster_state=present
+```
+
+* Provision Compute Instance in GCP
+Install and setup all the required things for deployment.
+```
+ansible-playbook deploy-provision-instance.yml -i inventory.yml
+```
+
+* Setup Docker Containers in the Compute Instance
+```
+ansible-playbook deploy-setup-containers.yml -i inventory.yml
+```
+
+* Setup Webserver on the Compute Instance
+```
+ansible-playbook deploy-setup-webserver.yml -i inventory.yml
+```
+Once the command runs go to `http://<External IP>` 
+
+#### Deploy with GitHub Actions
+Finally, we added CI/CD using GitHub Actions, such that we can trigger deployment or any other pipeline using GitHub Events. Our CI/CD yaml file can be found under .github/workflows. 
+
+```ci-cd.yml```:
+We implemented a CI/CD workflow to use the deployment container to:
+* Invoke docker image building and pushing to GCR on code changes
+* Deploy the changed containers to update the k8s cluster
+
+---
diff --git a/notebooks/.gitkeep b/notebooks/.gitkeep
diff --git a/notebooks/AC215_milestone3_model_training.ipynb b/notebooks/AC215_milestone3_model_training.ipynb
diff --git a/pictures/ScienceQA1.png b/pictures/ScienceQA1.png
diff --git a/pictures/ScienceQA2.png b/pictures/ScienceQA2.png
diff --git a/pictures/apidoc.png b/pictures/apidoc.png
diff --git a/pictures/chatbot-v2.png b/pictures/chatbot-v2.png
diff --git a/pictures/chatbot.png b/pictures/chatbot.png
diff --git a/pictures/compute_engine.png b/pictures/compute_engine.png
diff --git a/pictures/gcs_model_bucket.png b/pictures/gcs_model_bucket.png
diff --git a/pictures/k8s-v2.jpg b/pictures/k8s-v2.jpg
diff --git a/pictures/k8s.png b/pictures/k8s.png
diff --git a/pictures/ml_workflow.png b/pictures/ml_workflow.png
diff --git a/pictures/ml_workflow_pipeline_run.png b/pictures/ml_workflow_pipeline_run.png
diff --git a/pictures/postman.png b/pictures/postman.png
diff --git a/pictures/science_tutor_app_pipeline.png b/pictures/science_tutor_app_pipeline.png
diff --git a/pictures/science_tutor_app_pipeline2.png b/pictures/science_tutor_app_pipeline2.png
diff --git a/pictures/solution_architecture.png b/pictures/solution_architecture.png
diff --git a/pictures/technical_architecture.png b/pictures/technical_architecture.png
diff --git a/pictures/vertex_ai_model_training.png b/pictures/vertex_ai_model_training.png
diff --git a/pictures/wandb_system.png b/pictures/wandb_system.png
diff --git a/pictures/wandb_train.png b/pictures/wandb_train.png
diff --git a/pictures/web_server_demo.png b/pictures/web_server_demo.png
diff --git a/presentations/AC215-final-presentation.mp4 b/presentations/AC215-final-presentation.mp4
diff --git a/presentations/AC215-final-presentation.pdf b/presentations/AC215-final-presentation.pdf
diff --git a/presentations/AC215-midterm-demo.mp4 b/presentations/AC215-midterm-demo.mp4
diff --git a/presentations/AC215-midterm.pdf b/presentations/AC215-midterm.pdf
diff --git a/references/.gitkeep b/references/.gitkeep
diff --git a/...s/Learn to Explain-Multimodal Reasoning via ThoughtChainsforScienceQuestion Answering.pdf b/...s/Learn to Explain-Multimodal Reasoning via ThoughtChainsforScienceQuestion Answering.pdf
diff --git a/references/VQA-Visual Question Answering.pdf b/references/VQA-Visual Question Answering.pdf
diff --git a/references/Visual Instruction Tuning.pdf b/references/Visual Instruction Tuning.pdf
diff --git a/...wering_Developments_Applications_Datasets_and_Opportunities_A_State-of-the-Art_Survey.pdf b/...wering_Developments_Applications_Datasets_and_Opportunities_A_State-of-the-Art_Survey.pdf
diff --git a/reports/.gitkeep b/reports/.gitkeep