tweak examples, add light tests, add gh action (#23)

* tweak examples, add light tests, add gh action * remove launch.json * remove beta9ignore * tweak to run in pr rn * refactor a bit * beam auth in action * set env * update deps * try unset CI * try setting manually * add workspace id env * merge and update one test * fix test
beam-cloud · Aug 2, 2024 · a065cd4 · a065cd4
1 parent 9203bda
commit a065cd4
Show file tree

Hide file tree

Showing 56 changed files with 4,081 additions and 58 deletions.
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
@@ -0,0 +1,52 @@
+name: Tests
+
+on: [push, pull_request, workflow_dispatch]
+
+jobs:
+  light-test:
+    runs-on: ubuntu-latest
+    # Job-level env: visible to every step below.
+    env:
+      BEAM_AUTH_TOKEN: ${{ secrets.BEAM_AUTH_TOKEN }}
+      BEAM_WORKSPACE_ID: ${{ secrets.BEAM_WORKSPACE_ID }}
+
+    steps:
+    - uses: actions/checkout@v3
+
+    - name: set up python
+      id: setup-python
+      uses: actions/setup-python@v4
+      with:
+        python-version: '3.x'
+
+    - name: install poetry
+      uses: snok/install-poetry@v1
+      with:
+        version: '1.5.1'
+        virtualenvs-create: true
+        virtualenvs-in-project: true
+
+    - name: load cached venv
+      id: cached-poetry-dependencies
+      uses: actions/cache@v3
+      with:
+        path: .venv
+        # '3.x' floats, so key on the resolved interpreter version as well:
+        # a venv built for an older Python must not be restored onto a newer one.
+        key: venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-${{ hashFiles('**/poetry.lock') }}
+
+    - name: install dependencies
+      if: steps.cached-poetry-dependencies.outputs.cache-hit != 'true'
+      run: poetry install --no-interaction --no-root
+
+    - name: configure beam
+      run: |
+        source .venv/bin/activate
+        mkdir -p ~/.beam
+        # Take the token from the job-level env var rather than pasting the
+        # secret into the script text before the shell parses it.
+        cat << EOF > ~/.beam/config.ini
+        [default]
+        token = ${BEAM_AUTH_TOKEN}
+        gateway_host = gateway.beam.cloud
+        gateway_port = 443
+        EOF
+
+    - name: run tests
+      run: |
+        source .venv/bin/activate
+        pytest tests/light_test.py
diff --git a/.gitignore b/.gitignore
@@ -3,4 +3,5 @@
 __pycache__
 __downloads__
 .env
-.venv
+.venv
+.vscode/launch.json
diff --git a/02_customizing_environment/custom_image.py b/02_customizing_environment/custom_image.py
@@ -11,17 +11,15 @@
 image = Image(
     python_version="python3.9",
     python_packages=[
-        "transformers",
         "torch",
     ],
-    commands=["apt-get update -y && apt-get install ffmpeg -y"],
-    base_image="docker.io/nvidia/cuda:12.1.1-runtime-ubuntu20.04",
+    commands=["apt-get update -y && apt-get install neovim -y"],
+    base_image="docker.io/nvidia/cuda:12.3.1-runtime-ubuntu20.04",
 )
 
 
-@endpoint()
-def handler(image=image):
+@endpoint(image=image)
+def handler():
+    """Return the version of torch that is importable inside the container."""
     import torch
 
-    print(torch)
-    return {}
+    return {"torch_version": torch.__version__}
diff --git a/02_customizing_environment/gpu_acceleration.py b/02_customizing_environment/gpu_acceleration.py
@@ -11,8 +11,8 @@
 
 @endpoint(gpu="T4")
 def handler():
-    print("📡 This is running on a GPU!")
     print(subprocess.check_output(["nvidia-smi"]))
+    return "This container has a GPU attached 📡!"
 
 
 if __name__ == "__main__":

diff --git a/02_customizing_environment/using_secrets.py b/02_customizing_environment/using_secrets.py
@@ -8,15 +8,17 @@
 Once the secret is created, it can be accessed as an environment variable (see below).
 """
 
+import os
 from beam import function
 
+os.environ["FOO"] = "bar"
 
-@function(secrets=["AWS_ACCESS_KEY"])
+@function(secrets=["FOO"])
 def handler():
     import os
 
-    my_secret = os.environ["AWS_ACCESS_KEY"]
-    print(f"Secret: {my_secret}")
+    my_secret = os.environ["FOO"]
+    return f"secret {my_secret}"
 
 
 if __name__ == "__main__":

diff --git a/03_endpoint/keep_warm.py b/03_endpoint/keep_warm.py
@@ -11,4 +11,4 @@
 # Each container will stay up for 5 min before shutting down automatically
 @endpoint(keep_warm_seconds=300)
 def handler():
-    return {}
+    return "warm"
diff --git a/03_endpoint/preload_models.py b/03_endpoint/preload_models.py
@@ -51,6 +51,4 @@ def predict(context, prompt):
         generate_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False
     )[0]
 
-    print(result)
-
     return {"prediction": result}
diff --git a/04_task_queue/async_task.py b/04_task_queue/async_task.py
@@ -7,7 +7,7 @@
 
 Task queues are deployed the same way as web endpoints. 
 
-As a recap, this is the CLI command to deploy an task queue or endpoint:
+As a recap, this is the CLI command to deploy a task queue or endpoint:
 
 ```
 beam deploy [file.py]:[function] --name [name]
@@ -36,5 +36,6 @@ def multiply(**inputs):
     return {"result": result}
 
 
-# Interactively enqueue a task without deploying
-multiply.put(x=1)
+if __name__ == "__main__":
+    # Interactively enqueue a task without deploying
+    multiply.put(x=1)
diff --git a/04_task_queue/task_callbacks.py b/04_task_queue/task_callbacks.py
@@ -12,7 +12,7 @@
 from beam import function
 
 
-@function(callback_url="https://your-server.io")
+@function(callback_url="https://www.beam.cloud/")
 def handler(x):
     return {"result": x}
 

diff --git a/05_function/scaling_out.py b/05_function/scaling_out.py
@@ -23,6 +23,8 @@ def main():
     for result in square.map(numbers):
         print(result)
         squared.append(result)
+
+    print("result", squared)
 
 
 if __name__ == "__main__":

diff --git a/05_function/sharing_state.py b/05_function/sharing_state.py
@@ -6,17 +6,29 @@
 `Queue()` is a concurrency-safe distributed queue, accessible both locally and within remote containers.
 """
 
-from beam import Queue
+from beam import Queue, function
 
-val = [1, 2, 3]
 
-# Initialize the Queue
-q = Queue(name="myqueue")
+@function(cpu=0.1)
+def access_queue(): 
+    q = Queue(name="myqueue")
+    return q.pop()
 
-for i in range(100):
-    # Insert something to the queue
-    q.put(val)
-while not q.empty():
-    # Remove something from the queue
-    val = q.pop()
-    print(val)
+if __name__ == "__main__":
+    val = ["eli", "luke", "john", "nick"]
+
+    # Initialize the Queue
+    q = Queue(name="myqueue")
+
+    for i in val:
+        # Insert something to the queue
+        q.put(i)
+
+    while not q.empty():
+        # Remove something from the queue
+        val = q.pop()
+        print(val)
+
+    q.put("daniel")
+
+    print(access_queue.remote())
diff --git a/06_volume/mounting_volumes.py b/06_volume/mounting_volumes.py
diff --git a/06_volume/reading_and_writing_data.py → 06_volume/volume_use.py b/06_volume/reading_and_writing_data.py → 06_volume/volume_use.py
@@ -7,17 +7,23 @@
 from beam import function, Volume
 
 
-VOLUME_PATH = "./model_weights"
+VOLUME_PATH = "./example-volume"
 
 
 @function(
-    volumes=[Volume(name="model-weights", mount_path=VOLUME_PATH)],
+    volumes=[Volume(name="example-volume", mount_path=VOLUME_PATH)],
 )
 def access_files():
     # Write files to a volume
     with open(f"{VOLUME_PATH}/somefile.txt", "w") as f:
-        f.write("Writing to the volume!")
+        f.write("On the volume!")
 
     # Read files from a volume
+    s = ""
     with open(f"{VOLUME_PATH}/somefile.txt", "r") as f:
-        f.read()
+        s = f.read()
+
+    return s
+
+if __name__ == "__main__":
+    print(access_files.remote())
diff --git a/07_image_generation/saving-outputs/app.py → 07_outputs/outputs.py b/07_image_generation/saving-outputs/app.py → 07_outputs/outputs.py
@@ -35,11 +35,10 @@ def save_image():
     # Print other details about the output
     print(f"Output ID: {output.id}")
     print(f"Output Path: {output.path}")
-    print(f"Output Stats: {output.stat()}")
     print(f"Output Exists: {output.exists()}")
 
     return {"image": url}
 
 
 if __name__ == "__main__":
-    save_image()
+    save_image.remote()
diff --git a/...generation/sdxl-turbo-streaming/README.md → ...generation/sdxl-turbo-streaming/README.md b/...generation/sdxl-turbo-streaming/README.md → ...generation/sdxl-turbo-streaming/README.md
diff --git a/...ation/sdxl-turbo-streaming/backend/app.py → ...ation/sdxl-turbo-streaming/backend/app.py b/...ation/sdxl-turbo-streaming/backend/app.py → ...ation/sdxl-turbo-streaming/backend/app.py
@@ -1,4 +1,3 @@
-from beam import endpoint, Image
 from beam import Image, Volume, endpoint, Output
 
 CACHE_PATH = "./models"

diff --git a/.../sdxl-turbo-streaming/frontend/.gitignore → .../sdxl-turbo-streaming/frontend/.gitignore b/.../sdxl-turbo-streaming/frontend/.gitignore → .../sdxl-turbo-streaming/frontend/.gitignore
diff --git a/...n/sdxl-turbo-streaming/frontend/README.md → ...n/sdxl-turbo-streaming/frontend/README.md b/...n/sdxl-turbo-streaming/frontend/README.md → ...n/sdxl-turbo-streaming/frontend/README.md
diff --git a/...rbo-streaming/frontend/components/Home.js → ...rbo-streaming/frontend/components/Home.js b/...rbo-streaming/frontend/components/Home.js → ...rbo-streaming/frontend/components/Home.js
diff --git a/...xl-turbo-streaming/frontend/jsconfig.json → ...xl-turbo-streaming/frontend/jsconfig.json b/...xl-turbo-streaming/frontend/jsconfig.json → ...xl-turbo-streaming/frontend/jsconfig.json
diff --git a/...-turbo-streaming/frontend/next.config.mjs → ...-turbo-streaming/frontend/next.config.mjs b/...-turbo-streaming/frontend/next.config.mjs → ...-turbo-streaming/frontend/next.config.mjs
diff --git a/...urbo-streaming/frontend/package-lock.json → ...urbo-streaming/frontend/package-lock.json b/...urbo-streaming/frontend/package-lock.json → ...urbo-streaming/frontend/package-lock.json
diff --git a/...dxl-turbo-streaming/frontend/package.json → ...dxl-turbo-streaming/frontend/package.json b/...dxl-turbo-streaming/frontend/package.json → ...dxl-turbo-streaming/frontend/package.json
diff --git a/...l-turbo-streaming/frontend/pages/index.js → ...l-turbo-streaming/frontend/pages/index.js b/...l-turbo-streaming/frontend/pages/index.js → ...l-turbo-streaming/frontend/pages/index.js
diff --git a/...rbo-streaming/frontend/public/favicon.ico → ...rbo-streaming/frontend/public/favicon.ico b/...rbo-streaming/frontend/public/favicon.ico → ...rbo-streaming/frontend/public/favicon.ico
diff --git a/...-turbo-streaming/frontend/public/next.svg → ...-turbo-streaming/frontend/public/next.svg b/...-turbo-streaming/frontend/public/next.svg → ...-turbo-streaming/frontend/public/next.svg
diff --git a/...urbo-streaming/frontend/public/vercel.svg → ...urbo-streaming/frontend/public/vercel.svg b/...urbo-streaming/frontend/public/vercel.svg → ...urbo-streaming/frontend/public/vercel.svg
diff --git a/...streaming/frontend/styles/Home.module.css → ...streaming/frontend/styles/Home.module.css b/...streaming/frontend/styles/Home.module.css → ...streaming/frontend/styles/Home.module.css
diff --git a/...rbo-streaming/frontend/styles/globals.css → ...rbo-streaming/frontend/styles/globals.css b/...rbo-streaming/frontend/styles/globals.css → ...rbo-streaming/frontend/styles/globals.css
diff --git a/07_image_generation/sdxl-turbo/README.md → 09_image_generation/sdxl-turbo/README.md b/07_image_generation/sdxl-turbo/README.md → 09_image_generation/sdxl-turbo/README.md
diff --git a/...mage_generation/sdxl-turbo/backend/app.py → ...mage_generation/sdxl-turbo/backend/app.py b/...mage_generation/sdxl-turbo/backend/app.py → ...mage_generation/sdxl-turbo/backend/app.py
diff --git a/...generation/sdxl-turbo/frontend/.gitignore → ...generation/sdxl-turbo/frontend/.gitignore b/...generation/sdxl-turbo/frontend/.gitignore → ...generation/sdxl-turbo/frontend/.gitignore
diff --git a/...on/sdxl-turbo/frontend/assets/favicon.ico → ...on/sdxl-turbo/frontend/assets/favicon.ico b/...on/sdxl-turbo/frontend/assets/favicon.ico → ...on/sdxl-turbo/frontend/assets/favicon.ico
diff --git a/...tion/sdxl-turbo/frontend/requirements.txt → ...tion/sdxl-turbo/frontend/requirements.txt b/...tion/sdxl-turbo/frontend/requirements.txt → ...tion/sdxl-turbo/frontend/requirements.txt
diff --git a/...eneration/sdxl-turbo/frontend/rxconfig.py → ...eneration/sdxl-turbo/frontend/rxconfig.py b/...eneration/sdxl-turbo/frontend/rxconfig.py → ...eneration/sdxl-turbo/frontend/rxconfig.py
diff --git a/...bo/frontend/sdxl_frontend/beam_service.py → ...bo/frontend/sdxl_frontend/beam_service.py b/...bo/frontend/sdxl_frontend/beam_service.py → ...bo/frontend/sdxl_frontend/beam_service.py
diff --git a/...o/frontend/sdxl_frontend/sdxl_frontend.py → ...o/frontend/sdxl_frontend/sdxl_frontend.py b/...o/frontend/sdxl_frontend/sdxl_frontend.py → ...o/frontend/sdxl_frontend/sdxl_frontend.py
diff --git a/...eneration/sdxl-turbo/static/reflex-ui.png → ...eneration/sdxl-turbo/static/reflex-ui.png b/...eneration/sdxl-turbo/static/reflex-ui.png → ...eneration/sdxl-turbo/static/reflex-ui.png
diff --git a/07_image_generation/sdxl/README.md → 09_image_generation/sdxl/README.md b/07_image_generation/sdxl/README.md → 09_image_generation/sdxl/README.md
diff --git a/07_image_generation/sdxl/backend/app.py → 09_image_generation/sdxl/backend/app.py b/07_image_generation/sdxl/backend/app.py → 09_image_generation/sdxl/backend/app.py
diff --git a/07_image_generation/sdxl/frontend/.gitignore → 09_image_generation/sdxl/frontend/.gitignore b/07_image_generation/sdxl/frontend/.gitignore → 09_image_generation/sdxl/frontend/.gitignore
diff --git a/...neration/sdxl/frontend/assets/favicon.ico → ...neration/sdxl/frontend/assets/favicon.ico b/...neration/sdxl/frontend/assets/favicon.ico → ...neration/sdxl/frontend/assets/favicon.ico
diff --git a/...generation/sdxl/frontend/requirements.txt → ...generation/sdxl/frontend/requirements.txt b/...generation/sdxl/frontend/requirements.txt → ...generation/sdxl/frontend/requirements.txt
diff --git a/...mage_generation/sdxl/frontend/rxconfig.py → ...mage_generation/sdxl/frontend/rxconfig.py b/...mage_generation/sdxl/frontend/rxconfig.py → ...mage_generation/sdxl/frontend/rxconfig.py
diff --git a/...xl/frontend/sdxl_frontend/beam_service.py → ...xl/frontend/sdxl_frontend/beam_service.py b/...xl/frontend/sdxl_frontend/beam_service.py → ...xl/frontend/sdxl_frontend/beam_service.py
diff --git a/...l/frontend/sdxl_frontend/sdxl_frontend.py → ...l/frontend/sdxl_frontend/sdxl_frontend.py b/...l/frontend/sdxl_frontend/sdxl_frontend.py → ...l/frontend/sdxl_frontend/sdxl_frontend.py
diff --git a/...mage_generation/sdxl/static/reflex-ui.png → ...mage_generation/sdxl/static/reflex-ui.png b/...mage_generation/sdxl/static/reflex-ui.png → ...mage_generation/sdxl/static/reflex-ui.png
diff --git a/...e_generation/stable-diffusion-lora/app.py → ...e_generation/stable-diffusion-lora/app.py b/...e_generation/stable-diffusion-lora/app.py → ...e_generation/stable-diffusion-lora/app.py
diff --git a/10_language_models/mixtral7b/app.py b/10_language_models/mixtral7b/app.py
@@ -0,0 +1,94 @@
+"""
+### Mistral 7B ###
+
+Note: This is a gated Huggingface model and you must request access to it here:
+
+https://huggingface.co/mistralai/Mistral-7B-v0.1
+
+Retrieve your HF token from this page: https://huggingface.co/settings/tokens
+
+After your access is granted, make sure to save your Huggingface token on Beam:
+
+```
+$ beam secret create [SECRET]
+```
+
+...and add the secret to your Beam function decorator:
+
+@endpoint(secrets=["HF_TOKEN"])
+"""
+
+from beam import endpoint, Image, Volume, env
+
+# This ensures that these packages are only loaded when the script is running remotely on Beam
+if env.is_remote():
+    import torch
+    from transformers import AutoModelForCausalLM, AutoTokenizer
+
+CHECKPOINT = "mistralai/Mistral-7B-v0.1"
+BEAM_VOLUME_PATH = "./cached_models"
+
+
+def load_models():
+    """Load the causal LM and its tokenizer for CHECKPOINT.
+
+    Registered as the endpoint's `on_start` hook. Both downloads use
+    BEAM_VOLUME_PATH as their cache directory.
+
+    Returns:
+        A `(model, tokenizer)` tuple.
+    """
+    model = AutoModelForCausalLM.from_pretrained(
+        CHECKPOINT,
+        torch_dtype=torch.float16,
+        device_map="auto",
+        cache_dir=BEAM_VOLUME_PATH,
+    )
+    # Cache the tokenizer files next to the weights instead of in the
+    # default Hugging Face cache directory.
+    tokenizer = AutoTokenizer.from_pretrained(CHECKPOINT, cache_dir=BEAM_VOLUME_PATH)
+    return model, tokenizer
+
+
+@endpoint(
+    secrets=["HF_TOKEN"],
+    on_start=load_models,
+    name="mistral-7b",
+    cpu=2,
+    memory="32Gi",
+    gpu="A10G",
+    image=Image(
+        python_version="python3.11",
+        python_packages=[
+            "transformers==4.42.3",
+            "sentencepiece==0.1.99",
+            "accelerate==0.23.0",
+            "torch==2.0.1",
+        ],
+    ),
+    volumes=[
+        Volume(
+            name="cached_models",
+            mount_path=BEAM_VOLUME_PATH,
+        )
+    ],
+)
+def generate(context, **inputs):
+    """Generate a text completion for the `prompt` passed to the API.
+
+    Args:
+        context: Request context; `context.on_start_value` holds the
+            `(model, tokenizer)` tuple returned by `load_models`.
+        **inputs: Request fields. `prompt` is required; `max_new_tokens`,
+            `temperature`, `top_p` and `top_k` optionally override the
+            sampling defaults below.
+
+    Returns:
+        `{"generated_text": ...}` on success, or `{"error": ...}` when no
+        prompt was provided.
+    """
+    # Retrieve model and tokenizer from on_start
+    model, tokenizer = context.on_start_value
+
+    # Inputs passed to API
+    prompt = inputs.get("prompt")
+    if not prompt:
+        return {"error": "Please provide a prompt."}
+
+    # The tokenizer may not define a pad token; fall back to EOS explicitly
+    # rather than forwarding None to generate().
+    pad_token_id = tokenizer.pad_token_id
+    if pad_token_id is None:
+        pad_token_id = tokenizer.eos_token_id
+
+    generate_args = {
+        "max_new_tokens": inputs.get("max_new_tokens", 128),
+        "temperature": inputs.get("temperature", 1.0),
+        "top_p": inputs.get("top_p", 0.95),
+        "top_k": inputs.get("top_k", 50),
+        "repetition_penalty": 1.0,
+        "no_repeat_ngram_size": 0,
+        "use_cache": True,
+        "do_sample": True,
+        "eos_token_id": tokenizer.eos_token_id,
+        "pad_token_id": pad_token_id,
+    }
+
+    # Keep the attention mask together with the input ids and move both to
+    # the device the model was placed on.
+    encoded = tokenizer(prompt, return_tensors="pt").to(model.device)
+
+    with torch.no_grad():
+        output = model.generate(
+            input_ids=encoded.input_ids,
+            attention_mask=encoded.attention_mask,
+            **generate_args,
+        )
+        generated_text = tokenizer.decode(output[0], skip_special_tokens=True)
+
+    return {"generated_text": generated_text}
diff --git a/10_experimental/signal-example-inference.py → 11_experimental/signal-example-inference.py b/10_experimental/signal-example-inference.py → 11_experimental/signal-example-inference.py
diff --git a/10_experimental/signal-example-train.py → 11_experimental/signal-example-train.py b/10_experimental/signal-example-train.py → 11_experimental/signal-example-train.py
diff --git a/README.md b/README.md
@@ -10,6 +10,15 @@
 
 This repo includes various code examples that demonstrate the functionality of Beam.
 
+## Running examples
+Some of the examples showcase local use cases and others are examples of full deployments. For the examples that can
+be run locally, you can use Poetry to set up your Python environment.
+
+```bash 
+poetry install 
+poetry shell
+```
+
 ---
 
 **Attention Beta9 users**: These examples are for the [beam.cloud](https://beam.cloud) product. If you are coming from the open-source [Beta9](https://github.com/beam-cloud/beta9/) repo, any of these examples can be run by changing the Python imports from **beam** to **beta9**: