ClickHouse · alexey-milovidov · Nov 12, 2024 · Nov 12, 2024 · Nov 12, 2024
diff --git a/tinybird/README.md b/tinybird/README.md
@@ -0,0 +1,32 @@
+# Disclaimer
+
+Benchmarking a database often requires deep expertise and fine-tuning. Here, our goal is merely to test the default experience of a new
+user, i.e. someone who does not invest the time to optimize performance.
+
+Testing is semi-automated.
+
+The system has a timeout of 10 s; when a query exceeds it, the system recommends optimizing (rewriting) the query.
+
+Load time and data size in the results are set to 0 because Tinybird did not report these figures.
+
+# Creating an account
+
+Head to https://www.tinybird.co and create an account.
+
+# Inserting data
+
+Tinybird supports data inserts from various sources. We are going to use S3 to load a Parquet file into Tinybird. Since Tinybird limits the
+file size to 1 GB, and the test data set is larger than that, we split it into smaller chunks using ClickHouse:
+
+```sql
+INSERT INTO FUNCTION s3('https://hitsparquet.s3.eu-west-3.amazonaws.com/data/hits_{_partition_id}.parquet', '', '', 'Parquet')
+PARTITION BY rand() % 50
+SELECT * FROM hits
+```
+
+Importing files only slightly smaller than 1 GB did not always work, so we used 50 files of around 280 MB each instead. You will need to
+use the auto mode to make sure all the files are read.
+
+# Querying the data
+
+Once the data is inserted, you can create the endpoints needed to run the benchmark using pipes. `run.sh` expects them to be named `Q1` through `Q43` and queries each endpoint three times.
diff --git a/tinybird/results/tinybird.json b/tinybird/results/tinybird.json
@@ -0,0 +1,58 @@
+{
+    "system": "Tinybird",
+    "date": "2024-11-11",
+    "machine": "serverless",
+    "cluster_size": 1,
+    "comment": "",
+
+    "tags": ["C++", "column-oriented", "ClickHouse derivative"],
+
+    "load_time": 0,
+    "data_size": 0,
+
+    "result": [
+  [0.002, 0.002, 0.006],
+  [0.03, 0.03, 0.034],
+  [0.08, 0.08, 0.083],
+  [0.109, 0.104, 0.102],
+  [1.011, 0.668, 0.637],
+  [0.664, 0.582, 0.597],
+  [1.899, 0.055, 0.068],
+  [0.036, 0.033, 0.032],
+  [2.55, 2.519, 2.341],
+  [2.076, 2.042, 2.387],
+  [0.344, 0.365, 0.322],
+  [0.599, 0.401, 0.413],
+  [1.228, 1.265, 1.085],
+  [1.742, 1.729, 1.941],
+  [1.477, 1.468, 1.423],
+  [1.442, 1.317, 1.496],
+  [4.402, 4.385, 4.476],
+  [3.236, 3.165, 3.396],
+  [9.751, 9.707, 8.164],
+  [0.079, 0.084, 0.074],
+  [2.924, 1.204, 1.213],
+  [1.243, 1.122, 1.69],
+  [3.846, 1.67, 1.727],
+  [7.491, 8.793, 7.513],
+  [0.352, 0.338, 0.39],
+  [0.293, 0.255, 0.262],
+  [0.384, 0.445, 0.407],
+  [1.518, 1.366, 1.326],
+  [null, null, null],
+  [0.09, 0.092, 0.094],
+  [0.951, 0.897, 0.946],
+  [1.152, 1.106, 1.299],
+  [5.331, 5.509, 5.432],
+  [8.104, 8.451, 8.519],
+  [6.037, 6.861, 7.138],
+  [3.298, 3.412, 3.422],
+  [1.225, 1.121, 1.167],
+  [1.53, 1.768, 1.189],
+  [0.989, 0.891, 0.854],
+  [2.183, 2.042, 1.919],
+  [0.166, 0.018, 0.015],
+  [0.527, 0.284, 0.304],
+  [0.214, 0.213, 0.205]
+]
+}
diff --git a/tinybird/run.sh b/tinybird/run.sh
@@ -0,0 +1,24 @@
+#!/bin/bash
+
+# Define the base URL and Authorization token
+BASE_URL="https://api.tinybird.co/v0/pipes/"
+AUTH_HEADER=<TOKEN>
+
+results="["
+
+for i in {1..43}; do
+    times=()
+    for j in {1..3}; do
+        response=$(curl -s --compressed -H "$AUTH_HEADER" "${BASE_URL}Q${i}.json")
+
+        elapsed=$(echo "$response" | jq '.statistics.elapsed')
+        echo "$elapsed"
+        times+=($elapsed)
+    done
+    results+=$(printf "[%s,%s,%s]," "${times[0]}" "${times[1]}" "${times[2]}")
+done
+
+results=${results%,}
+results+="]"
+
+echo "$results"