-
Notifications
You must be signed in to change notification settings - Fork 13
52 lines (45 loc) · 1.48 KB
/
parquet.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
# Workflow: build a Parquet file and publish it as a release asset.
name: Create Parquet

on:
  # Allow manual runs from the Actions tab.
  workflow_dispatch:
  # Run at minute 50 of every sixth hour (00:50, 06:50, 12:50, 18:50 UTC).
  schedule:
    - cron: '50 */6 * * *'

# One run per ref at a time; a newer run waits instead of cancelling
# (cancel-in-progress is left at its default of false).
concurrency:
  group: ci-parquet-${{ github.ref }}

# The publish step uploads a release asset, which needs write access to
# repository contents.
permissions:
  contents: write
jobs:
  # Downloads the published pypi-data.sqlite.gz release asset, runs parquet.py
  # on it, and uploads the resulting pypi-data.parquet to the "latest" release.
  create-parquet:
    name: Create parquet
    runs-on: ubuntu-latest
    # Only run in the canonical repository (e.g. not in forks).
    if: github.repository == 'pypi-data/pypi-json-data'
    steps:
      - name: Maximize build space
        # Pinned to a release tag instead of the mutable `master` branch so a
        # change upstream cannot silently alter a job with write permissions.
        uses: easimon/maximize-build-space@v10
        with:
          root-reserve-mb: 512
          swap-size-mb: 1024
          remove-dotnet: 'true'
          remove-codeql: 'true'
          remove-docker-images: 'true'
          remove-android: 'true'

      - name: Install tools
        shell: bash
        run: |
          set -euo pipefail
          IFS=$'\n\t'
          # Refresh the package index first: the runner image's cached index
          # can be stale, which makes the install fail with 404s.
          sudo apt-get update
          # apt-get (not apt) has a stable command-line interface for scripts.
          sudo apt-get install -y wget libdeflate-tools

      - name: Set up Python
        uses: actions/setup-python@v4
        with:
          # Quoted so YAML does not read the version as the float 3.1.
          python-version: '3.10'

      - name: Install Python dependencies
        run: pip install "polars[pyarrow]" tqdm click

      - name: Download conversion script
        # The script is fetched from the main branch rather than checked out.
        run: wget https://raw.githubusercontent.com/pypi-data/pypi-json-data/main/pypi_data_downloader/parquet.py

      - name: Download SQLite archive
        run: wget --progress=dot:giga https://github.com/pypi-data/pypi-json-data/releases/download/latest/pypi-data.sqlite.gz

      - name: Decompress SQLite archive
        run: libdeflate-gzip -d pypi-data.sqlite.gz

      - name: Convert to Parquet
        # NOTE(review): arguments are presumably <input> <output> — confirm
        # against parquet.py.
        run: python parquet.py pypi-data.sqlite pypi-data.parquet

      - name: Publish
        uses: softprops/action-gh-release@v1
        with:
          draft: false
          name: 'Latest Release'
          tag_name: 'latest'
          # NOTE(review): presumably a branch or ref named `empty` that the
          # release tag points at — confirm it exists in the repository.
          target_commitish: 'empty'
          files: 'pypi-data.parquet'