Collect cluster stats #23272
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Collect cluster stats | |
on: | |
repository_dispatch: | |
workflow_dispatch: | |
inputs: | |
qdrant_python_client_version: | |
description: "Qdrant python client version" | |
default: 1.12.1 | |
schedule: | |
# Run every 15 minutes | |
- cron: "*/15 * * * *" | |
jobs: | |
collect-stats: | |
runs-on: ubuntu-latest | |
steps: | |
- uses: actions/checkout@v3 | |
- uses: webfactory/[email protected] | |
with: | |
ssh-private-key: ${{ secrets.SSH_PRIVATE_KEY }} | |
- name: Install tools | |
run: | | |
bash -x tools/ci/install-hcloud.sh | |
- name: Collect and store cluster and bfb status | |
id: cluster_checks | |
run: | | |
export HCLOUD_TOKEN=${{ secrets.HCLOUD_TOKEN }} | |
export QDRANT_API_KEY=${{ secrets.QDRANT_API_KEY }} | |
export QDRANT_CLUSTER_URL=${{ secrets.QDRANT_CLUSTER_URL }} | |
export QC_NAME="qdrant-$(echo $QDRANT_CLUSTER_URL | sed -E 's~([^.]+)\..*~\1~')" | |
export POSTGRES_PASSWORD=${{ secrets.POSTGRES_PASSWORD }} | |
export POSTGRES_HOST=${{ secrets.POSTGRES_HOST }} | |
export QDRANT_PYTHON_CLIENT_VERSION=${{ inputs.qdrant_python_client_version }} | |
bash -x tools/check-cluster-health.sh | |
bash -x tools/collect-node-metrics.sh | |
- uses: actions/upload-artifact@v4 | |
with: | |
name: points-dump | |
path: data/points-dump | |
retention-days: 7 | |
- name: Fail job if any check failed | |
if: steps.cluster_checks.outputs.failed == 'true' | |
run: exit 1 | |
collect-stats-debug-cluster: | |
if: ${{ vars.ENABLE_DEBUG_CLUSTER == 'true' && ! cancelled() }} | |
needs: collect-stats | |
runs-on: ubuntu-latest | |
steps: | |
- uses: actions/checkout@v3 | |
- uses: webfactory/[email protected] | |
with: | |
ssh-private-key: ${{ secrets.SSH_PRIVATE_KEY }} | |
- name: Install tools | |
run: | | |
bash -x tools/ci/install-hcloud.sh | |
- name: Collect and store cluster and bfb status | |
id: cluster_checks | |
run: | | |
export HCLOUD_TOKEN=${{ secrets.HCLOUD_TOKEN }} | |
export QDRANT_API_KEY=${{ secrets.QDRANT_API_KEY }} | |
export QDRANT_CLUSTER_URL=${{ secrets.QDRANT_CLUSTER_URL_2 }} | |
export QC_NAME="qdrant-$(echo $QDRANT_CLUSTER_URL | sed -E 's~([^.]+)\..*~\1~')" | |
export POSTGRES_PASSWORD=${{ secrets.POSTGRES_PASSWORD }} | |
export POSTGRES_HOST=${{ secrets.POSTGRES_HOST }} | |
export QDRANT_PYTHON_CLIENT_VERSION=${{ inputs.qdrant_python_client_version }} | |
bash -x tools/check-cluster-health.sh | |
bash -x tools/collect-node-metrics.sh | |
- uses: actions/upload-artifact@v4 | |
with: | |
name: points-dump-debug | |
path: data/points-dump-debug | |
retention-days: 7 | |
- name: Fail job if any check failed | |
if: steps.cluster_checks.outputs.failed == 'true' | |
run: exit 1 | |
collect-stats-three-cluster: | |
if: ${{ vars.ENABLE_DEBUG_CLUSTER == 'true' && ! cancelled() }} | |
needs: collect-stats-debug-cluster | |
runs-on: ubuntu-latest | |
steps: | |
- uses: actions/checkout@v3 | |
- uses: webfactory/[email protected] | |
with: | |
ssh-private-key: ${{ secrets.SSH_PRIVATE_KEY }} | |
- name: Install tools | |
run: | | |
bash -x tools/ci/install-hcloud.sh | |
- name: Collect and store cluster and bfb status | |
id: cluster_checks | |
run: | | |
export HCLOUD_TOKEN=${{ secrets.HCLOUD_TOKEN }} | |
export QDRANT_API_KEY=${{ secrets.QDRANT_API_KEY }} | |
export QDRANT_CLUSTER_URL=${{ secrets.QDRANT_CLUSTER_URL_3 }} | |
export QC_NAME="qdrant-$(echo $QDRANT_CLUSTER_URL | sed -E 's~([^.]+)\..*~\1~')" | |
export POSTGRES_PASSWORD=${{ secrets.POSTGRES_PASSWORD }} | |
export POSTGRES_HOST=${{ secrets.POSTGRES_HOST }} | |
export QDRANT_PYTHON_CLIENT_VERSION=${{ inputs.qdrant_python_client_version }} | |
bash -x tools/check-cluster-health.sh | |
bash -x tools/collect-node-metrics.sh | |
- uses: actions/upload-artifact@v4 | |
with: | |
name: points-dump-debug | |
path: data/points-dump-debug | |
retention-days: 7 | |
- name: Fail job if any check failed | |
if: steps.cluster_checks.outputs.failed == 'true' | |
run: exit 1 |