# .github/workflows/nucliadb_search.yml
name: 'nucliadb Search (py)'

# Triggers: pull requests targeting `main` and pushes to `main`, each limited
# to changes under the listed paths.
on:
  pull_request:
    branches:
      - 'main'
    paths:
      - '.github/workflows/nucliadb_search.yml'
      - 'charts/nucliadb_search/**'
      - 'nucliadb_utils/**'
      - 'nucliadb/src/nucliadb/ingest/**'
      - 'nucliadb/src/nucliadb/search/**'
      - 'nucliadb/src/nucliadb/common/**'
      - 'nucliadb_models/**'
      - 'nucliadb_telemetry/**'
      - 'nucliadb_protos/python/**'
      - 'nucliadb_node/**'
      - 'nucliadb_sidecar/**'
      - 'nucliadb_vectors/**'
      - 'nucliadb_texts2/**'
      - 'nucliadb_paragraphs3/**'
      - 'nucliadb_core/**'
      - 'nucliadb_relations2/**'
  push:
    branches:
      - 'main'
    # NOTE(review): unlike the pull_request list, this one has no entries for
    # nucliadb_vectors, nucliadb_texts2, nucliadb_paragraphs3, nucliadb_core
    # and nucliadb_relations2 -- confirm the difference is intentional.
    paths:
      - '.github/workflows/nucliadb_search.yml'
      - 'charts/nucliadb_search/**'
      - 'nucliadb_utils/**'
      - 'nucliadb/src/nucliadb/ingest/**'
      - 'nucliadb/src/nucliadb/search/**'
      - 'nucliadb/src/nucliadb/common/**'
      - 'nucliadb_models/**'
      - 'nucliadb_telemetry/**'
      - 'nucliadb_protos/python/**'
      - 'nucliadb_node/**'
      - 'nucliadb_sidecar/**'
# Runs are grouped per workflow name and git ref; a run that is already in
# progress is not cancelled when a newer one is queued in the same group.
concurrency:
  group: "${{ github.workflow }}-${{ github.ref }}"
  cancel-in-progress: false
# Scopes granted to the workflow's GITHUB_TOKEN.
permissions:
  # Required for requesting the JWT.
  id-token: write
  # Required for actions/checkout.
  # NOTE(review): confirm which step actually needs write (rather than read)
  # access to repository contents.
  contents: write
  # Used by the benchmark action to leave a comment.
  pull-requests: write
# Workflow-level environment shared by the jobs defined in this file.
env:
  # Image name substituted into the Helm chart values by the deploy job.
  IMAGE_NAME: 'search'
  # Inputs of the "Authenticate to Google Cloud" step.
  GCP_WORKLOAD_IDENTITY_PROVIDER: 'projects/224545243904/locations/global/workloadIdentityPools/gh-nuclia/providers/gh-nuclia-provider'
  # NOTE(review): this value looks like an e-mail redaction placeholder, not
  # a real service-account address -- confirm against the repository.
  GCP_SERVICE_ACCOUNT: '[email protected]'
jobs:
  # Job to run tests
  #
  # Runs once per matrix entry (main DB driver / storage backend / Python
  # version). Produces coverage and benchmark results; on push events the
  # benchmark results are also stored.
  tests:
    runs-on: ubuntu-latest
    strategy:
      max-parallel: 3
      matrix:
        include:
          - maindb_driver: "pg"
            storage_backend: "s3"
            python-version: "3.12"
          - maindb_driver: "pg"
            storage_backend: "gcs"
            python-version: "3.12"

    steps:
      - name: Checkout the repository
        uses: actions/checkout@v3

      # Exchanges the workflow identity for an access token, which the
      # registry login step below uses as its password.
      - name: Authenticate to Google Cloud
        id: gcp-auth
        uses: google-github-actions/auth@v2
        with:
          workload_identity_provider: "${{ env.GCP_WORKLOAD_IDENTITY_PROVIDER }}"
          service_account: "${{ env.GCP_SERVICE_ACCOUNT }}"
          token_format: access_token

      # setup docker, as we need to pull the node image to run the tests
      - name: Login to Google Artifact Registry
        uses: docker/login-action@v3
        with:
          registry: europe-west4-docker.pkg.dev
          username: oauth2accesstoken
          password: ${{ steps.gcp-auth.outputs.access_token }}

      - name: 'Set up Cloud SDK'
        uses: 'google-github-actions/setup-gcloud@v1'

      - name: Setup Python
        uses: actions/setup-python@v4
        with:
          python-version: ${{ matrix.python-version }}
          cache: 'pip'

      - name: Install the package
        run: make -C nucliadb/ install-dev

      # Exposes `node_modified` / `sidecar_modified` outputs that gate the two
      # local build steps further down.
      - uses: dorny/paths-filter@v2
        id: filter
        with:
          filters: |
            node_modified:
              - 'nucliadb_core/**'
              - 'nucliadb_node/src/**'
              - 'nucliadb_paragraphs3/**'
              - 'nucliadb_procs/**'
              - 'nucliadb_relations2/**'
              - 'nucliadb_telemetry/**'
              - 'nucliadb_texts2/**'
              - 'nucliadb_vectors/**'
            sidecar_modified:
              - 'nucliadb_sidecar/**'

      # GITHUB_HEAD_REF is preferred; otherwise the `refs/heads/` prefix is
      # stripped from GITHUB_REF.
      - name: Calc git info
        id: git
        run: |-
          BRANCH=${GITHUB_HEAD_REF:-${GITHUB_REF#refs/heads/}}
          echo "branch=$BRANCH" >> "$GITHUB_OUTPUT"

      - name: Install jq
        run: |
          # A failing package-index refresh is tolerated on purpose.
          sudo apt-get update -y || true
          sudo apt-get install -y jq

      - name: Build local Node for testing
        if: steps.filter.outputs.node_modified == 'true'
        env:
          SECRET_KEY: ${{ secrets.RUST_BUILD_SERVER_SECRET }}
          COMMIT_HASH: ${{ github.event.pull_request.head.sha || github.sha }}
          BRANCH: ${{ steps.git.outputs.branch }}
        run: |
          make build-node-debug

      - name: Build local Sidecar for testing
        if: steps.filter.outputs.sidecar_modified == 'true'
        run: |
          make build-sidecar

      # The benchmark JSON is written one directory above nucliadb/, which is
      # where the benchmark steps below read `benchmarks.json` from.
      - name: Run tests
        env:
          TESTING_MAINDB_DRIVER: ${{ matrix.maindb_driver }}
          TESTING_STORAGE_BACKEND: ${{ matrix.storage_backend }}
        run: |
          make -C nucliadb/ pytest_extra_flags="--benchmark-json ../benchmarks.json" test-cov-search

      - name: Upload coverage to Codecov
        uses: codecov/codecov-action@v3
        with:
          file: ./coverage.xml
          flags: search

      # actions/cache v1 is a retired major version that GitHub no longer
      # serves; v4 accepts the same `path` and `key` inputs.
      - name: Download previous benchmark data
        uses: actions/cache@v4
        with:
          path: ./cache
          key: ${{ runner.os }}-search-benchmark

      # Push events: compare against the cached data and save the new result.
      - name: Comment and Store benchmark result
        uses: benchmark-action/github-action-benchmark@v1
        if: github.event_name == 'push'
        with:
          tool: 'pytest'
          output-file-path: benchmarks.json
          external-data-json-path: ./cache/benchmark-data.json
          save-data-file: true
          comment-always: true
          github-token: ${{ secrets.GITHUB_TOKEN }}
          comment-on-alert: true
          fail-on-alert: true
          alert-comment-cc-users: '@nuclia/nuclia-db'

      # Any other event: compare only, the data file is not updated.
      - name: Comment benchmark result based on main
        uses: benchmark-action/github-action-benchmark@v1
        if: github.event_name != 'push'
        with:
          tool: 'pytest'
          output-file-path: benchmarks.json
          external-data-json-path: ./cache/benchmark-data.json
          save-data-file: false
          comment-always: true
          github-token: ${{ secrets.GITHUB_TOKEN }}
          comment-on-alert: true
          fail-on-alert: true
          alert-comment-cc-users: '@nuclia/nuclia-db'

      - name: Store on GH Pages
        uses: benchmark-action/github-action-benchmark@v1
        if: github.event_name == 'push'
        with:
          tool: 'pytest'
          output-file-path: benchmarks.json
          auto-push: true
          gh-repository: github.com/nuclia/nucliadb_performance
          gh-pages-branch: main
          github-token: ${{ secrets.PERFORMANCE_TOKEN }}

  # PR workflows END here
  # PUSH workflows continue with deploy activities

  # Calls the reusable image-build workflow; push events only, after `tests`.
  build:
    name: Build image and push
    needs: tests
    uses: ./.github/workflows/_build-img-nucliadb.yml
    with:
      platforms: linux/amd64,linux/arm64
      image-name: search
      cache-gha-mode: min
    secrets: inherit
    if: github.event_name == 'push'

  # Packages and uploads the Helm chart, then sends a `promote` repository
  # dispatch to nuclia/nucliadb_deploy; push events only, after `build`.
  deploy:
    name: Deploy Helm chart and trigger internal CI
    runs-on: ubuntu-latest
    needs: build
    if: github.event_name == 'push'
    steps:
      # The generated token is consumed by the "Repository Dispatch" step.
      - name: Generate a token
        id: app-token
        uses: actions/create-github-app-token@v1
        with:
          app-id: ${{ secrets.GHAPP_ID_NUCLIABOT }}
          private-key: ${{ secrets.PK_GHAPP_NUCLIABOT }}
          owner: nuclia

      - name: Checkout repository
        uses: actions/checkout@v3

      - name: Calculate short sha
        id: env-vars
        run: |-
          HASH=$(git rev-parse --short HEAD)
          echo "short_sha=$HASH" >> "$GITHUB_OUTPUT"

      # Replaces the placeholders in the chart with the image reference, the
      # registry, and a version of the form `<VERSION file>+<short sha>`.
      - name: Set helm package image
        id: version_step
        env:
          CONTAINER_REGISTRY: europe-west4-docker.pkg.dev/nuclia-internal/nuclia
        run: |-
          sed -i.bak "s#IMAGE_TO_REPLACE#$IMAGE_NAME:${{ steps.env-vars.outputs.short_sha }}#" ./charts/nucliadb_search/values.yaml
          sed -i.bak "s#CONTAINER_REGISTRY_TO_REPLACE#$CONTAINER_REGISTRY#" ./charts/nucliadb_search/values.yaml
          VERSION=$(cat VERSION)
          VERSION_SHA=$VERSION+${{ steps.env-vars.outputs.short_sha }}
          sed -i.bak "s#99999.99999.99999#$VERSION_SHA#" ./charts/nucliadb_search/Chart.yaml
          echo "version_number=$VERSION_SHA" >> "$GITHUB_OUTPUT"

      # NOTE(review): the e-mail value below looks like a redaction
      # placeholder -- confirm the intended address against the repository.
      - name: Configure Git
        run: |
          git config user.name "$GITHUB_ACTOR"
          git config user.email "[email protected]"

      - name: Install Helm
        uses: azure/setup-helm@v3
        with:
          version: v3.4.0

      # NOTE(review): curl is invoked without --fail, so an HTTP error
      # response from the chart server does not fail this step -- confirm
      # that this is the desired behavior.
      - name: Push helm package
        run: |-
          helm lint charts/nucliadb_search
          helm package charts/nucliadb_search
          curl --data-binary "@nucliadb_search-${{ steps.version_step.outputs.version_number }}.tgz" ${{ secrets.HELM_CHART_URL }}/api/charts

      - name: Repository Dispatch
        uses: peter-evans/repository-dispatch@v2
        with:
          token: ${{ steps.app-token.outputs.token }}
          repository: nuclia/nucliadb_deploy
          event-type: promote
          client-payload: '{"component": "nucliadb_search", "chart-version": "${{ steps.version_step.outputs.version_number }}" }'