browsertrix/backend/btrixcloud/k8s/templates/profile_job.yaml
Tessa Walsh 0fa60ebc45
Rename archives/teams -> orgs in codebase + add db migration (#486)
* Rename archives to orgs and aid to oid on backend

* Rename archive to org and aid to oid in frontend

* Remove translation artifact

* Rename team -> organization

* Add database migrations and run once on startup

* This commit also applies the new by_one_worker decorator to other
asyncio tasks to prevent heavy tasks from being run in each worker.

* Run black, pylint, and husky via pre-commit

* Set db version and use in migrations

* Update and prepare database in single task

* Migrate k8s configmaps
2023-01-18 14:51:04 -08:00

84 lines
1.9 KiB
YAML

# Kubernetes Job template (Jinja2) that runs the btrixcloud.k8s.profile_job
# module in a single container.
#
# Every templated scalar is double-quoted so the rendered value is always
# parsed as a YAML string: Kubernetes requires label values and env values to
# be strings, and an unquoted empty, numeric-looking or boolean-looking
# substitution would otherwise be retyped by the YAML parser.
apiVersion: batch/v1
kind: Job
metadata:
  name: "job-{{ id }}"
  labels:
    btrix.profile: "1"
    btrix.org: "{{ oid }}"
    btrix.user: "{{ userid }}"
    {%- if baseprofile %}
    btrix.baseprofile: "{{ baseprofile }}"
    {%- endif %}

spec:
  template:
    metadata:
      # Pod labels mirror the Job labels above.
      labels:
        btrix.profile: "1"
        btrix.org: "{{ oid }}"
        btrix.user: "{{ userid }}"
        {%- if baseprofile %}
        btrix.baseprofile: "{{ baseprofile }}"
        {%- endif %}

    spec:
      restartPolicy: OnFailure

      # Soft preference (not a hard requirement) for nodes whose nodeType
      # label matches the configured crawler node type.
      affinity:
        nodeAffinity:
          preferredDuringSchedulingIgnoredDuringExecution:
            - weight: 1
              preference:
                matchExpressions:
                  - key: nodeType
                    operator: In
                    values:
                      - "{{ crawler_node_type }}"

      # NOTE(review): the tolerated taint value is hard-coded to "crawling"
      # while the affinity above uses the templated crawler node type --
      # confirm whether these are meant to stay independent.
      tolerations:
        - key: "nodeType"
          operator: "Equal"
          value: "crawling"
          effect: "NoSchedule"

      containers:
        - name: crawl-job
          image: "{{ job_image }}"
          imagePullPolicy: IfNotPresent
          command: ["python", "-m", "btrixcloud.k8s.profile_job"]

          volumeMounts:
            - name: config-volume
              mountPath: /config

          env:
            # Read from the pod's own "job-name" label via the downward API.
            - name: JOB_ID
              valueFrom:
                fieldRef:
                  fieldPath: metadata.labels['job-name']

            - name: STORE_PATH
              value: "{{ storage_path }}"

            - name: STORAGE_NAME
              value: "{{ storage_name }}"

            - name: IDLE_TIMEOUT
              value: "{{ idle_timeout }}"

            - name: START_URL
              value: "{{ url }}"

            - name: PROFILE_PATH
              value: "{{ profile_path }}"

      # Exposes only the config.yaml key of the shared-job-config ConfigMap,
      # mounted into the container at /config.
      volumes:
        - name: config-volume
          configMap:
            name: shared-job-config
            items:
              - key: config.yaml
                path: config.yaml