Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Added a tolerance to run on a dedicated node for stacking. #316

Open
wants to merge 2 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion banzai/celery.py
Original file line number Diff line number Diff line change
Expand Up @@ -116,7 +116,8 @@ def schedule_calibration_stacking(site: str, runtime_context: dict, min_date=Non
'instrument': instrument.camera, 'frame_type': frame_type})
stack_calibrations.apply_async(args=(stacking_min_date, stacking_max_date, instrument.id, frame_type,
vars(runtime_context), blocks_for_calibration),
countdown=message_delay_in_seconds)
countdown=message_delay_in_seconds,
queue=runtime_context.CELERY_STACK_QUEUE_NAME)
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This queue also needs to be added to the app.conf

https://docs.celeryproject.org/en/stable/userguide/routing.html#manual-routing

else:
logger.warning('No scheduled calibration blocks found.',
extra_tags={'site': site, 'min_date': min_date, 'max_date': max_date,
Expand Down
2 changes: 2 additions & 0 deletions banzai/settings.py
Original file line number Diff line number Diff line change
Expand Up @@ -143,3 +143,5 @@
LOSSLESS_EXTENSIONS = []

CELERY_TASK_QUEUE_NAME = os.getenv('CELERY_TASK_QUEUE_NAME', 'celery')

CELERY_STACK_QUEUE_NAME = os.getenv('CELERY_STACK_QUEUE_NAME', 'celery')
8 changes: 5 additions & 3 deletions banzai/tests/test_celery.py
Original file line number Diff line number Diff line change
Expand Up @@ -180,7 +180,8 @@ def setup(self):
self.max_date = '2019-02-20T09:55:09'
self.context = Context({'db_address': 'db_address', 'CALIBRATION_IMAGE_TYPES': ['BIAS'],
'CALIBRATION_STACK_DELAYS': {'BIAS': 300},
'CALIBRATION_STACKER_STAGES': {'BIAS': ['banzai.bias.BiasMaker']}})
'CALIBRATION_STACKER_STAGES': {'BIAS': ['banzai.bias.BiasMaker']},
'CELERY_STACK_QUEUE_NAME': 'celery-stack'})
self.frame_type = 'BIAS'
self.fake_blocks_response_json = fake_blocks_response_json
self.fake_inst = FakeInstrument(site='coj', camera='2m0-SciCam-Spectral', enclosure='clma', telescope='2m0a')
Expand All @@ -198,7 +199,7 @@ def test_submit_stacking_tasks_to_queue_no_delay(self, mock_filter_blocks, mock_
mock_stack_calibrations.assert_called_with(args=(self.min_date, self.max_date, self.fake_inst.id,
self.frame_type, vars(self.context),
mock_filter_blocks.return_value),
countdown=0)
countdown=0, queue='celery-stack')

@mock.patch('banzai.celery.stack_calibrations.apply_async')
@mock.patch('banzai.celery.dbs.get_instruments_at_site')
Expand All @@ -215,7 +216,8 @@ def test_submit_stacking_tasks_to_queue_with_delay(self, mock_filter_blocks, moc
mock_stack_calibrations.assert_called_with(args=(self.min_date, self.max_date, self.fake_inst.id,
self.frame_type, vars(self.context),
mock_filter_blocks.return_value),
countdown=(60+CALIBRATION_STACK_DELAYS['BIAS']))
countdown=(60+CALIBRATION_STACK_DELAYS['BIAS']),
queue='celery-stack')

@mock.patch('banzai.calibrations.make_master_calibrations')
@mock.patch('banzai.celery.dbs.get_individual_cal_frames')
Expand Down
2 changes: 2 additions & 0 deletions helm-chart/banzai/templates/_helpers.tpl
Original file line number Diff line number Diff line change
Expand Up @@ -175,6 +175,8 @@ Celery task queue configuration
value: {{ .Values.banzai.queueName | quote }}
- name: CELERY_TASK_QUEUE_NAME
value: {{ .Values.banzai.celeryTaskQueueName | quote }}
- name: CELERY_STACK_QUEUE_NAME
value: {{ .Values.banzai.celeryStackQueueName | quote }}
- name: BANZAI_WORKER_LOGLEVEL
value: {{ .Values.banzai.banzaiWorkerLogLevel | quote }}
{{- end -}}
70 changes: 70 additions & 0 deletions helm-chart/banzai/templates/stacker.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,70 @@
apiVersion: apps/v1
kind: Deployment
metadata:
name: {{ include "banzai.fullname" . -}} -workers
labels:
{{ include "banzai.labels" . | indent 4 }}
spec:
selector:
matchLabels:
app.kubernetes.io/name: {{ include "banzai.name" . }}
app.kubernetes.io/instance: {{ .Release.Name }}
template:
metadata:
labels:
app.kubernetes.io/name: {{ include "banzai.name" . }}
app.kubernetes.io/instance: "{{ .Release.Name }}"
spec:
{{- with .Values.imagePullSecrets }}
imagePullSecrets:
{{- toYaml . | nindent 8 }}
{{- end }}
securityContext:
{{- toYaml .Values.podSecurityContext | nindent 8 }}

containers:
- name: {{ .Chart.Name }}
image: "{{ .Values.image.repository }}:{{ .Values.image.tag }}"
imagePullPolicy: {{ .Values.image.pullPolicy }}
securityContext:
{{- toYaml .Values.securityContext | nindent 12 }}
command:
- "celery"
- "-A"
- "banzai"
- "worker"
- "--concurrency"
- "1"
- "-l"
- "info"
- "-Q"
- "$(CELERY_STACK_QUEUE_NAME)"
env:
- name: OMP_NUM_THREADS
value: "8"
{{- include "banzai.Env" . | nindent 12 }}
resources:
requests:
cpu: "0.3"
memory: "1Gi"
limits:
cpu: "8"
memory: "16Gi"
volumeMounts:
- name: tmp
mountPath: /tmp
readOnly: false
volumes:
- name: tmp
emptyDir:
sizeLimit: 100Gi
{{- with .Values.nodeSelector }}
nodeSelector:
{{- toYaml . | nindent 8 }}
{{- end }}
{{- with .Values.affinity }}
affinity:
{{- toYaml . | nindent 8 }}
{{- end }}
tolerations:
- dedicated: "banzai-disk"
1 change: 1 addition & 0 deletions helm-chart/banzai/values-dev.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,7 @@ banzai:
fitsExchange: archived_fits
queueName: banzai_dev_pipeline
celeryTaskQueueName: banzai_imaging
celeryStackQueueName: banzai_imaging_stacking

# CronJob configuration to periodically update instrument table in BANZAI DB
instrumentTableCronjob:
Expand Down
1 change: 1 addition & 0 deletions helm-chart/banzai/values-prod.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,7 @@ banzai:
fitsExchange: archived_fits
queueName: banzai_pipeline
celeryTaskQueueName: banzai_imaging
celeryStackQueueName: banzai_imaging_stacking

# CronJob configuration to periodically update instrument table in BANZAI DB
instrumentTableCronjob:
Expand Down