Skip to content

Commit 04eb548

Browse files
sambhav13 and sambhav13 authored
fix: Remove job_start_event and job_end_event from airflow dag templates (#768)
Co-authored-by: sambhav13 <[email protected]>
1 parent 3ec5e08 commit 04eb548

File tree

2 files changed: +23 -65 lines changed

2 files changed

+23
-65
lines changed

Diff for: ext/scheduler/airflow2/resources/base_dag.py

+12-33
Original file line numberDiff line numberDiff line change
@@ -13,14 +13,10 @@
1313
from __lib import optimus_sla_miss_notify, SuperKubernetesPodOperator, \
1414
SuperExternalTaskSensor, ExternalHttpSensor
1515

16-
from __lib import JOB_START_EVENT_NAME, \
17-
JOB_END_EVENT_NAME, \
18-
log_start_event, \
19-
log_success_event, \
16+
from __lib import log_success_event, \
2017
log_retry_event, \
2118
log_failure_event, \
22-
EVENT_NAMES, \
23-
log_job_end, log_job_start
19+
EVENT_NAMES
2420

2521
SENSOR_DEFAULT_POKE_INTERVAL_IN_SECS = int(Variable.get("sensor_poke_interval_in_secs", default_var=15 * 60))
2622
SENSOR_DEFAULT_TIMEOUT_IN_SECS = int(Variable.get("sensor_timeout_in_secs", default_var=15 * 60 * 60))
@@ -69,23 +65,6 @@
6965
]
7066
)
7167

72-
publish_job_start_event = PythonOperator(
73-
task_id = JOB_START_EVENT_NAME,
74-
python_callable = log_job_start,
75-
provide_context=True,
76-
depends_on_past=False,
77-
dag=dag
78-
)
79-
80-
publish_job_end_event = PythonOperator(
81-
task_id = JOB_END_EVENT_NAME,
82-
python_callable = log_job_end,
83-
provide_context=True,
84-
trigger_rule= 'all_success',
85-
depends_on_past=False,
86-
dag=dag
87-
)
88-
8968
{{$baseTaskSchema := .Job.Task.Unit.Info -}}
9069
{{- $setCPURequest := not (empty .Metadata.Resource.Request.CPU) -}}
9170
{{- $setMemoryRequest := not (empty .Metadata.Resource.Request.Memory) -}}
@@ -299,33 +278,33 @@
299278

300279
# upstream sensors -> base transformation task
301280
{{- range $i, $t := $.Job.Dependencies }}
302-
publish_job_start_event >> wait_{{ $t.Job.Name | replace "-" "__dash__" | replace "." "__dot__" }} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
281+
wait_{{ $t.Job.Name | replace "-" "__dash__" | replace "." "__dot__" }} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
303282
{{- end}}
304283
{{- range $_, $t := $.Job.ExternalDependencies.HTTPDependencies }}
305-
publish_job_start_event >> wait_{{ $t.Name }} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
284+
wait_{{ $t.Name }} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
306285
{{- end}}
307286
{{- range $_, $dependency := $.Job.ExternalDependencies.OptimusDependencies}}
308287
{{ $identity := print $dependency.Name "-" $dependency.ProjectName "-" $dependency.JobName }}
309-
publish_job_start_event >> wait_{{ $identity | replace "-" "__dash__" | replace "." "__dot__" }} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
288+
wait_{{ $identity | replace "-" "__dash__" | replace "." "__dot__" }} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
310289
{{- end}}
311290
{{if and (not $.Job.Dependencies) (not $.Job.ExternalDependencies.HTTPDependencies) (not $.Job.ExternalDependencies.OptimusDependencies)}}
312291
# if no sensor and dependency is configured
313-
publish_job_start_event >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
292+
transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
314293
{{end}}
315294
# post completion hook
316-
transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}} >> publish_job_end_event
295+
transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
317296

318297
# set inter-dependencies between task and hooks
319298
{{- range $_, $task := .Job.Hooks }}
320299
{{- $hookSchema := $task.Unit.Info }}
321300
{{- if eq $hookSchema.HookType $.HookTypePre }}
322-
publish_job_start_event >> hook_{{$hookSchema.Name | replace "-" "__dash__"}} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
301+
hook_{{$hookSchema.Name | replace "-" "__dash__"}} >> transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}}
323302
{{- end -}}
324303
{{- if eq $hookSchema.HookType $.HookTypePost }}
325-
transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}} >> hook_{{$hookSchema.Name | replace "-" "__dash__"}} >> publish_job_end_event
304+
transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}} >> hook_{{$hookSchema.Name | replace "-" "__dash__"}}
326305
{{- end -}}
327306
{{- if eq $hookSchema.HookType $.HookTypeFail }}
328-
transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}} >> hook_{{$hookSchema.Name | replace "-" "__dash__"}} >> publish_job_end_event
307+
transformation_{{$baseTaskSchema.Name | replace "-" "__dash__" | replace "." "__dot__"}} >> hook_{{$hookSchema.Name | replace "-" "__dash__"}}
329308
{{- end -}}
330309
{{- end }}
331310

@@ -334,7 +313,7 @@
334313
{{- $hookSchema := $t.Unit.Info }}
335314
{{- range $_, $depend := $t.DependsOn }}
336315
{{- $dependHookSchema := $depend.Unit.Info }}
337-
hook_{{$dependHookSchema.Name | replace "-" "__dash__"}} >> hook_{{$hookSchema.Name | replace "-" "__dash__"}} >> publish_job_end_event
316+
hook_{{$dependHookSchema.Name | replace "-" "__dash__"}} >> hook_{{$hookSchema.Name | replace "-" "__dash__"}}
338317
{{- end }}
339318
{{- end }}
340319

@@ -349,7 +328,7 @@
349328
{{- $fhookSchema := $ftask.Unit.Info }}
350329
{{- if eq $fhookSchema.HookType $.HookTypeFail }} hook_{{$fhookSchema.Name | replace "-" "__dash__"}}, {{- end -}}
351330
{{- end -}}
352-
] >> publish_job_end_event
331+
]
353332

354333
{{- end -}}
355334

Diff for: ext/scheduler/airflow2/resources/expected_compiled_template.py

+11-32
Original file line numberDiff line numberDiff line change
@@ -13,14 +13,10 @@
1313
from __lib import optimus_sla_miss_notify, SuperKubernetesPodOperator, \
1414
SuperExternalTaskSensor, ExternalHttpSensor
1515

16-
from __lib import JOB_START_EVENT_NAME, \
17-
JOB_END_EVENT_NAME, \
18-
log_start_event, \
19-
log_success_event, \
16+
from __lib import log_success_event, \
2017
log_retry_event, \
2118
log_failure_event, \
22-
EVENT_NAMES, \
23-
log_job_end, log_job_start
19+
EVENT_NAMES
2420

2521
SENSOR_DEFAULT_POKE_INTERVAL_IN_SECS = int(Variable.get("sensor_poke_interval_in_secs", default_var=15 * 60))
2622
SENSOR_DEFAULT_TIMEOUT_IN_SECS = int(Variable.get("sensor_timeout_in_secs", default_var=15 * 60 * 60))
@@ -61,23 +57,6 @@
6157
]
6258
)
6359

64-
publish_job_start_event = PythonOperator(
65-
task_id = JOB_START_EVENT_NAME,
66-
python_callable = log_job_start,
67-
provide_context=True,
68-
depends_on_past=False,
69-
dag=dag
70-
)
71-
72-
publish_job_end_event = PythonOperator(
73-
task_id = JOB_END_EVENT_NAME,
74-
python_callable = log_job_end,
75-
provide_context=True,
76-
trigger_rule= 'all_success',
77-
depends_on_past=False,
78-
dag=dag
79-
)
80-
8160

8261
JOB_DIR = "/data"
8362
IMAGE_PULL_POLICY="IfNotPresent"
@@ -315,22 +294,22 @@
315294
####################################
316295

317296
# upstream sensors -> base transformation task
318-
publish_job_start_event >> wait_foo__dash__intra__dash__dep__dash__job >> transformation_bq
319-
publish_job_start_event >> wait_foo__dash__inter__dash__dep__dash__job >> transformation_bq
297+
wait_foo__dash__intra__dash__dep__dash__job >> transformation_bq
298+
wait_foo__dash__inter__dash__dep__dash__job >> transformation_bq
320299

321-
publish_job_start_event >> wait_external__dash__optimus__dash__foo__dash__external__dash__optimus__dash__project__dash__foo__dash__external__dash__optimus__dash__dep__dash__job >> transformation_bq
300+
wait_external__dash__optimus__dash__foo__dash__external__dash__optimus__dash__project__dash__foo__dash__external__dash__optimus__dash__dep__dash__job >> transformation_bq
322301

323302
# post completion hook
324-
transformation_bq >> publish_job_end_event
303+
transformation_bq
325304

326305
# set inter-dependencies between task and hooks
327-
publish_job_start_event >> hook_transporter >> transformation_bq
328-
transformation_bq >> hook_predator >> publish_job_end_event
329-
transformation_bq >> hook_hook__dash__for__dash__fail >> publish_job_end_event
306+
hook_transporter >> transformation_bq
307+
transformation_bq >> hook_predator
308+
transformation_bq >> hook_hook__dash__for__dash__fail
330309

331310
# set inter-dependencies between hooks and hooks
332-
hook_transporter >> hook_predator >> publish_job_end_event
311+
hook_transporter >> hook_predator
333312

334313
# arrange failure hook after post hooks
335314

336-
hook_predator >> [ hook_hook__dash__for__dash__fail,] >> publish_job_end_event
315+
hook_predator >> [ hook_hook__dash__for__dash__fail,]

0 commit comments

Comments
 (0)