My solution to this problem is:
from airflow.utils.db import provide_session
from airflow.models import XCom
# The `...` stands in for the DAG constructor arguments, which this snippet omits.
dag = DAG(...)
@provide_session
def cleanup_xcom(session=None, **context):
    """Delete every XCom row recorded for the DAG this task belongs to.

    Args:
        session: SQLAlchemy session. Callers leave it as ``None`` so that
            the ``provide_session`` decorator supplies one.
        **context: Task context passed in by the operator; the ``"dag"``
            entry is read to determine the dag_id.
    """
    # Use the public ``dag_id`` property rather than the private ``_dag_id``.
    dag_id = context["dag"].dag_id
    # Removes ALL XCom rows with this dag_id, not only those of the current run.
    session.query(XCom).filter(XCom.dag_id == dag_id).delete()
# Task wrapping cleanup_xcom; provide_context=True asks the operator to pass
# the task context to the callable as keyword arguments.
clean_xcom = PythonOperator(
    dag=dag,
    task_id="clean_xcom",
    provide_context=True,
    python_callable=cleanup_xcom,
)

# Bare reference only: this snippet declares no upstream/downstream dependencies.
clean_xcom
In Airflow 2.1.x, the code below does not seem to work:
from airflow.models import DAG
from airflow.utils.db import provide_session
from airflow.models import XCom
# Callback variant: deletes the XCom rows whose dag_id matches the one read
# from the callback context.
# NOTE(review): `session` defaults to None and is presumably supplied by
# provide_session when the caller omits it — confirm.
@provide_session
def cleanup_xcom(context, session=None):
# NOTE(review): context["ti"] is presumably a TaskInstance object rather than
# a dict, so the ["dag_id"] subscript would raise TypeError; attribute access
# (context["ti"].dag_id) looks like what was intended — confirm.
dag_id = context["ti"]["dag_id"]
# Deletes every XCom row with this dag_id (the filter has no other condition).
session.query(XCom).filter(XCom.dag_id == dag_id).delete()
# Registers cleanup_xcom as the DAG-level success callback.
# The `...` stands in for the remaining DAG arguments, which this snippet omits.
dag = DAG( ...
on_success_callback=cleanup_xcom,
)
so I changed it to the following, which runs the cleanup as a regular task inside the DAG:
from airflow.models import DAG
from airflow.utils.db import provide_session
from airflow.models import XCom
from airflow.operators.python import PythonOperator
from airflow.operators.dummy import DummyOperator
from airflow.utils.dates import days_ago
with DAG(dag_id="cleanup_xcom_demo", schedule_interval=None, start_date=days_ago(2)) as dag:

    @provide_session
    def cleanup_xcom(session=None, **context):
        """Delete every XCom row stored for the DAG of the running task.

        Args:
            session: SQLAlchemy session. Callers leave it as ``None`` so
                that the ``provide_session`` decorator supplies one.
            **context: Task context passed in by the operator; the
                ``"dag"`` entry is read to determine the dag_id.
        """
        # Use the public ``dag_id`` property rather than the private ``_dag_id``.
        dag_id = context["dag"].dag_id
        # Deletes ALL XCom rows with this dag_id, across every run of the DAG.
        session.query(XCom).filter(XCom.dag_id == dag_id).delete()

    # ``provide_context`` is intentionally not passed: Airflow 2 deprecates it
    # and hands the task context to the callable automatically.
    clean_xcom = PythonOperator(
        task_id="clean_xcom",
        python_callable=cleanup_xcom,
    )

    start = DummyOperator(task_id="start")
    # "none_failed": run as long as no upstream task has failed.
    end = DummyOperator(task_id="end", trigger_rule="none_failed")

    start >> clean_xcom >> end