From 4a879e62d4172f77cbae1ce1f5d4d417b8b8befd Mon Sep 17 00:00:00 2001
From: Arthur Chan
Date: Wed, 1 Jun 2022 09:42:09 +0100
Subject: [PATCH] airflow-py: initial integration (#7731)

* airflow-py: initial integration

initial fuzzer setup

* Fix fuzzer
---
 projects/airflow/Dockerfile   | 26 ++++++++++++++++
 projects/airflow/build.sh     | 25 +++++++++++++++
 projects/airflow/dag_fuzz.py  | 62 ++++++++++++++++++++++++++++++++++++++
 projects/airflow/project.yaml | 11 +++++++
 4 files changed, 124 insertions(+)
 create mode 100644 projects/airflow/Dockerfile
 create mode 100644 projects/airflow/build.sh
 create mode 100644 projects/airflow/dag_fuzz.py
 create mode 100644 projects/airflow/project.yaml

diff --git a/projects/airflow/Dockerfile b/projects/airflow/Dockerfile
new file mode 100644
index 000000000..08a190396
--- /dev/null
+++ b/projects/airflow/Dockerfile
@@ -0,0 +1,26 @@
+# Copyright 2022 Google LLC.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+################################################################################
+
+FROM gcr.io/oss-fuzz-base/base-builder-python
+
+RUN apt-get update && apt-get install -y sqlite3
+RUN pip3 install --upgrade pip
+
+RUN git clone https://github.com/apache/airflow
+ENV AIRFLOW_HOME=$SRC/airflow/
+WORKDIR airflow
+
+COPY build.sh dag_fuzz.py $SRC/
diff --git a/projects/airflow/build.sh b/projects/airflow/build.sh
new file mode 100644
index 000000000..e72d693bc
--- /dev/null
+++ b/projects/airflow/build.sh
@@ -0,0 +1,25 @@
+#!/bin/bash -eu
+# Copyright 2022 Google LLC.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+################################################################################
+
+# Build and install project (using current CFLAGS, CXXFLAGS).
+pip3 install --upgrade pip
+pip3 install colorlog
+pip3 install .
+
+# Build fuzzers in $OUT.
+cd $SRC
+compile_python_fuzzer dag_fuzz.py --add-data airflow:airflow --add-data airflow/airflow:airflow
diff --git a/projects/airflow/dag_fuzz.py b/projects/airflow/dag_fuzz.py
new file mode 100644
index 000000000..7ddde679e
--- /dev/null
+++ b/projects/airflow/dag_fuzz.py
@@ -0,0 +1,62 @@
+#!/usr/bin/python3
+
+# Copyright 2022 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import sys
+import atheris
+import colorlog
+from datetime import datetime, timedelta
+with atheris.instrument_imports():
+    import airflow
+    from airflow import DAG
+    from airflow.exceptions import AirflowException
+    from airflow.operators.dummy_operator import DummyOperator
+    from airflow.operators.python_operator import PythonOperator
+
+def py_func():
+    """No-op callable handed to the PythonOperator task."""
+    return
+
+def TestInput(input_bytes):
+    """Build a two-task DAG whose names and settings come from fuzzer bytes."""
+    fdp = atheris.FuzzedDataProvider(input_bytes)
+
+    default_args = {
+        'owner': fdp.ConsumeString(8),
+        'depends_on_past': fdp.ConsumeBool(),
+        'start_date': airflow.utils.dates.days_ago(fdp.ConsumeIntInRange(1,5)),
+        'email': [fdp.ConsumeString(8)],
+        'email_on_failure': fdp.ConsumeBool(),
+        'email_on_retry': fdp.ConsumeBool(),
+        'retries': fdp.ConsumeIntInRange(1,5),
+        'retry_delay': timedelta(minutes=fdp.ConsumeIntInRange(1,5)),
+    }
+
+    try:
+        with DAG(fdp.ConsumeString(8), schedule_interval='@daily', default_args=default_args) as dag:
+            dummy_task = DummyOperator(task_id=fdp.ConsumeString(8), retries=fdp.ConsumeIntInRange(1,5))
+            python_task = PythonOperator(task_id=fdp.ConsumeString(8), python_callable=py_func)
+
+            dummy_task >> python_task
+    except AirflowException:
+        # Treated as an expected rejection of the generated input, not a finding.
+        pass
+
+def main():
+    """Register TestInput with Atheris and start the fuzzing loop."""
+    atheris.Setup(sys.argv, TestInput, enable_python_coverage=True)
+    atheris.Fuzz()
+
+if __name__ == "__main__":
+    main()
diff --git a/projects/airflow/project.yaml b/projects/airflow/project.yaml
new file mode 100644
index 000000000..36a72d460
--- /dev/null
+++ b/projects/airflow/project.yaml
@@ -0,0 +1,11 @@
+fuzzing_engines:
+- libfuzzer
+homepage: https://github.com/apache/airflow
+language: python
+main_repo: https://github.com/apache/airflow
+sanitizers:
+- address
+vendor_ccs:
+- david@adalogics.com
+- adam@adalogics.com
+- arthur.chan@adalogics.com