dask: initial integration (#7688)

* dask: initial integration

* dask: add fuse fuzzer

* update project yaml to match
https://github.com/google/oss-fuzz/pull/7698
This commit is contained in:
DavidKorczynski 2022-05-24 03:06:25 +01:00 committed by GitHub
parent dd9f2c2778
commit 94b400c520
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
5 changed files with 177 additions and 0 deletions

22
projects/dask/Dockerfile Normal file
View File

@ -0,0 +1,22 @@
# Copyright 2022 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
################################################################################
FROM gcr.io/oss-fuzz-base/base-builder-python
RUN apt-get update && apt-get install -y pkg-config
RUN git clone https://github.com/dask/dask
# Copy every fuzz_*.py harness from the project directory, not just
# fuzz_fuse.py: build.sh compiles whatever matches 'fuzz_*.py' under $SRC, so
# a harness that is not copied here is silently never built.
COPY build.sh fuzz_*.py $SRC/
WORKDIR $SRC/dask

23
projects/dask/build.sh Executable file
View File

@ -0,0 +1,23 @@
#!/bin/bash -eu
# Copyright 2022 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
################################################################################
# Install the package found in the current working directory.
pip3 install .

# Build fuzzers in $OUT.
# $SRC and $fuzzer are quoted so they are not word-split or glob-expanded
# again at the point where they are used.
for fuzzer in $(find "$SRC" -name 'fuzz_*.py'); do
  compile_python_fuzzer "$fuzzer"
done

View File

@ -0,0 +1,76 @@
#!/usr/bin/python3
# Copyright 2022 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import sys
import atheris
import dask
from dask.optimization import (
fuse,
fuse_linear,
)
from dask.utils_test import dec, inc, add
def get_fuse_dict(data):
    """Build a small task graph (a dict) driven by fuzzer input.

    The graph always contains the literal entry ``"a": 1``. Between 1 and 50
    further keys (``"a0"``, ``"a1"``, ...) are then added; each maps to a
    tuple ``(op, earlier_key)`` where ``op`` is one of ``dec``, ``inc`` or
    ``add`` and ``earlier_key`` is any key inserted before it.

    Args:
        data: Either the raw fuzzer input (``bytes``/``bytearray``) or an
            already constructed ``atheris.FuzzedDataProvider``. Passing a
            provider lets the caller keep consuming from the same stream
            afterwards instead of re-reading bytes already used here.

    Returns:
        The generated dict; it is never empty.
    """
    if isinstance(data, (bytes, bytearray)):
        fdp = atheris.FuzzedDataProvider(data)
    else:
        fdp = data

    operations = [dec, inc, add]
    key = "a"
    fuse_dict = {key: 1}
    previous_keys = [key]

    number_of_entries = fdp.ConsumeIntInRange(1, 50)
    for i in range(number_of_entries):
        newk = key + str(i)
        val_op = operations[fdp.ConsumeIntInRange(0, 2)]
        # Only reference keys that already exist, so every dependency
        # resolves inside the graph.
        val_id = previous_keys[fdp.ConsumeIntInRange(0, len(previous_keys) - 1)]
        fuse_dict[newk] = (val_op, val_id)
        previous_keys.append(newk)
    return fuse_dict


@atheris.instrument_func
def TestOneInput(data):
    """Fuzz entry point: run ``fuse`` or ``fuse_linear`` on a generated graph.

    Inputs shorter than 10 bytes are ignored. Otherwise a graph is built
    with ``get_fuse_dict`` and one of the two optimizations is called with a
    fuzzer-chosen ``rename_keys`` flag.
    """
    if len(data) < 10:
        return

    # A single provider is shared with get_fuse_dict. Two providers over the
    # same buffer would hand out the same bytes twice, tying the choice of
    # target and rename_keys to the bytes that shaped the graph.
    fdp = atheris.FuzzedDataProvider(data)
    fuzzed_dict = get_fuse_dict(fdp)

    target = fuse if fdp.ConsumeBool() else fuse_linear
    target(fuzzed_dict, rename_keys=fdp.ConsumeBool())
def main():
    """Instrument code, register ``TestOneInput`` with atheris and fuzz."""
    atheris.instrument_all()
    argv = sys.argv
    atheris.Setup(argv, TestOneInput, enable_python_coverage=True)
    atheris.Fuzz()


if __name__ == "__main__":
    main()

View File

@ -0,0 +1,45 @@
#!/usr/bin/python3
# Copyright 2022 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import sys
import atheris
import json
from dask.config import (
deserialize,
serialize
)
@atheris.instrument_func
def TestOneInput(data):
    """Fuzz entry point: round-trip a JSON object through dask.config.

    The fuzzer input is decoded as JSON. If it parses to a dict, the dict is
    passed through ``serialize`` and the result through ``deserialize``.
    Inputs that are not valid JSON, or whose top-level value is not a dict,
    are ignored.
    """
    fdp = atheris.FuzzedDataProvider(data)
    try:
        fuzzed_dict = json.loads(fdp.ConsumeString(sys.maxsize))
    except (json.JSONDecodeError, RecursionError):
        # RecursionError comes from the json decoder on deeply nested input.
        # That is a limit of the harness's own parsing step, not a finding
        # in the code under test, so it is treated like invalid JSON.
        return
    if not isinstance(fuzzed_dict, dict):
        return

    # Only exceptions matter here; the round-tripped value is discarded.
    deserialize(serialize(fuzzed_dict))
def main():
    """Set up atheris with ``TestOneInput`` as the harness and start fuzzing."""
    # Instrumentation is requested before Setup, as in the original order.
    atheris.instrument_all()
    cli_args = sys.argv
    atheris.Setup(cli_args, TestOneInput, enable_python_coverage=True)
    atheris.Fuzz()


if __name__ == "__main__":
    main()

View File

@ -0,0 +1,11 @@
# Upstream project locations (both point at the dask GitHub repository).
homepage: "https://github.com/dask/dask"
main_repo: "https://github.com/dask/dask"
language: python
# Fuzzing engine and sanitizer configurations requested for this project.
fuzzing_engines:
- libfuzzer
sanitizers:
- address
- undefined
# NOTE(review): presumably these addresses are CC'd on findings - confirm
# against the OSS-Fuzz project.yaml documentation.
vendor_ccs:
- david@adalogics.com
- adam@adalogics.com