diff options
author | Roman Wagner <roman.wagner18@gmx.de> | 2021-05-12 21:13:48 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2021-05-12 12:13:48 -0700 |
commit | 87eeb3aa8691e1c286749a3726bfb42f4c4a6a94 (patch) | |
tree | a70182befe706d1a77f68975f562a8fe699acaea | |
parent | aac200815a809c03f62cd39c7fc139800be61169 (diff) |
[jsoup] initial integration (#5720)
-rw-r--r-- | projects/jsoup/Dockerfile | 38 | ||||
-rw-r--r-- | projects/jsoup/HtmlFuzzer.java | 25 | ||||
-rw-r--r-- | projects/jsoup/XmlFuzzer.java | 26 | ||||
-rwxr-xr-x | projects/jsoup/build.sh | 52 | ||||
-rw-r--r-- | projects/jsoup/project.yaml | 11 |
5 files changed, 152 insertions, 0 deletions
diff --git a/projects/jsoup/Dockerfile b/projects/jsoup/Dockerfile
new file mode 100644
index 00000000..f9f4a2f1
--- /dev/null
+++ b/projects/jsoup/Dockerfile
@@ -0,0 +1,38 @@
+# Copyright 2021 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+################################################################################
+
+FROM gcr.io/oss-fuzz-base/base-builder
+
+# Pinned Maven comes from the permanent archive (downloads.apache.org drops superseded releases); -f fails on HTTP errors.
+RUN curl -fL https://archive.apache.org/dist/maven/maven-3/3.6.3/binaries/apache-maven-3.6.3-bin.zip -o maven.zip && \
+    unzip maven.zip -d $SRC/maven && \
+    rm -rf maven.zip
+
+ENV MVN=$SRC/maven/apache-maven-3.6.3/bin/mvn
+
+RUN git clone --depth 1 https://github.com/google/fuzzing && \
+    mv fuzzing/dictionaries/html.dict $SRC/HtmlFuzzer.dict && \
+    mv fuzzing/dictionaries/xml.dict $SRC/XmlFuzzer.dict && \
+    rm -rf fuzzing
+
+RUN git clone --depth 1 https://github.com/dvyukov/go-fuzz-corpus && \
+    zip -j $SRC/XmlFuzzer_seed_corpus.zip go-fuzz-corpus/xml/corpus/* && \
+    rm -rf go-fuzz-corpus
+
+RUN git clone --depth 1 https://github.com/jhy/jsoup/
+
+COPY build.sh HtmlFuzzer.java XmlFuzzer.java $SRC/
+WORKDIR $SRC/jsoup
diff --git a/projects/jsoup/HtmlFuzzer.java b/projects/jsoup/HtmlFuzzer.java
new file mode 100644
index 00000000..5f2090e7
--- /dev/null
+++ b/projects/jsoup/HtmlFuzzer.java
@@ -0,0 +1,25 @@
+// Copyright 2021 Google LLC
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+//
+////////////////////////////////////////////////////////////////////////////////
+
+import com.code_intelligence.jazzer.api.FuzzedDataProvider;
+import org.jsoup.Jsoup;
+
+/** Jazzer fuzz target: hands the whole fuzzer input, as one string, to {@code Jsoup.parse(String)}. */
+public class HtmlFuzzer {
+  public static void fuzzerTestOneInput(FuzzedDataProvider data) {
+    Jsoup.parse(data.consumeRemainingAsString());
+  }
+}
diff --git a/projects/jsoup/XmlFuzzer.java b/projects/jsoup/XmlFuzzer.java
new file mode 100644
index 00000000..ddce20be
--- /dev/null
+++ b/projects/jsoup/XmlFuzzer.java
@@ -0,0 +1,26 @@
+// Copyright 2021 Google LLC
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+//
+////////////////////////////////////////////////////////////////////////////////
+
+import com.code_intelligence.jazzer.api.FuzzedDataProvider;
+import org.jsoup.Jsoup;
+import org.jsoup.parser.Parser;
+
+/** Jazzer fuzz target: parses the whole fuzzer input as a string using {@code Parser.xmlParser()} and an empty base URI. */
+public class XmlFuzzer {
+  public static void fuzzerTestOneInput(FuzzedDataProvider data) {
+    Jsoup.parse(data.consumeRemainingAsString(), "", Parser.xmlParser());
+  }
+}
diff --git a/projects/jsoup/build.sh b/projects/jsoup/build.sh
new file mode 100755
index 00000000..4bbe473e
--- /dev/null
+++ b/projects/jsoup/build.sh
@@ -0,0 +1,52 @@
+#!/bin/bash -eu
+# Copyright 2021 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+################################################################################
+
+# Hand the seed corpus archives (*.zip) and dictionaries (*.dict) in $SRC over to $OUT.
+mv $SRC/*.zip $SRC/*.dict $OUT
+
+mvn_flags="-Dmaven.test.skip=true -Djavac.src.version=15 -Djavac.target.version=15"
+$MVN package org.apache.maven.plugins:maven-shade-plugin:3.2.4:shade $mvn_flags
+jsoup_version=$($MVN org.apache.maven.plugins:maven-help-plugin:3.2.0:evaluate \
+  -Dexpression=project.version -q -DforceStdout)
+cp "target/jsoup-${jsoup_version}.jar" $OUT/jsoup.jar
+
+ALL_JARS="jsoup.jar"
+
+# Compile-time classpath: every project jar listed in ALL_JARS (looked up in $OUT)
+# followed by the Jazzer API jar.
+BUILD_CLASSPATH=$(echo $ALL_JARS | xargs printf -- "$OUT/%s:"):$JAZZER_API_PATH
+
+# At runtime every .jar and .class file sits in the same directory as the fuzzer.
+RUNTIME_CLASSPATH=$(echo $ALL_JARS | xargs printf -- "\$this_dir/%s:"):\$this_dir
+
+# Build only fuzzers placed directly in $SRC; javac -d puts every class they produce (nested ones too) in $OUT.
+for fuzzer in $(find $SRC -maxdepth 1 -name '*Fuzzer.java'); do
+  fuzzer_basename=$(basename -s .java $fuzzer)
+  javac -cp $BUILD_CLASSPATH -d $OUT $fuzzer
+
+  # Create an execution wrapper that runs Jazzer for this target and forwards its arguments unsplit ("$@").
+  echo "#!/bin/sh
+# LLVMFuzzerTestOneInput for fuzzer detection.
+this_dir=\$(dirname \"\$0\")
+LD_LIBRARY_PATH=\"$JVM_LD_LIBRARY_PATH\":\$this_dir \
+\$this_dir/jazzer_driver --agent_path=\$this_dir/jazzer_agent_deploy.jar \
+--cp=$RUNTIME_CLASSPATH \
+--target_class=$fuzzer_basename \
+--jvm_args=\"-Xmx2048m\" \
+\"\$@\"" > $OUT/$fuzzer_basename
+  chmod u+x $OUT/$fuzzer_basename
+done
diff --git a/projects/jsoup/project.yaml b/projects/jsoup/project.yaml
new file mode 100644
index 00000000..acd3d211
--- /dev/null
+++ b/projects/jsoup/project.yaml
@@ -0,0 +1,11 @@
+homepage: "https://github.com/jhy/jsoup/"
+language: jvm
+primary_contact: "bm-dev@yandex.com"
+auto_ccs:
+  - "wagner@code-intelligence.com"
+  - "jonathan@hedley.net"
+fuzzing_engines:
+  - libfuzzer
+main_repo: "https://github.com/jhy/jsoup/"
+sanitizers:
+  - address