Skip to content

Commit

Permalink
Add support to Aggregation Fuzzer to call Presto java and setup CI run.
Browse files Browse the repository at this point in the history
  • Loading branch information
kgpai committed Dec 9, 2023
1 parent e40ae26 commit d8b4822
Show file tree
Hide file tree
Showing 2 changed files with 177 additions and 10 deletions.
153 changes: 153 additions & 0 deletions .github/workflows/experimental.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,153 @@
# Copyright (c) Facebook, Inc. and its affiliates.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

name: "Experimental Fuzzer Jobs"

on:
pull_request:
paths:
- ".github/workflows/experimental.yml"

schedule:
- cron: '0 1 * * *'

workflow_dispatch:
inputs:
ref:
description: 'Ref to check out'
default: 'main'
numThreads:
description: 'Number of threads'
default: 16
maxHighMemJobs:
description: 'Number of high memory jobs'
default: 8
maxLinkJobs:
description: 'Maximum number of link jobs'
default: 4
extraCMakeFlags:
description: 'Additional CMake flags'
default: ''

defaults:
run:
shell: bash

permissions:
contents: read

jobs:
# Builds Velox in debug mode and publishes the fuzzer binaries as artifacts.
compile:
runs-on: 8-core
timeout-minutes: 120
env:
CCACHE_DIR: "${{ github.workspace }}/.ccache/"
CCACHE_BASEDIR: "${{ github.workspace }}"
LINUX_DISTRO: "ubuntu"
steps:

- name: "Restore ccache"
uses: actions/cache@v3
with:
path: "${{ env.CCACHE_DIR }}"
# We are using the benchmark ccache as it has all
# required features enabled, so no need to create a new one
key: ccache-benchmark-${{ github.sha }}
restore-keys: |
ccache-benchmark-
# The repository is checked out into ./velox; the `ref` input is used when
# provided, otherwise 'main'.
- name: "Checkout Repo"
uses: actions/checkout@v3
with:
path: velox
submodules: 'recursive'
ref: "${{ inputs.ref || 'main' }}"

- name: "Install dependencies"
run: cd velox && source ./scripts/setup-ubuntu.sh

# Job counts come from the workflow inputs when they are set and otherwise
# fall back to 8 threads / 8 high-memory jobs / 4 link jobs.
# -DVELOX_ENABLE_ARROW=ON is always passed; extraCMakeFlags is appended to it.
- name: "Build"
run: |
cd velox
make debug NUM_THREADS="${{ inputs.numThreads || 8 }}" MAX_HIGH_MEM_JOBS="${{ inputs.maxHighMemJobs || 8 }}" MAX_LINK_JOBS="${{ inputs.maxLinkJobs || 4 }}" EXTRA_CMAKE_FLAGS="-DVELOX_ENABLE_ARROW=ON ${{ inputs.extraCMakeFlags }}"
ccache -s
# The remaining steps upload the built fuzzer binaries under the artifact
# names presto, spark, aggregation and join.
- name: Upload presto fuzzer
uses: actions/upload-artifact@v3
with:
name: presto
path: velox/_build/debug/velox/expression/tests/velox_expression_fuzzer_test

- name: Upload spark fuzzer
uses: actions/upload-artifact@v3
with:
name: spark
path: |
velox/_build/debug/velox/expression/tests/spark_expression_fuzzer_test
velox/_build/debug/velox/expression/tests/spark_aggregation_fuzzer_test
- name: Upload aggregation fuzzer
uses: actions/upload-artifact@v3
with:
name: aggregation
path: velox/_build/debug/velox/exec/tests/velox_aggregation_fuzzer_test

- name: Upload join fuzzer
uses: actions/upload-artifact@v3
with:
name: join
path: velox/_build/debug/velox/exec/tests/velox_join_fuzzer_test

# Runs the aggregation fuzzer binary produced by the `compile` job inside the
# velox-dev:presto-java container, passing
# --prestoCoordinatorUri=http://127.0.0.1:8080 to it.
# NOTE(review): no step in this job visibly starts a Presto server on
# 127.0.0.1:8080; presumably the container image is expected to provide one —
# confirm before relying on this job.
presto-java-aggregation-fuzzer-run:
runs-on: ubuntu-latest
container: ghcr.io/facebookincubator/velox-dev:presto-java
needs: compile
timeout-minutes: 120
steps:

- name: "Checkout Repo"
uses: actions/checkout@v3
with:
ref: "${{ inputs.ref || 'main' }}"

- name: "Install dependencies"
run: source ./scripts/setup-ubuntu.sh

# Fetches the artifact named `aggregation`, which the compile job uploads.
- name: Download aggregation fuzzer
uses: actions/download-artifact@v3
with:
name: aggregation

# The fuzzer is invoked with a random seed and --duration_sec 3600, and
# /tmp/aggregate_fuzzer_repro is passed as --repro_persist_path.
- name: "Run Aggregate Fuzzer"
run: |
mkdir -p /tmp/aggregate_fuzzer_repro/
rm -rfv /tmp/aggregate_fuzzer_repro/*
chmod -R 777 /tmp/aggregate_fuzzer_repro
chmod +x velox_aggregation_fuzzer_test
./velox_aggregation_fuzzer_test \
--seed ${RANDOM} \
--duration_sec 3600 \
--logtostderr=1 \
--minloglevel=0 \
--repro_persist_path=/tmp/aggregate_fuzzer_repro \
--prestoCoordinatorUri=http://127.0.0.1:8080 \
&& echo -e "\n\nAggregation fuzzer run finished successfully."
# `if: always()` makes this step run even when an earlier step failed, so
# the repro directory is uploaded either way.
- name: Archive aggregate production artifacts
if: always()
uses: actions/upload-artifact@v3
with:
name: aggregate-fuzzer-failure-artifacts
path: |
/tmp/aggregate_fuzzer_repro
34 changes: 24 additions & 10 deletions velox/exec/tests/AggregationFuzzerTest.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,7 @@
#include "velox/exec/tests/utils/AssertQueryBuilder.h"
#include "velox/exec/tests/utils/DuckQueryRunner.h"
#include "velox/exec/tests/utils/PlanBuilder.h"
#include "velox/exec/tests/utils/PrestoQueryRunner.h"
#include "velox/functions/prestosql/aggregates/RegisterAggregateFunctions.h"
#include "velox/functions/prestosql/registration/RegistrationFunctions.h"
#include "velox/functions/prestosql/window/WindowFunctionsRegistration.h"
Expand All @@ -43,6 +44,11 @@ DEFINE_string(
"this comma separated list of function names "
"(e.g: --only \"min\" or --only \"sum,avg\").");

// URI (including port) of the Presto coordinator to use as the reference
// query runner. When left empty (the default), main() constructs a
// DuckQueryRunner instead of a PrestoQueryRunner.
DEFINE_string(
    prestoCoordinatorUri,
    "",
    "Presto coordinator URI, along with port. If this is set, we use Presto "
    "as the source of truth; otherwise, we use DuckDB. Example: "
    "--prestoCoordinatorUri=http://127.0.0.1:8080");

namespace facebook::velox::exec::test {
namespace {

Expand Down Expand Up @@ -835,15 +841,23 @@ int main(int argc, char** argv) {

size_t initialSeed = FLAGS_seed == 0 ? std::time(nullptr) : FLAGS_seed;

auto duckQueryRunner =
std::make_unique<facebook::velox::exec::test::DuckQueryRunner>();
duckQueryRunner->disableAggregateFunctions({
"skewness",
// DuckDB results on constant inputs are incorrect. Should be NaN,
// but DuckDB returns some random value.
"kurtosis",
"entropy",
});
std::unique_ptr<facebook::velox::exec::test::ReferenceQueryRunner> runner;

if (FLAGS_prestoCoordinatorUri.empty()) {
auto duckQueryRunner =
std::make_unique<facebook::velox::exec::test::DuckQueryRunner>();
duckQueryRunner->disableAggregateFunctions({
"skewness",
// DuckDB results on constant inputs are incorrect. Should be NaN,
// but DuckDB returns some random value.
"kurtosis",
"entropy",
});
runner = std::move(duckQueryRunner);
} else {
runner = std::make_unique<facebook::velox::exec::test::PrestoQueryRunner>(
FLAGS_prestoCoordinatorUri, "aggregation_fuzzer");
}

// List of functions that have known bugs that cause crashes or failures.
static const std::unordered_set<std::string> skipFunctions = {
Expand Down Expand Up @@ -914,5 +928,5 @@ int main(int argc, char** argv) {
facebook::velox::exec::test::getCustomInputGenerators();
options.timestampPrecision =
facebook::velox::VectorFuzzer::Options::TimestampPrecision::kMilliSeconds;
return Runner::run(initialSeed, std::move(duckQueryRunner), options);
return Runner::run(initialSeed, std::move(runner), options);
}

0 comments on commit d8b4822

Please sign in to comment.