├── .github └── workflows │ └── ci.yml ├── .gitignore ├── .jvmopts ├── .scalafix.conf ├── Dockerfile ├── Dockerfile-mini ├── LICENSE ├── README.md ├── accelerators ├── comet_env_setup.sh ├── comet_ex.sh ├── gluten_config.properties ├── gluten_env_setup.sh ├── gluten_spark_34_ex.sh ├── install_rust_if_needed.sh ├── run_gluten.sh ├── setup_comet.sh ├── setup_gluten_deps.sh ├── setup_gluten_from_src.sh └── setup_gluten_spark34.sh ├── appveyor.yml ├── c ├── conf ├── log4j.properties └── sbtconfig.txt ├── core └── src │ ├── main │ ├── java │ │ └── com │ │ │ └── highperformancespark │ │ │ └── examples │ │ │ ├── JavaInterop.java │ │ │ ├── WordCount.java │ │ │ ├── dataframe │ │ │ ├── JavaHappyPandas.java │ │ │ ├── JavaLoadSave.java │ │ │ └── JavaUDFs.java │ │ │ ├── ffi │ │ │ └── SumJNIJava.java │ │ │ └── objects │ │ │ ├── JavaCoffeeShop.java │ │ │ ├── JavaPandaInfo.java │ │ │ ├── JavaPandaPlace.java │ │ │ ├── JavaPandas.java │ │ │ └── JavaRawPanda.java │ ├── julia │ │ ├── setup.jl │ │ └── wc.jl │ ├── perl │ │ ├── Changes │ │ ├── MANIFEST │ │ ├── Makefile.PL │ │ ├── README │ │ ├── ghinfo.pl │ │ ├── ignore.txt │ │ ├── lib │ │ │ └── HighPerformanceSpark │ │ │ │ └── Examples.pm │ │ ├── t │ │ │ ├── 00-load.t │ │ │ ├── manifest.t │ │ │ ├── pod-coverage.t │ │ │ └── pod.t │ │ └── xt │ │ │ └── boilerplate.t │ ├── r │ │ ├── dapply.R │ │ └── wc.R │ └── scala │ │ └── com │ │ └── high-performance-spark-examples │ │ ├── dataframe │ │ ├── HappyPandas.scala │ │ ├── LoadSave.scala │ │ ├── MixedDataset.scala │ │ ├── MixedDataset.scala_back │ │ ├── NullabilityFilterOptimizer.scala │ │ ├── RawPandas.scala │ │ ├── RegularSQL.scala │ │ ├── SQLExtension.scala │ │ └── UDFs.scala │ │ ├── errors │ │ └── throws.scala │ │ ├── goldilocks │ │ ├── GoldilocksFirstTry.scala │ │ ├── GoldilocksSecondarySort.scala │ │ ├── GoldilocksWithHashMap.scala │ │ ├── RDDJoinExamples.scala │ │ └── SecondarySort.scala │ │ ├── ml │ │ ├── CustomPipeline.scala │ │ ├── SimpleExport.scala │ │ ├── SimpleNaiveBayes.scala │ │ └── SimplePipeline.scala │ │ ├── mllib │ │ └── GoldilocksMLlib.scala │ │ ├── native │ │ ├── NativeExample.scala │ │ ├── PipeExample.scala │ │ ├── StandAlone.scala │ │ ├── SumFJNA.scala │ │ ├── SumJNA.scala │ │ └── SumJNI.scala │ │ ├── perf │ │ └── SimplePerfTest.scala │ │ ├── streaming │ │ ├── DStream.scala │ │ └── Structured.scala │ │ ├── tokenize │ │ └── SampleTokenize.scala │ │ ├── tools │ │ ├── FilterInvalidPandas.scala │ │ ├── GenerateScalingData.scala │ │ ├── ResourceProfileEx.scala │ │ └── SampleData.scala │ │ ├── transformations │ │ ├── Accumulators.scala │ │ ├── NarrowAndWide.scala │ │ ├── NewAccumulators.scala │ │ └── SmartAggregations.scala │ │ └── wordcount │ │ └── WordCount.scala │ └── test │ ├── java │ └── com │ │ └── highperformancespark │ │ └── examples │ │ ├── JavaInteropTest.java │ │ └── dataframe │ │ └── JavaHappyPandasTest.java │ └── scala │ └── com │ ├── high-performance-spark-examples │ ├── dataframe │ │ ├── HappyPandasTest.scala │ │ ├── MixedDatasetSuite.scala │ │ ├── PandaPlaceFilterPushdown.scala │ │ └── SQLExtensionTest.scala │ ├── errors │ │ └── ThrowsSuite.scala │ ├── goldilocks │ │ ├── EvaluationTests.scala │ │ ├── GoldilocksLargeTests.scala │ │ ├── JoinTest.scala │ │ ├── QuantileOnlyArtisanalTest.scala │ │ └── SortingTests.scala │ ├── ml │ │ ├── CustomPipeline.scala │ │ └── SimpleNaiveBayes.scala │ ├── mllib │ │ └── GoldilocksMLlibSuite.scala │ ├── native │ │ ├── NativeExample.scala │ │ └── PipeExampleSuite.scala │ ├── streaming │ │ └── DStreamSuite.scala │ ├── tokenize │ │ └── SampleTokenizeSuite.scala │ ├── tools │ │ ├── FilterInvalidPandasSuite.scala │ │ └── GenerateScalingDataSuite.scala │ ├── transformations │ │ └── Accumulators.scala │ └── wordcount │ │ └── WordCountTest.scala │ └── highperformancespark │ └── examples │ └── JavaInteropHelper.scala ├── data └── project.csv ├── env_setup.sh ├── high_performance_pyspark └── __init__.py ├── iceberg-workshop-solutions ├── Workshop-Template.ipynb └── Workshop.ipynb ├── migration └── sql.sh ├── misc ├── container_launch.sh └── kernel.json ├── native └── src │ ├── CMakeLists.txt │ ├── c │ ├── gluten │ │ └── GlutenUDF.cpp │ ├── include │ │ └── com_highperformancespark_examples_ffi_SumJNI.h │ ├── sum.c │ ├── sum.h │ ├── sum_wrapper.c │ └── sumf_wrapper.c │ └── fortran │ └── sumf.f95 ├── project ├── build.properties └── plugins.sbt ├── python ├── .flake8 ├── README.md ├── examples │ ├── SQLLineage.py │ ├── __init__.py │ ├── bad_pyspark.py │ ├── bad_pyspark.py.fail │ ├── dual_write.py │ ├── load_previous_run_data.py │ ├── pandera_ex.py │ ├── simple_perf.py │ ├── spark_expectations_example.py │ ├── spark_expectations_example.py.fail │ ├── test_dual_write.py │ ├── test_dual_write_new.py │ ├── test_load_previous_run_data.py │ └── udf.py ├── pyproject.toml ├── requirements.txt ├── setup.cfg └── tox.ini ├── resources ├── mysql-connector-java-5.1.38.jar └── rawpanda.json ├── run_container.sh ├── run_pyspark_examples.sh ├── run_sql_examples.sh ├── scalastyle-config.xml ├── se_complex.json ├── se_simple.json ├── shell-scripts └── launch-with-mysql-jdbc ├── sql ├── gluten_only_nonpartitioned_table_join.sql ├── iceberg-schema-evolution-gotcha-possibility.sql ├── iceberg-schema-evolution-gotcha-possibility.sql.expected_to_fail ├── iceberg-schema-evolution-gotcha-workaround.sql ├── nonpartitioned_table_join.sql ├── nonpartitioned_table_join.sql.conf ├── partioned_table_join.sql ├── partioned_table_join.sql.conf └── wap.sql └── target-validator ├── ex.yaml └── runme.sh /.github/workflows/ci.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/.github/workflows/ci.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/.gitignore -------------------------------------------------------------------------------- /.jvmopts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/.jvmopts -------------------------------------------------------------------------------- /.scalafix.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/.scalafix.conf -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/Dockerfile -------------------------------------------------------------------------------- /Dockerfile-mini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/Dockerfile-mini -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/README.md -------------------------------------------------------------------------------- /accelerators/comet_env_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/comet_env_setup.sh -------------------------------------------------------------------------------- /accelerators/comet_ex.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/comet_ex.sh -------------------------------------------------------------------------------- /accelerators/gluten_config.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/gluten_config.properties -------------------------------------------------------------------------------- /accelerators/gluten_env_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/gluten_env_setup.sh -------------------------------------------------------------------------------- /accelerators/gluten_spark_34_ex.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/gluten_spark_34_ex.sh -------------------------------------------------------------------------------- /accelerators/install_rust_if_needed.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/install_rust_if_needed.sh -------------------------------------------------------------------------------- /accelerators/run_gluten.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/run_gluten.sh -------------------------------------------------------------------------------- /accelerators/setup_comet.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/setup_comet.sh -------------------------------------------------------------------------------- /accelerators/setup_gluten_deps.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/setup_gluten_deps.sh -------------------------------------------------------------------------------- /accelerators/setup_gluten_from_src.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/setup_gluten_from_src.sh -------------------------------------------------------------------------------- /accelerators/setup_gluten_spark34.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/accelerators/setup_gluten_spark34.sh -------------------------------------------------------------------------------- /appveyor.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/appveyor.yml -------------------------------------------------------------------------------- /c: -------------------------------------------------------------------------------- 1 | bloop 2 | 3 | -------------------------------------------------------------------------------- /conf/log4j.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/conf/log4j.properties -------------------------------------------------------------------------------- /conf/sbtconfig.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/conf/sbtconfig.txt -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/JavaInterop.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/JavaInterop.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/WordCount.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/WordCount.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/dataframe/JavaHappyPandas.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/dataframe/JavaHappyPandas.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/dataframe/JavaLoadSave.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/dataframe/JavaLoadSave.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/dataframe/JavaUDFs.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/dataframe/JavaUDFs.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/ffi/SumJNIJava.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/ffi/SumJNIJava.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/objects/JavaCoffeeShop.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/objects/JavaCoffeeShop.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/objects/JavaPandaInfo.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/objects/JavaPandaInfo.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/objects/JavaPandaPlace.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/objects/JavaPandaPlace.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/objects/JavaPandas.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/objects/JavaPandas.java -------------------------------------------------------------------------------- /core/src/main/java/com/highperformancespark/examples/objects/JavaRawPanda.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/java/com/highperformancespark/examples/objects/JavaRawPanda.java -------------------------------------------------------------------------------- /core/src/main/julia/setup.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/julia/setup.jl -------------------------------------------------------------------------------- /core/src/main/julia/wc.jl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/julia/wc.jl -------------------------------------------------------------------------------- /core/src/main/perl/Changes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/Changes -------------------------------------------------------------------------------- /core/src/main/perl/MANIFEST: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/MANIFEST -------------------------------------------------------------------------------- /core/src/main/perl/Makefile.PL: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/Makefile.PL -------------------------------------------------------------------------------- /core/src/main/perl/README: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/README -------------------------------------------------------------------------------- /core/src/main/perl/ghinfo.pl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/ghinfo.pl -------------------------------------------------------------------------------- /core/src/main/perl/ignore.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/ignore.txt -------------------------------------------------------------------------------- /core/src/main/perl/lib/HighPerformanceSpark/Examples.pm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/lib/HighPerformanceSpark/Examples.pm -------------------------------------------------------------------------------- /core/src/main/perl/t/00-load.t: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/t/00-load.t -------------------------------------------------------------------------------- /core/src/main/perl/t/manifest.t: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/t/manifest.t -------------------------------------------------------------------------------- /core/src/main/perl/t/pod-coverage.t: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/t/pod-coverage.t -------------------------------------------------------------------------------- /core/src/main/perl/t/pod.t: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/t/pod.t -------------------------------------------------------------------------------- /core/src/main/perl/xt/boilerplate.t: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/perl/xt/boilerplate.t -------------------------------------------------------------------------------- /core/src/main/r/dapply.R: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/r/dapply.R -------------------------------------------------------------------------------- /core/src/main/r/wc.R: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/r/wc.R -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/HappyPandas.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/HappyPandas.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/LoadSave.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/LoadSave.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/MixedDataset.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/MixedDataset.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/MixedDataset.scala_back: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/MixedDataset.scala_back -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/NullabilityFilterOptimizer.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/NullabilityFilterOptimizer.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/RawPandas.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/RawPandas.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/RegularSQL.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/RegularSQL.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/SQLExtension.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/SQLExtension.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/dataframe/UDFs.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/dataframe/UDFs.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/errors/throws.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/errors/throws.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/goldilocks/GoldilocksFirstTry.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/goldilocks/GoldilocksFirstTry.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/goldilocks/GoldilocksSecondarySort.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/goldilocks/GoldilocksSecondarySort.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/goldilocks/GoldilocksWithHashMap.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/goldilocks/GoldilocksWithHashMap.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/goldilocks/RDDJoinExamples.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/goldilocks/RDDJoinExamples.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/goldilocks/SecondarySort.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/goldilocks/SecondarySort.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/ml/CustomPipeline.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/ml/CustomPipeline.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/ml/SimpleExport.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/ml/SimpleExport.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/ml/SimpleNaiveBayes.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/ml/SimpleNaiveBayes.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/ml/SimplePipeline.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/ml/SimplePipeline.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/mllib/GoldilocksMLlib.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/mllib/GoldilocksMLlib.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/native/NativeExample.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/native/NativeExample.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/native/PipeExample.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/native/PipeExample.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/native/StandAlone.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/native/StandAlone.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/native/SumFJNA.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/native/SumFJNA.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/native/SumJNA.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/native/SumJNA.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/native/SumJNI.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/native/SumJNI.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/perf/SimplePerfTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/perf/SimplePerfTest.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/streaming/DStream.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/streaming/DStream.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/streaming/Structured.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/streaming/Structured.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/tokenize/SampleTokenize.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/tokenize/SampleTokenize.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/tools/FilterInvalidPandas.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/tools/FilterInvalidPandas.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/tools/GenerateScalingData.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/tools/GenerateScalingData.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/tools/ResourceProfileEx.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/tools/ResourceProfileEx.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/tools/SampleData.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/tools/SampleData.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/transformations/Accumulators.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/transformations/Accumulators.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/transformations/NarrowAndWide.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/transformations/NarrowAndWide.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/transformations/NewAccumulators.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/transformations/NewAccumulators.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/transformations/SmartAggregations.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/transformations/SmartAggregations.scala -------------------------------------------------------------------------------- /core/src/main/scala/com/high-performance-spark-examples/wordcount/WordCount.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/main/scala/com/high-performance-spark-examples/wordcount/WordCount.scala -------------------------------------------------------------------------------- /core/src/test/java/com/highperformancespark/examples/JavaInteropTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/java/com/highperformancespark/examples/JavaInteropTest.java -------------------------------------------------------------------------------- /core/src/test/java/com/highperformancespark/examples/dataframe/JavaHappyPandasTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/java/com/highperformancespark/examples/dataframe/JavaHappyPandasTest.java -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/dataframe/HappyPandasTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/dataframe/HappyPandasTest.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/dataframe/MixedDatasetSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/dataframe/MixedDatasetSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/dataframe/PandaPlaceFilterPushdown.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/dataframe/PandaPlaceFilterPushdown.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/dataframe/SQLExtensionTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/dataframe/SQLExtensionTest.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/errors/ThrowsSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/errors/ThrowsSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/goldilocks/EvaluationTests.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/goldilocks/EvaluationTests.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/goldilocks/GoldilocksLargeTests.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/goldilocks/GoldilocksLargeTests.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/goldilocks/JoinTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/goldilocks/JoinTest.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/goldilocks/QuantileOnlyArtisanalTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/goldilocks/QuantileOnlyArtisanalTest.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/goldilocks/SortingTests.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/goldilocks/SortingTests.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/ml/CustomPipeline.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/ml/CustomPipeline.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/ml/SimpleNaiveBayes.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/ml/SimpleNaiveBayes.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/mllib/GoldilocksMLlibSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/mllib/GoldilocksMLlibSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/native/NativeExample.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/native/NativeExample.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/native/PipeExampleSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/native/PipeExampleSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/streaming/DStreamSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/streaming/DStreamSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/tokenize/SampleTokenizeSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/tokenize/SampleTokenizeSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/tools/FilterInvalidPandasSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/tools/FilterInvalidPandasSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/tools/GenerateScalingDataSuite.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/tools/GenerateScalingDataSuite.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/transformations/Accumulators.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/transformations/Accumulators.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/high-performance-spark-examples/wordcount/WordCountTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/high-performance-spark-examples/wordcount/WordCountTest.scala -------------------------------------------------------------------------------- /core/src/test/scala/com/highperformancespark/examples/JavaInteropHelper.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/core/src/test/scala/com/highperformancespark/examples/JavaInteropHelper.scala -------------------------------------------------------------------------------- /data/project.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/data/project.csv -------------------------------------------------------------------------------- /env_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/env_setup.sh -------------------------------------------------------------------------------- /high_performance_pyspark/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/high_performance_pyspark/__init__.py -------------------------------------------------------------------------------- /iceberg-workshop-solutions/Workshop-Template.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/iceberg-workshop-solutions/Workshop-Template.ipynb -------------------------------------------------------------------------------- /iceberg-workshop-solutions/Workshop.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/iceberg-workshop-solutions/Workshop.ipynb -------------------------------------------------------------------------------- /migration/sql.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/migration/sql.sh -------------------------------------------------------------------------------- /misc/container_launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/misc/container_launch.sh -------------------------------------------------------------------------------- /misc/kernel.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/misc/kernel.json -------------------------------------------------------------------------------- /native/src/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/CMakeLists.txt -------------------------------------------------------------------------------- /native/src/c/gluten/GlutenUDF.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/c/gluten/GlutenUDF.cpp -------------------------------------------------------------------------------- /native/src/c/include/com_highperformancespark_examples_ffi_SumJNI.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/c/include/com_highperformancespark_examples_ffi_SumJNI.h -------------------------------------------------------------------------------- /native/src/c/sum.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/c/sum.c -------------------------------------------------------------------------------- /native/src/c/sum.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/c/sum.h -------------------------------------------------------------------------------- /native/src/c/sum_wrapper.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/c/sum_wrapper.c -------------------------------------------------------------------------------- /native/src/c/sumf_wrapper.c: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/c/sumf_wrapper.c -------------------------------------------------------------------------------- /native/src/fortran/sumf.f95: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/native/src/fortran/sumf.f95 -------------------------------------------------------------------------------- /project/build.properties: -------------------------------------------------------------------------------- 1 | sbt.version=1.9.9 2 | -------------------------------------------------------------------------------- /project/plugins.sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/project/plugins.sbt -------------------------------------------------------------------------------- /python/.flake8: -------------------------------------------------------------------------------- 1 | [flake8] 2 | max-line-length = 120 -------------------------------------------------------------------------------- /python/README.md: -------------------------------------------------------------------------------- 1 | Python examples for High Performance Spark 2 | -------------------------------------------------------------------------------- /python/examples/SQLLineage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/SQLLineage.py -------------------------------------------------------------------------------- /python/examples/__init__.py: -------------------------------------------------------------------------------- 1 | __version__ = 0.2 2 | -------------------------------------------------------------------------------- /python/examples/bad_pyspark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/bad_pyspark.py -------------------------------------------------------------------------------- /python/examples/bad_pyspark.py.fail: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /python/examples/dual_write.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/dual_write.py -------------------------------------------------------------------------------- /python/examples/load_previous_run_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/load_previous_run_data.py -------------------------------------------------------------------------------- /python/examples/pandera_ex.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/pandera_ex.py -------------------------------------------------------------------------------- /python/examples/simple_perf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/simple_perf.py -------------------------------------------------------------------------------- /python/examples/spark_expectations_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/spark_expectations_example.py -------------------------------------------------------------------------------- /python/examples/spark_expectations_example.py.fail: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /python/examples/test_dual_write.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/test_dual_write.py -------------------------------------------------------------------------------- /python/examples/test_dual_write_new.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/test_dual_write_new.py -------------------------------------------------------------------------------- /python/examples/test_load_previous_run_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/test_load_previous_run_data.py -------------------------------------------------------------------------------- /python/examples/udf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/examples/udf.py -------------------------------------------------------------------------------- /python/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/pyproject.toml -------------------------------------------------------------------------------- /python/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/requirements.txt -------------------------------------------------------------------------------- /python/setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/setup.cfg -------------------------------------------------------------------------------- /python/tox.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/python/tox.ini -------------------------------------------------------------------------------- /resources/mysql-connector-java-5.1.38.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/resources/mysql-connector-java-5.1.38.jar -------------------------------------------------------------------------------- /resources/rawpanda.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/resources/rawpanda.json -------------------------------------------------------------------------------- /run_container.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/run_container.sh -------------------------------------------------------------------------------- /run_pyspark_examples.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/run_pyspark_examples.sh -------------------------------------------------------------------------------- /run_sql_examples.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/run_sql_examples.sh -------------------------------------------------------------------------------- /scalastyle-config.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/scalastyle-config.xml -------------------------------------------------------------------------------- /se_complex.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/se_complex.json -------------------------------------------------------------------------------- /se_simple.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/se_simple.json -------------------------------------------------------------------------------- /shell-scripts/launch-with-mysql-jdbc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/shell-scripts/launch-with-mysql-jdbc -------------------------------------------------------------------------------- /sql/gluten_only_nonpartitioned_table_join.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/gluten_only_nonpartitioned_table_join.sql -------------------------------------------------------------------------------- /sql/iceberg-schema-evolution-gotcha-possibility.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/iceberg-schema-evolution-gotcha-possibility.sql -------------------------------------------------------------------------------- /sql/iceberg-schema-evolution-gotcha-possibility.sql.expected_to_fail: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /sql/iceberg-schema-evolution-gotcha-workaround.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/iceberg-schema-evolution-gotcha-workaround.sql -------------------------------------------------------------------------------- /sql/nonpartitioned_table_join.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/nonpartitioned_table_join.sql -------------------------------------------------------------------------------- /sql/nonpartitioned_table_join.sql.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/nonpartitioned_table_join.sql.conf -------------------------------------------------------------------------------- /sql/partioned_table_join.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/partioned_table_join.sql -------------------------------------------------------------------------------- /sql/partioned_table_join.sql.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/partioned_table_join.sql.conf -------------------------------------------------------------------------------- /sql/wap.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/sql/wap.sql -------------------------------------------------------------------------------- /target-validator/ex.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/target-validator/ex.yaml -------------------------------------------------------------------------------- /target-validator/runme.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/high-performance-spark/high-performance-spark-examples/HEAD/target-validator/runme.sh --------------------------------------------------------------------------------