├── .github └── workflows │ ├── ci.yml │ └── docs.yml ├── .gitignore ├── LICENSE ├── README.md ├── contributing ├── DEVELOPMENT.md └── RELEASE.md ├── docs ├── api-reference.md ├── building-data-sources.md ├── data-sources-guide.md ├── datasources │ ├── arrow.md │ ├── fake.md │ ├── github.md │ ├── googlesheets.md │ ├── huggingface.md │ ├── jsonplaceholder.md │ ├── kaggle.md │ ├── lance.md │ ├── opensky.md │ ├── robinhood.md │ ├── salesforce.md │ ├── simplejson.md │ ├── stock.md │ └── weather.md ├── index.md └── simple-stream-reader-architecture.md ├── examples └── salesforce_example.py ├── mkdocs.yml ├── pyproject.toml ├── pyspark_datasources ├── __init__.py ├── arrow.py ├── fake.py ├── github.py ├── googlesheets.py ├── huggingface.py ├── jsonplaceholder.py ├── kaggle.py ├── lance.py ├── opensky.py ├── robinhood.py ├── salesforce.py ├── simplejson.py ├── stock.py └── weather.py ├── tests ├── __init__.py ├── test_data_sources.py ├── test_google_sheets.py └── test_robinhood.py └── uv.lock /.github/workflows/ci.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/.github/workflows/ci.yml -------------------------------------------------------------------------------- /.github/workflows/docs.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/.github/workflows/docs.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/README.md -------------------------------------------------------------------------------- /contributing/DEVELOPMENT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/contributing/DEVELOPMENT.md -------------------------------------------------------------------------------- /contributing/RELEASE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/contributing/RELEASE.md -------------------------------------------------------------------------------- /docs/api-reference.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/api-reference.md -------------------------------------------------------------------------------- /docs/building-data-sources.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/building-data-sources.md -------------------------------------------------------------------------------- /docs/data-sources-guide.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/data-sources-guide.md -------------------------------------------------------------------------------- /docs/datasources/arrow.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/arrow.md -------------------------------------------------------------------------------- /docs/datasources/fake.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/fake.md -------------------------------------------------------------------------------- /docs/datasources/github.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/github.md -------------------------------------------------------------------------------- /docs/datasources/googlesheets.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/googlesheets.md -------------------------------------------------------------------------------- /docs/datasources/huggingface.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/huggingface.md -------------------------------------------------------------------------------- /docs/datasources/jsonplaceholder.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/jsonplaceholder.md -------------------------------------------------------------------------------- /docs/datasources/kaggle.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/kaggle.md -------------------------------------------------------------------------------- /docs/datasources/lance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/lance.md -------------------------------------------------------------------------------- /docs/datasources/opensky.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/opensky.md -------------------------------------------------------------------------------- /docs/datasources/robinhood.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/robinhood.md -------------------------------------------------------------------------------- /docs/datasources/salesforce.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/salesforce.md -------------------------------------------------------------------------------- /docs/datasources/simplejson.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/simplejson.md -------------------------------------------------------------------------------- /docs/datasources/stock.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/stock.md -------------------------------------------------------------------------------- /docs/datasources/weather.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/datasources/weather.md -------------------------------------------------------------------------------- /docs/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/index.md -------------------------------------------------------------------------------- /docs/simple-stream-reader-architecture.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/docs/simple-stream-reader-architecture.md -------------------------------------------------------------------------------- /examples/salesforce_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/examples/salesforce_example.py -------------------------------------------------------------------------------- /mkdocs.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/mkdocs.yml -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyproject.toml -------------------------------------------------------------------------------- /pyspark_datasources/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/__init__.py -------------------------------------------------------------------------------- /pyspark_datasources/arrow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/arrow.py -------------------------------------------------------------------------------- /pyspark_datasources/fake.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/fake.py -------------------------------------------------------------------------------- /pyspark_datasources/github.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/github.py -------------------------------------------------------------------------------- /pyspark_datasources/googlesheets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/googlesheets.py -------------------------------------------------------------------------------- /pyspark_datasources/huggingface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/huggingface.py -------------------------------------------------------------------------------- /pyspark_datasources/jsonplaceholder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/jsonplaceholder.py -------------------------------------------------------------------------------- /pyspark_datasources/kaggle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/kaggle.py -------------------------------------------------------------------------------- /pyspark_datasources/lance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/lance.py -------------------------------------------------------------------------------- /pyspark_datasources/opensky.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/opensky.py -------------------------------------------------------------------------------- /pyspark_datasources/robinhood.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/robinhood.py -------------------------------------------------------------------------------- /pyspark_datasources/salesforce.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/salesforce.py -------------------------------------------------------------------------------- /pyspark_datasources/simplejson.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/simplejson.py -------------------------------------------------------------------------------- /pyspark_datasources/stock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/stock.py -------------------------------------------------------------------------------- /pyspark_datasources/weather.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/pyspark_datasources/weather.py -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/test_data_sources.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/tests/test_data_sources.py -------------------------------------------------------------------------------- /tests/test_google_sheets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/tests/test_google_sheets.py -------------------------------------------------------------------------------- /tests/test_robinhood.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/tests/test_robinhood.py -------------------------------------------------------------------------------- /uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/allisonwang-db/pyspark-data-sources/HEAD/uv.lock --------------------------------------------------------------------------------