├── .dockerignore ├── .env ├── .gitattributes ├── .github ├── ISSUE_TEMPLATE │ ├── bug_report.md │ └── feature_request.md ├── actions │ └── greplint │ │ └── action.yml └── workflows │ ├── codeql.yml │ ├── dependency-review.yml │ ├── doclint.yml │ ├── draft_release.yml │ ├── linting.yml │ ├── pypi_release.yml │ ├── remote-integ-tests.yml │ └── testing.yml ├── .gitignore ├── .gitmodules ├── .pre-commit-config.yaml ├── .readthedocs.yaml ├── CONTRIBUTING.md ├── LICENSE ├── Makefile ├── README.md ├── apps ├── Makefile ├── docker-base │ ├── Dockerfile.buildx │ ├── Makefile.docker-base │ ├── gen-pyproject-copy.sh │ └── poetry-install.sh ├── git │ └── git-credential-from-env.py ├── integration │ ├── README.md │ ├── integration │ │ ├── __init__.py │ │ ├── automation │ │ │ ├── __init__.py │ │ │ └── runtests.sh │ │ ├── conftest.py │ │ ├── containers │ │ │ ├── __init__.py │ │ │ ├── running.py │ │ │ └── stack.py │ │ ├── ingests │ │ │ ├── __init__.py │ │ │ ├── crawler.py │ │ │ ├── index.py │ │ │ ├── index_info.py │ │ │ └── jupyter.py │ │ ├── queries │ │ │ ├── __init__.py │ │ │ ├── opensearch.py │ │ │ ├── options.py │ │ │ └── queries.py │ │ └── tests │ │ │ ├── __init__.py │ │ │ └── test_basic.py │ ├── poetry.lock │ └── pyproject.toml ├── jupyter │ ├── Dockerfile.buildx │ ├── Makefile.jupyter │ ├── README.md │ ├── bind_dir │ │ ├── BIND_MOUNT_BETWEEN_DOCKER_AND_HOST │ │ └── setup.sh │ ├── entrypoint.py │ ├── poetry.lock │ ├── profile │ ├── pyproject.toml │ ├── run-jupyter.sh │ └── sudoers ├── opensearch │ ├── 2.11 │ │ ├── Dockerfile │ │ ├── README.md │ │ ├── opensearch.yml │ │ └── sycamore-opensearch.sh │ ├── Dockerfile │ ├── README.md │ ├── authority.pem │ ├── config.yml │ ├── opensearch.yml │ ├── roles_mapping.yml │ ├── setup_models.py │ └── sycamore-opensearch.sh ├── remote-processor-service │ ├── Dockerfile.build │ ├── Dockerfile.buildx │ ├── Makefile │ ├── README.md │ ├── config │ │ └── pipelines.yml │ ├── poetry.lock │ ├── pyproject.toml │ └── remote_processor_service │ │ ├── cli.py │ │ └── rps_docker_entrypoint.sh └── timetrace │ ├── Makefile │ ├── README.md │ ├── ttanal │ ├── ttcat │ └── ttviz.cpp ├── autogen-groups.py ├── compose.yaml ├── docs ├── Makefile ├── make.bat └── source │ ├── conf.py │ ├── images │ ├── ArynArchitecture_APS+Sycamorev2.png │ ├── SycamoreDataflowDiagramv2.png │ ├── SycamoreDiagram2.png │ ├── favicon.ico │ ├── query_execution.svg │ └── sycamore_logo.svg │ ├── index.rst │ └── sycamore │ ├── APIs.rst │ ├── APIs │ ├── context.rst │ ├── docset.rst │ ├── docsetreader.rst │ ├── docsetwriter.rst │ ├── document.rst │ ├── functions.rst │ ├── gen │ ├── llm.rst │ ├── low_level_transforms.rst │ ├── low_level_transforms │ │ ├── assign_doc_properties.rst │ │ ├── augment_text.rst │ │ ├── basics.rst │ │ ├── bbox_merge.rst │ │ ├── detr_partitioner.rst │ │ ├── embed.rst │ │ ├── explode.rst │ │ ├── extract_entity.rst │ │ ├── extract_schema.rst │ │ ├── extract_table.rst │ │ ├── extract_table_properties.rst │ │ ├── llm_map.rst │ │ ├── llm_query.rst │ │ ├── map.rst │ │ ├── mark_misc.rst │ │ ├── merge_elements.rst │ │ ├── partition.rst │ │ ├── query.rst │ │ ├── random_sample.rst │ │ ├── regex_replace.rst │ │ ├── sketcher.rst │ │ ├── split_elements.rst │ │ ├── spread_properties.rst │ │ ├── standardizer.rst │ │ ├── summarize.rst │ │ └── summarize_images.rst │ ├── node.rst │ ├── prompts.rst │ └── query.rst │ ├── connectors.rst │ ├── connectors │ ├── duckdb.md │ ├── elasticsearch.md │ ├── neo4j.md │ ├── opensearch.md │ ├── pinecone.md │ ├── qdrant.md │ └── weaviate.md │ ├── get_started.rst │ ├── get_started │ ├── ai_configuration.md │ ├── concepts.md │ └── hardware.md │ ├── query.rst │ ├── querying_data │ └── using_aryn_opensearch_stack │ │ ├── APIs │ │ ├── conversation_memory.rst │ │ ├── conversation_memory │ │ │ └── functions.md │ │ └── gen │ │ ├── architecture.md │ │ ├── conversation_memory │ │ ├── imgs │ │ │ ├── ConversationMemoryMultiAgent.jpg │ │ │ ├── ConversationMemoryMultiAgent.png │ │ │ └── resource-diagram.png │ │ ├── overview.md │ │ ├── storage_for_genai_agents.md │ │ └── using_with_conversational_search.md │ │ ├── dedup.md │ │ ├── demo_query_ui.md │ │ ├── encryption.md │ │ ├── hybrid_search.md │ │ ├── imgs │ │ ├── pipeline-architecture.png │ │ └── xlarge_DemoUI_FollowUpQuestion.png │ │ ├── integrate_your_application.md │ │ ├── launching_with_Docker.md │ │ ├── load_data.md │ │ ├── remote_processors.md │ │ ├── reranking.md │ │ ├── running_a_data_preparation_job.md │ │ ├── using_jupyter_container.md │ │ └── using_rag_pipelines.md │ ├── transforms.rst │ ├── transforms │ ├── embed.md │ ├── explode.md │ ├── extract_entity.md │ ├── extract_schema.md │ ├── filter.md │ ├── flatmap.md │ ├── llm_query.md │ ├── map.md │ ├── map_batch.md │ ├── materialize.md │ ├── merge.md │ ├── partition.md │ ├── sketch.md │ └── summarize.md │ ├── tutorials.rst │ ├── tutorials │ ├── conversational_memory_with_langchain.md │ ├── etl_for_opensearch.md │ ├── etl_for_weaviate_tutorial.md │ ├── etl_pinecone_tutorial.md │ └── sycamore_jupyter_dev_example.md │ └── using_jupyter.md ├── examples ├── bench.py ├── bigquery-docparse │ ├── README.md │ ├── config.py │ ├── deploy-cf.sh │ ├── download-finals.py │ ├── get_status │ │ ├── main.py │ │ └── requirements.txt │ ├── info.sh │ ├── populate_uris.py │ ├── queue_async.py │ ├── sleep_until.py │ ├── stored_procedures.sql │ └── sync_code_with_bigquery.py ├── html_ingest.py ├── markdown.py ├── ndd_debug.py ├── query │ ├── ntsb_loader.py │ ├── ntsb_loader_materialized.py │ └── simple_ntsb.py ├── s3_ingest.py ├── simple_config.py ├── simple_duckdb.py ├── simple_ingest.py ├── simple_neo4j.py ├── simple_pinecone.py ├── simple_qdrant.py └── simple_weaviate.py ├── lib ├── import_timer │ ├── README.md │ ├── import_timer.py │ └── pyproject.toml ├── poetry-lock │ ├── README.md │ ├── poetry-lock-all.sh │ ├── poetry.lock │ ├── pyproject.toml │ └── sycamore_poetry_lock │ │ └── noop.py ├── remote-processors │ ├── Makefile │ ├── README.md │ ├── img │ │ └── RPS_Architecture.svg │ ├── poetry.lock │ ├── pyproject.toml │ └── remote_processors │ │ ├── __init__.py │ │ ├── processors │ │ ├── __init__.py │ │ ├── debug_processor.py │ │ ├── dedup_processor.py │ │ └── processor.py │ │ ├── search_request.py │ │ ├── search_response.py │ │ ├── server │ │ ├── __init__.py │ │ ├── pipeline.py │ │ ├── processor_registry.py │ │ └── remote_processor_service.py │ │ └── test │ │ ├── __init__.py │ │ ├── integration │ │ ├── conftest.py │ │ └── test_integ_debug.py │ │ ├── resources │ │ ├── configs │ │ │ ├── malformed │ │ │ │ ├── dupe_pipeline_names.yml │ │ │ │ ├── not_a_list.yml │ │ │ │ ├── pipeline_not_a_map.yml │ │ │ │ └── pipeline_with_many_keys.yml │ │ │ └── valid.yml │ │ └── sb_processed.jsonl │ │ ├── unit │ │ ├── __init__.py │ │ ├── processors │ │ │ ├── __init__.py │ │ │ ├── test_debug.py │ │ │ ├── test_dedup.py │ │ │ └── test_library.py │ │ ├── service │ │ │ ├── __init__.py │ │ │ ├── test_pipeline.py │ │ │ ├── test_processor_registry.py │ │ │ └── test_remote_processor_service.py │ │ └── test_base.py │ │ └── utils.py └── sycamore │ ├── README.md │ ├── poetry.lock │ ├── pyproject.toml │ └── sycamore │ ├── README.md │ ├── __init__.py │ ├── connectors │ ├── aryn │ │ ├── ArynReader.py │ │ ├── ArynWriter.py │ │ └── client.py │ ├── base_reader.py │ ├── base_writer.py │ ├── common.py │ ├── doc_reconstruct.py │ ├── duckdb │ │ ├── __init__.py │ │ ├── duckdb_reader.py │ │ └── duckdb_writer.py │ ├── elasticsearch │ │ ├── __init__.py │ │ ├── elasticsearch_reader.py │ │ └── elasticsearch_writer.py │ ├── file │ │ ├── __init__.py │ │ ├── file_scan.py │ │ ├── file_writer.py │ │ ├── file_writer_ray.py │ │ └── materialized_scan.py │ ├── iceberg │ │ └── iceberg_writer.py │ ├── neo4j │ │ ├── __init__.py │ │ └── neo4j_writer.py │ ├── opensearch │ │ ├── __init__.py │ │ ├── opensearch_reader.py │ │ ├── opensearch_writer.py │ │ ├── sync.py │ │ └── utils.py │ ├── pinecone │ │ ├── __init__.py │ │ ├── pinecone_reader.py │ │ └── pinecone_writer.py │ ├── qdrant │ │ ├── __init__.py │ │ ├── qdrant_reader.py │ │ └── qdrant_writer.py │ └── weaviate │ │ ├── __init__.py │ │ ├── weaviate_reader.py │ │ └── weaviate_writer.py │ ├── context.py │ ├── data │ ├── __init__.py │ ├── bbox.py │ ├── docid.py │ ├── document.py │ ├── element.py │ ├── metadata.py │ └── table.py │ ├── decorators.py │ ├── docset.py │ ├── evaluation │ ├── __init__.py │ ├── data.py │ ├── datasets.py │ ├── evaluate.py │ ├── metrics │ │ ├── __init__.py │ │ ├── generated_answer.py │ │ └── retrieval.py │ ├── ocr │ │ ├── __main__.py │ │ ├── data.py │ │ ├── llm_ocr.py │ │ ├── metrics.py │ │ └── models.py │ ├── pipeline.py │ └── subtasks.py │ ├── executor.py │ ├── functions │ ├── __init__.py │ ├── basic_filters.py │ ├── chunker.py │ ├── document.py │ ├── elements.py │ ├── rabin_karp.py │ ├── simhash.py │ └── tokenizer.py │ ├── grouped_data.py │ ├── llms │ ├── __init__.py │ ├── anthropic.py │ ├── bedrock.py │ ├── chained_llm.py │ ├── config.py │ ├── gemini.py │ ├── llms.py │ ├── openai.py │ └── prompts │ │ ├── __init__.py │ │ ├── default_prompts.py │ │ ├── jinja_fragments.py │ │ └── prompts.py │ ├── materialize.py │ ├── materialize_config.py │ ├── plan_nodes.py │ ├── query │ ├── README.md │ ├── __init__.py │ ├── client.py │ ├── execution │ │ ├── __init__.py │ │ ├── aggregation.py │ │ ├── metrics.py │ │ ├── operations.py │ │ ├── physical_operator.py │ │ ├── sycamore_executor.py │ │ └── sycamore_operator.py │ ├── logical_plan.py │ ├── operators │ │ ├── basic_filter.py │ │ ├── clustering.py │ │ ├── count.py │ │ ├── field_in.py │ │ ├── groupby.py │ │ ├── limit.py │ │ ├── llm_extract_entity.py │ │ ├── llm_filter.py │ │ ├── math.py │ │ ├── query_database.py │ │ ├── sort.py │ │ ├── summarize_data.py │ │ ├── top_k.py │ │ └── unroll.py │ ├── planner.py │ ├── planner_prompt.py │ ├── result.py │ ├── schema.py │ └── strategy.py │ ├── reader.py │ ├── rules │ ├── __init__.py │ └── optimize_resource_args.py │ ├── schema.py │ ├── tests │ ├── README.md │ ├── __init__.py │ ├── config.py │ ├── conftest.py │ ├── integration │ │ ├── __init__.py │ │ ├── connectors │ │ │ ├── aryn │ │ │ │ ├── test_aryn_reader.py │ │ │ │ ├── test_aryn_writer.py │ │ │ │ └── test_client.py │ │ │ ├── common.py │ │ │ ├── duckdb │ │ │ │ ├── test_duckdb_read.py │ │ │ │ └── test_pdf_to_duckdb.py │ │ │ ├── elasticsearch │ │ │ │ ├── test_elasticsearch_read.py │ │ │ │ └── test_pdf_to_elasticsearch.py │ │ │ ├── file │ │ │ │ ├── test_file_writer.py │ │ │ │ └── test_file_writer_to_s3.py │ │ │ ├── neo4j │ │ │ │ ├── test_docset_to_neo4j.py │ │ │ │ └── test_neo4j_writer_methods.py │ │ │ ├── opensearch │ │ │ │ ├── test_html_to_opensearch.py │ │ │ │ ├── test_opensearch_read.py │ │ │ │ └── test_pdf_to_opensearch.py │ │ │ ├── pinecone │ │ │ │ ├── test_pdf_to_pinecone.py │ │ │ │ └── test_pinecone_read.py │ │ │ ├── qdrant │ │ │ │ └── test_qdrant.py │ │ │ └── weaviate │ │ │ │ ├── test_pdf_to_weaviate.py │ │ │ │ └── test_weaviate_read.py │ │ ├── evaluation │ │ │ ├── test_datasets.py │ │ │ ├── test_evaluate.py │ │ │ └── test_pipeline.py │ │ ├── functions │ │ │ ├── __init__.py │ │ │ └── test_document.py │ │ ├── llms │ │ │ ├── test_anthropic.py │ │ │ ├── test_bedrock.py │ │ │ ├── test_chained_llm.py │ │ │ ├── test_gemini.py │ │ │ └── test_openai.py │ │ ├── query │ │ │ ├── __init__.py │ │ │ ├── conftest.py │ │ │ ├── execution │ │ │ │ ├── test_operations.py │ │ │ │ └── test_sycamore_query.py │ │ │ ├── test_planner.py │ │ │ └── test_query_opensearch.py │ │ ├── test_docset.py │ │ ├── test_executor.py │ │ ├── test_image_utils.py │ │ ├── test_materialize.py │ │ ├── textractor │ │ │ └── test_textractor.py │ │ ├── transforms │ │ │ ├── __init__.py │ │ │ ├── property_extraction │ │ │ │ ├── __init__.py │ │ │ │ └── test_schema_extract.py │ │ │ ├── test_aggregation.py │ │ │ ├── test_base.py │ │ │ ├── test_data_extraction.py │ │ │ ├── test_embed.py │ │ │ ├── test_llm_filter.py │ │ │ ├── test_map.py │ │ │ ├── test_ocr_models.py │ │ │ ├── test_partition.py │ │ │ ├── test_random_sample.py │ │ │ ├── test_rerank.py │ │ │ ├── test_sort.py │ │ │ ├── test_summarize_images.py │ │ │ ├── test_table_extraction.py │ │ │ └── test_union.py │ │ └── utils │ │ │ └── test_pdf.py │ ├── manual │ │ ├── pdf2image_memusage.py │ │ ├── test_fast_sycamore_import.py │ │ └── test_opensearch_sync.py │ ├── pytest.ini │ ├── resources │ │ ├── data │ │ │ ├── docx │ │ │ │ └── aryn_website_sample.docx │ │ │ ├── htmls │ │ │ │ └── wikipedia_binary_search.html │ │ │ ├── imgs │ │ │ │ ├── sample-detr-image.png │ │ │ │ └── vert_table.png │ │ │ ├── json │ │ │ │ ├── example.json │ │ │ │ ├── model_server_output_transformer.json │ │ │ │ └── model_server_output_transformer_extract_tables.json │ │ │ ├── materialize │ │ │ │ ├── json_writer │ │ │ │ │ ├── 3fe9913e-60e2-11ef-90e5-e40d36f1e1ae.pickle │ │ │ │ │ ├── materialize.success │ │ │ │ │ └── md-9e6e68ee-ad8e-4e39-a2e1-7ef5befc588c.pickle │ │ │ │ └── llmfilter-ntsb-temp │ │ │ │ │ ├── doc-f-rhcfgmzrgifspjxjnl8vhh8.4fd48370db59b408b2700abd89bfe92e43009fde4ec216cfd112cdf17b7dfb35.pickle │ │ │ │ │ ├── materialize.clean │ │ │ │ │ ├── materialize.success │ │ │ │ │ ├── md-d-07bgl12pc0intnh2y74po4c.a98b82d885005500fb664fb18283cf80864de0fb6116e5acd9c3060dd91086a7.pickle │ │ │ │ │ ├── md-d-6wi2aqr0b504zojkdqnyybf.97ae3a37a86700c4601f89551892eb79faeaa0c9afe66f26ee20d8b7f996f929.pickle │ │ │ │ │ ├── md-d-75qp993ysz87aa1c1tsc5o0.0db762bad4ffb81bdde0f754087a65594f0cc8001986729f6ded86fa7ca7803e.pickle │ │ │ │ │ ├── md-d-89ww3vta189zsw6ac4vsjem.253ac204a7d81cc730b4a90202afaf3f78dbf27c87a17bcb94a23212b159cce6.pickle │ │ │ │ │ ├── md-d-a8pg30d1wqbff3zsf6c4l0w.c75fd5cba213cc7888ffe30f52d9fb7b637acd227a728b07ee7e1c50545c884e.pickle │ │ │ │ │ ├── md-d-ax65fkm5dy3cmkxtcfu6dv6.219182e0864996b3bb9855bd027940ff5989729f1e3ae80db8b2574f64eceb89.pickle │ │ │ │ │ ├── md-d-bx7u8xo31r49lnxi7r3thdr.7d4ab219ffa3c8c219fdcef0f384cac80e8e692a5669da4712f9076489aade58.pickle │ │ │ │ │ ├── md-d-g9dk50t6tir9sxomqvxpwhh.6f10891f3f44b8376061256d2a3d56b91945e3082abec53a5e8f1d3394492a37.pickle │ │ │ │ │ ├── md-d-k85dhbsu6n4rtp1vd62vkik.ef6d0f2992ef663296ab39f158b0a648f8bb9f4b679cfffc7df262ce49ef61e8.pickle │ │ │ │ │ ├── md-d-kl9t1to3b6t73hhclt9ke6q.26bb7d98dbcd581fa0873ea58b4cca247691b0aff527886dd69c56c407e4de6e.pickle │ │ │ │ │ ├── md-d-m3vkixw9pdmcbrfs3g6hhhf.2cb8ce11ce5feed99eacd754f8279868824d3266a59feaf92325a33a305bedc0.pickle │ │ │ │ │ ├── md-d-ml5ks4t608vrlz00gjk4fum.8d4b49675fa3c7236c71c93dc2fafd1eb95690c74a18d1594f588e953366887a.pickle │ │ │ │ │ ├── md-d-n3oawwwjt1hxatavnpjlbjb.7b9fa911fb9108ed58b8f80ce54106f0c4e98c87299a4df6519e0e9ebf142b07.pickle │ │ │ │ │ ├── md-d-poffmrto89o7t642owz0uqd.d864e9972c347cbc8900c223ff27a67815bf4cff87e812130969e73ae840ced1.pickle │ │ │ │ │ ├── md-d-qasv594a8qoyh0pwlmhljih.f3dc469668aade55c348445e4cbdfe9cec1c205e24506ee4cfc1124bad05dabb.pickle │ │ │ │ │ ├── md-d-rve5tvzjsb8qh6hcwdiq6qm.1022022f6d1712c26c86b3d4bc9152aeebc39806b9ea36285b5f3135cc53d672.pickle │ │ │ │ │ ├── md-d-swwvf71e2zvm5due6ongmjx.db0edaa58fcb926c43f191eca5b35e24721662924f3a3f28e544c49ed06c0fc4.pickle │ │ │ │ │ ├── md-d-u2q5b6b3k1liz40fdy8ibi9.a1761cb4fab284b222950d77e6deda85b44a607bcc588b9f38bff80d97b2a6dc.pickle │ │ │ │ │ ├── md-d-utp720v7v9ufcvce5tro2su.921a82b7ea58fbda1f36ce3aa828ef96efb10836a04560a6e4739b3182db4820.pickle │ │ │ │ │ ├── md-d-xjnfbj6qqys50k9pi988awd.fb4d50848f84e0f145c1d091aee688dbae19b8ef420ac7b4158042785fe24578.pickle │ │ │ │ │ └── md-d-zd8xb8wbpv6nit9wmujsjpi.d24c185d792566b7731a2d8aad7dc5cca24c4a1ac9fcd814f96fa9d7d0087a53.pickle │ │ │ ├── nested_json │ │ │ │ └── example.json │ │ │ ├── ocr_pdfs │ │ │ │ └── test_simple_ocr.pdf │ │ │ ├── pdfs │ │ │ │ ├── Ray.pdf │ │ │ │ ├── Ray_page1.pdf │ │ │ │ ├── Ray_page11.pdf │ │ │ │ ├── Transformer.pdf │ │ │ │ ├── basic_table.pdf │ │ │ │ ├── doctor_testimonial.pdf │ │ │ │ ├── ntsb-report.pdf │ │ │ │ ├── ntsb0.pdf │ │ │ │ ├── ntsb1.pdf │ │ │ │ ├── ntsb3.pdf │ │ │ │ └── visit_aryn.pdf │ │ │ ├── pptx │ │ │ │ └── design.pptx │ │ │ └── texts │ │ │ │ └── Ray.txt │ │ └── objects │ │ │ └── weaviate │ │ │ └── collection_params_b.pickle │ ├── unit │ │ ├── __init__.py │ │ ├── connectors │ │ │ ├── aryn │ │ │ │ └── test_aryn_reader.py │ │ │ ├── common │ │ │ │ ├── __init__.py │ │ │ │ ├── test_base_reader.py │ │ │ │ ├── test_base_writer.py │ │ │ │ └── test_common.py │ │ │ ├── duckdb │ │ │ │ ├── test_duckdb_reader.py │ │ │ │ └── test_duckdb_writer.py │ │ │ ├── elasticsearch │ │ │ │ ├── test_elasticsearch_reader.py │ │ │ │ └── test_elasticsearch_writer.py │ │ │ ├── file │ │ │ │ └── test_file_writer.py │ │ │ ├── iceberg │ │ │ │ └── test_iceberg_writer.py │ │ │ ├── opensearch │ │ │ │ ├── test_opensearch.py │ │ │ │ └── test_sync.py │ │ │ ├── pinecone │ │ │ │ ├── test_pinecone_reader.py │ │ │ │ └── test_pinecone_writer.py │ │ │ ├── qdrant │ │ │ │ └── test_qdrant_reader.py │ │ │ └── weaviate │ │ │ │ ├── test_weaviate_reader.py │ │ │ │ └── test_weaviate_writer.py │ │ ├── data │ │ │ ├── test_bbox.py │ │ │ ├── test_docid.py │ │ │ ├── test_document.py │ │ │ ├── test_element.py │ │ │ └── test_table.py │ │ ├── evaluation │ │ │ ├── __init__.py │ │ │ ├── test_evaluate.py │ │ │ └── test_metrics.py │ │ ├── functions │ │ │ ├── __init__.py │ │ │ ├── test_elements.py │ │ │ ├── test_field_to_value.py │ │ │ ├── test_rabin_karp.py │ │ │ ├── test_simhash.py │ │ │ ├── test_text_chunker.py │ │ │ └── test_tokenizer.py │ │ ├── inmempyarrowfs.py │ │ ├── llms │ │ │ ├── prompts │ │ │ │ ├── __init__.py │ │ │ │ └── test_prompts.py │ │ │ ├── test_bedrock.py │ │ │ └── test_llms.py │ │ ├── query │ │ │ ├── __init__.py │ │ │ ├── conftest.py │ │ │ ├── execution │ │ │ │ ├── __init__.py │ │ │ │ ├── test_sycamore_executor.py │ │ │ │ └── test_sycamore_operator.py │ │ │ ├── test_node.py │ │ │ ├── test_operations.py │ │ │ ├── test_plan.py │ │ │ ├── test_planner.py │ │ │ ├── test_result.py │ │ │ ├── test_schema.py │ │ │ └── test_strategy.py │ │ ├── scans │ │ │ ├── __init__.py │ │ │ ├── test_file_scan.py │ │ │ └── test_materialized_scan.py │ │ ├── test_context.py │ │ ├── test_docset.py │ │ ├── test_executor.py │ │ ├── test_grouped_data.py │ │ ├── test_import_speed.py │ │ ├── test_materialize.py │ │ ├── test_node.py │ │ ├── test_reader.py │ │ ├── test_rewriter.py │ │ ├── test_schema.py │ │ ├── test_writer.py │ │ ├── transforms │ │ │ ├── __init__.py │ │ │ ├── check_partition_impl.py │ │ │ ├── property_extraction │ │ │ │ ├── test_attribution.py │ │ │ │ ├── test_extract.py │ │ │ │ ├── test_prompts.py │ │ │ │ ├── test_schema_extract.py │ │ │ │ ├── test_strategy.py │ │ │ │ ├── test_types.py │ │ │ │ └── test_utils.py │ │ │ ├── test_aggregation.py │ │ │ ├── test_aryn_partitioner.py │ │ │ ├── test_assign_doc_properties.py │ │ │ ├── test_augment_text.py │ │ │ ├── test_base.py │ │ │ ├── test_base_llm.py │ │ │ ├── test_basics.py │ │ │ ├── test_bbox_merge.py │ │ │ ├── test_clustering.py │ │ │ ├── test_detr_partitioner.py │ │ │ ├── test_embed.py │ │ │ ├── test_explode.py │ │ │ ├── test_extract_document_structure.py │ │ │ ├── test_extract_entity.py │ │ │ ├── test_extract_table_properties.py │ │ │ ├── test_graph_entity_extractor.py │ │ │ ├── test_graph_relationship_extractor.py │ │ │ ├── test_llm_filter.py │ │ │ ├── test_llm_query.py │ │ │ ├── test_mapping.py │ │ │ ├── test_merge_elements.py │ │ │ ├── test_partition.py │ │ │ ├── test_random_sample.py │ │ │ ├── test_regex_replace.py │ │ │ ├── test_resolve_graph_entities.py │ │ │ ├── test_schema.py │ │ │ ├── test_similarity.py │ │ │ ├── test_sketcher.py │ │ │ ├── test_sort.py │ │ │ ├── test_split_elements.py │ │ │ ├── test_spread_properties.py │ │ │ ├── test_standardizer.py │ │ │ ├── test_summarize.py │ │ │ ├── test_summarize_images.py │ │ │ ├── test_table_extractor.py │ │ │ ├── test_table_transfomers.py │ │ │ ├── test_term_frequency.py │ │ │ ├── test_union.py │ │ │ └── text_extraction │ │ │ │ └── test_ocr_models.py │ │ └── utils │ │ │ ├── test_bbox_sort.py │ │ │ ├── test_cache.py │ │ │ ├── test_deep_eq.py │ │ │ ├── test_derivation.py │ │ │ ├── test_extract_json.py │ │ │ ├── test_fileformat_tools.py │ │ │ ├── test_import_utils.py │ │ │ ├── test_jupyter.py │ │ │ ├── test_markdown.py │ │ │ ├── test_nested.py │ │ │ ├── test_pdf_utils.py │ │ │ ├── test_pyarrow.py │ │ │ ├── test_pydantic_pickling.py │ │ │ ├── test_ray_utils.py │ │ │ ├── test_rotation.py │ │ │ ├── test_similarity.py │ │ │ ├── test_strings.py │ │ │ ├── test_sycamore_logger.py │ │ │ ├── test_threading.py │ │ │ ├── test_time_trace.py │ │ │ ├── test_xycut_sort.py │ │ │ └── test_zip_traverse.py │ └── utils.py │ ├── transforms │ ├── __init__.py │ ├── aggregation.py │ ├── assign_doc_properties.py │ ├── augment_text.py │ ├── base.py │ ├── base_llm.py │ ├── basics.py │ ├── bbox_merge.py │ ├── clustering.py │ ├── dataset_scan.py │ ├── detr_partitioner.py │ ├── detr_partitioner_config.py │ ├── embed.py │ ├── explode.py │ ├── extract_document_structure.py │ ├── extract_entity.py │ ├── extract_graph_entities.py │ ├── extract_graph_relationships.py │ ├── extract_schema.py │ ├── extract_table.py │ ├── extract_table_properties.py │ ├── groupby_count.py │ ├── llm_filter.py │ ├── llm_query.py │ ├── map.py │ ├── mark_misc.py │ ├── markdown.py │ ├── merge_elements.py │ ├── partition.py │ ├── property_extraction │ │ ├── __init__.py │ │ ├── attribution.py │ │ ├── extract.py │ │ ├── merge_schemas.py │ │ ├── prompts.py │ │ ├── strategy.py │ │ ├── types.py │ │ └── utils.py │ ├── query.py │ ├── random_sample.py │ ├── regex_replace.py │ ├── resolve_graph_entities.py │ ├── similarity.py │ ├── sketcher.py │ ├── sort.py │ ├── split_elements.py │ ├── spread_properties.py │ ├── standardizer.py │ ├── summarize.py │ ├── summarize_images.py │ ├── table_structure │ │ ├── extract.py │ │ └── table_transformers.py │ ├── term_frequency.py │ ├── text_extraction │ │ ├── __init__.py │ │ ├── ocr_models.py │ │ ├── pdf_miner.py │ │ └── text_extractor.py │ └── union.py │ ├── utils │ ├── __init__.py │ ├── aryn_config.py │ ├── bbox_sort.py │ ├── cache.py │ ├── deep_eq.py │ ├── deprecate.py │ ├── derivation.py │ ├── element_sort.py │ ├── extract_json.py │ ├── fileformat_tools.py │ ├── html_utils.py │ ├── http.py │ ├── image_utils.py │ ├── import_utils.py │ ├── jupyter.py │ ├── lineage_utils.py │ ├── llm_utils.py │ ├── markdown.py │ ├── memory_debugging.py │ ├── merge_utils.py │ ├── model_load.py │ ├── nested.py │ ├── pdf.py │ ├── pdf_utils.py │ ├── pickle_pydantic.py │ ├── pyarrow │ │ ├── __init__.py │ │ ├── fs.py │ │ └── types.py │ ├── pytorch_dir.py │ ├── ray_utils.py │ ├── rotation.py │ ├── similarity.py │ ├── strings.py │ ├── sycamore_logger.py │ ├── thread_local.py │ ├── threading.py │ ├── time_trace.py │ ├── xycut.py │ └── zip_traverse.py │ └── writer.py ├── notebooks ├── ArynPartitionerExample.ipynb ├── ArynPartitionerPython.ipynb ├── ArynPartitionerWithLangchain.ipynb ├── EBGaramond-Bold.ttf ├── OpenAI-logprob.ipynb ├── VisualizePartitioner.ipynb ├── aryn-opensearch-bedrock-rag-example.ipynb ├── default-prep-script.ipynb ├── docprep │ ├── minilm-l6-v2_greedy-section-merger_duckdb.ipynb │ ├── minilm-l6-v2_greedy-section-merger_opensearch.ipynb │ ├── minilm-l6-v2_greedy-text-element-merger_duckdb.ipynb │ ├── minilm-l6-v2_marked-merger_duckdb.ipynb │ ├── text-embedding-3-small_greedy-section-merger_duckdb.ipynb │ ├── text-embedding-3-small_greedy-section-merger_pinecone.ipynb │ ├── text-embedding-3-small_greedy-text-element-merger_opensearch.ipynb │ └── text-embedding-3-small_marked-merger_pinecone.ipynb ├── duckdb-writer.ipynb ├── earnings_calls_notebooks │ ├── workshop_nb_0.ipynb │ ├── workshop_nb_1.ipynb │ ├── workshop_nb_2.ipynb │ ├── workshop_nb_3.ipynb │ └── workshop_nb_4.ipynb ├── elasticsearch-writer.ipynb ├── financial-docs-10k-example.ipynb ├── jupyter_dev_example.ipynb ├── metadata-extraction.ipynb ├── ndd_example.ipynb ├── ntsb-demo.ipynb ├── opensearch-writer.ipynb ├── opensearch_docs_etl.ipynb ├── pinecone-writer.ipynb ├── query-demo.ipynb ├── run-notebook-tests.sh ├── subtask-sample.ipynb ├── sycamore-tutorial-intermediate-etl.ipynb ├── sycamore_demo.ipynb ├── tutorial.ipynb ├── unpickle_query.ipynb └── weaviate-writer.ipynb ├── poetry.lock └── pyproject.toml /.dockerignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.dockerignore -------------------------------------------------------------------------------- /.env: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.env -------------------------------------------------------------------------------- /.gitattributes: -------------------------------------------------------------------------------- 1 | sycamore/tests/resources/data/** -linguist-detectable 2 | -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/bug_report.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/ISSUE_TEMPLATE/bug_report.md -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/feature_request.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/ISSUE_TEMPLATE/feature_request.md -------------------------------------------------------------------------------- /.github/actions/greplint/action.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/actions/greplint/action.yml -------------------------------------------------------------------------------- /.github/workflows/codeql.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/codeql.yml -------------------------------------------------------------------------------- /.github/workflows/dependency-review.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/dependency-review.yml -------------------------------------------------------------------------------- /.github/workflows/doclint.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/doclint.yml -------------------------------------------------------------------------------- /.github/workflows/draft_release.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/draft_release.yml -------------------------------------------------------------------------------- /.github/workflows/linting.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/linting.yml -------------------------------------------------------------------------------- /.github/workflows/pypi_release.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/pypi_release.yml -------------------------------------------------------------------------------- /.github/workflows/remote-integ-tests.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/remote-integ-tests.yml -------------------------------------------------------------------------------- /.github/workflows/testing.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.github/workflows/testing.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.gitmodules -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /.readthedocs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/.readthedocs.yaml -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/README.md -------------------------------------------------------------------------------- /apps/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/Makefile -------------------------------------------------------------------------------- /apps/docker-base/Dockerfile.buildx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/docker-base/Dockerfile.buildx -------------------------------------------------------------------------------- /apps/docker-base/Makefile.docker-base: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/docker-base/Makefile.docker-base -------------------------------------------------------------------------------- /apps/docker-base/gen-pyproject-copy.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/docker-base/gen-pyproject-copy.sh -------------------------------------------------------------------------------- /apps/docker-base/poetry-install.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/docker-base/poetry-install.sh -------------------------------------------------------------------------------- /apps/git/git-credential-from-env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/git/git-credential-from-env.py -------------------------------------------------------------------------------- /apps/integration/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/README.md -------------------------------------------------------------------------------- /apps/integration/integration/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/__init__.py -------------------------------------------------------------------------------- /apps/integration/integration/automation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /apps/integration/integration/automation/runtests.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/automation/runtests.sh -------------------------------------------------------------------------------- /apps/integration/integration/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/conftest.py -------------------------------------------------------------------------------- /apps/integration/integration/containers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /apps/integration/integration/containers/running.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/containers/running.py -------------------------------------------------------------------------------- /apps/integration/integration/containers/stack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/containers/stack.py -------------------------------------------------------------------------------- /apps/integration/integration/ingests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /apps/integration/integration/ingests/crawler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/ingests/crawler.py -------------------------------------------------------------------------------- /apps/integration/integration/ingests/index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/ingests/index.py -------------------------------------------------------------------------------- /apps/integration/integration/ingests/index_info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/ingests/index_info.py -------------------------------------------------------------------------------- /apps/integration/integration/ingests/jupyter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/ingests/jupyter.py -------------------------------------------------------------------------------- /apps/integration/integration/queries/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /apps/integration/integration/queries/opensearch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/queries/opensearch.py -------------------------------------------------------------------------------- /apps/integration/integration/queries/options.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/queries/options.py -------------------------------------------------------------------------------- /apps/integration/integration/queries/queries.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/queries/queries.py -------------------------------------------------------------------------------- /apps/integration/integration/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /apps/integration/integration/tests/test_basic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/integration/tests/test_basic.py -------------------------------------------------------------------------------- /apps/integration/poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/poetry.lock -------------------------------------------------------------------------------- /apps/integration/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/integration/pyproject.toml -------------------------------------------------------------------------------- /apps/jupyter/Dockerfile.buildx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/Dockerfile.buildx -------------------------------------------------------------------------------- /apps/jupyter/Makefile.jupyter: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/Makefile.jupyter -------------------------------------------------------------------------------- /apps/jupyter/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/README.md -------------------------------------------------------------------------------- /apps/jupyter/bind_dir/BIND_MOUNT_BETWEEN_DOCKER_AND_HOST: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /apps/jupyter/bind_dir/setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/bind_dir/setup.sh -------------------------------------------------------------------------------- /apps/jupyter/entrypoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/entrypoint.py -------------------------------------------------------------------------------- /apps/jupyter/poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/poetry.lock -------------------------------------------------------------------------------- /apps/jupyter/profile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/profile -------------------------------------------------------------------------------- /apps/jupyter/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/pyproject.toml -------------------------------------------------------------------------------- /apps/jupyter/run-jupyter.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/run-jupyter.sh -------------------------------------------------------------------------------- /apps/jupyter/sudoers: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/jupyter/sudoers -------------------------------------------------------------------------------- /apps/opensearch/2.11/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/2.11/Dockerfile -------------------------------------------------------------------------------- /apps/opensearch/2.11/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/2.11/README.md -------------------------------------------------------------------------------- /apps/opensearch/2.11/opensearch.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/2.11/opensearch.yml -------------------------------------------------------------------------------- /apps/opensearch/2.11/sycamore-opensearch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/2.11/sycamore-opensearch.sh -------------------------------------------------------------------------------- /apps/opensearch/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/Dockerfile -------------------------------------------------------------------------------- /apps/opensearch/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/README.md -------------------------------------------------------------------------------- /apps/opensearch/authority.pem: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/authority.pem -------------------------------------------------------------------------------- /apps/opensearch/config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/config.yml -------------------------------------------------------------------------------- /apps/opensearch/opensearch.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/opensearch.yml -------------------------------------------------------------------------------- /apps/opensearch/roles_mapping.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/roles_mapping.yml -------------------------------------------------------------------------------- /apps/opensearch/setup_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/setup_models.py -------------------------------------------------------------------------------- /apps/opensearch/sycamore-opensearch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/opensearch/sycamore-opensearch.sh -------------------------------------------------------------------------------- /apps/remote-processor-service/Dockerfile.build: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/Dockerfile.build -------------------------------------------------------------------------------- /apps/remote-processor-service/Dockerfile.buildx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/Dockerfile.buildx -------------------------------------------------------------------------------- /apps/remote-processor-service/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/Makefile -------------------------------------------------------------------------------- /apps/remote-processor-service/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/README.md -------------------------------------------------------------------------------- /apps/remote-processor-service/config/pipelines.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/config/pipelines.yml -------------------------------------------------------------------------------- /apps/remote-processor-service/poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/poetry.lock -------------------------------------------------------------------------------- /apps/remote-processor-service/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/pyproject.toml -------------------------------------------------------------------------------- /apps/remote-processor-service/remote_processor_service/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/remote_processor_service/cli.py -------------------------------------------------------------------------------- /apps/remote-processor-service/remote_processor_service/rps_docker_entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/remote-processor-service/remote_processor_service/rps_docker_entrypoint.sh -------------------------------------------------------------------------------- /apps/timetrace/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/timetrace/Makefile -------------------------------------------------------------------------------- /apps/timetrace/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/timetrace/README.md -------------------------------------------------------------------------------- /apps/timetrace/ttanal: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/timetrace/ttanal -------------------------------------------------------------------------------- /apps/timetrace/ttcat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/timetrace/ttcat -------------------------------------------------------------------------------- /apps/timetrace/ttviz.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/apps/timetrace/ttviz.cpp -------------------------------------------------------------------------------- /autogen-groups.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/autogen-groups.py -------------------------------------------------------------------------------- /compose.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/compose.yaml -------------------------------------------------------------------------------- /docs/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/Makefile -------------------------------------------------------------------------------- /docs/make.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/make.bat -------------------------------------------------------------------------------- /docs/source/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/conf.py -------------------------------------------------------------------------------- /docs/source/images/ArynArchitecture_APS+Sycamorev2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/images/ArynArchitecture_APS+Sycamorev2.png -------------------------------------------------------------------------------- /docs/source/images/SycamoreDataflowDiagramv2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/images/SycamoreDataflowDiagramv2.png -------------------------------------------------------------------------------- /docs/source/images/SycamoreDiagram2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/images/SycamoreDiagram2.png -------------------------------------------------------------------------------- /docs/source/images/favicon.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/images/favicon.ico -------------------------------------------------------------------------------- /docs/source/images/query_execution.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/images/query_execution.svg -------------------------------------------------------------------------------- /docs/source/images/sycamore_logo.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/images/sycamore_logo.svg -------------------------------------------------------------------------------- /docs/source/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/index.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/context.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/context.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/docset.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/docset.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/docsetreader.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/docsetreader.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/docsetwriter.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/docsetwriter.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/document.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/document.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/functions.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/functions.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/gen: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/gen -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/llm.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/llm.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/assign_doc_properties.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/assign_doc_properties.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/augment_text.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/augment_text.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/basics.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/basics.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/bbox_merge.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/bbox_merge.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/detr_partitioner.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/detr_partitioner.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/embed.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/embed.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/explode.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/explode.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/extract_entity.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/extract_entity.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/extract_schema.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/extract_schema.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/extract_table.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/extract_table.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/extract_table_properties.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/extract_table_properties.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/llm_map.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/llm_map.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/llm_query.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/llm_query.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/map.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/map.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/mark_misc.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/mark_misc.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/merge_elements.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/merge_elements.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/partition.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/partition.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/query.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/query.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/random_sample.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/random_sample.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/regex_replace.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/regex_replace.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/sketcher.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/sketcher.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/split_elements.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/split_elements.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/spread_properties.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/spread_properties.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/standardizer.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/standardizer.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/summarize.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/summarize.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/low_level_transforms/summarize_images.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/low_level_transforms/summarize_images.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/node.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/node.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/prompts.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/prompts.rst -------------------------------------------------------------------------------- /docs/source/sycamore/APIs/query.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/APIs/query.rst -------------------------------------------------------------------------------- /docs/source/sycamore/connectors.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors.rst -------------------------------------------------------------------------------- /docs/source/sycamore/connectors/duckdb.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors/duckdb.md -------------------------------------------------------------------------------- /docs/source/sycamore/connectors/elasticsearch.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors/elasticsearch.md -------------------------------------------------------------------------------- /docs/source/sycamore/connectors/neo4j.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors/neo4j.md -------------------------------------------------------------------------------- /docs/source/sycamore/connectors/opensearch.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors/opensearch.md -------------------------------------------------------------------------------- /docs/source/sycamore/connectors/pinecone.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors/pinecone.md -------------------------------------------------------------------------------- /docs/source/sycamore/connectors/qdrant.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors/qdrant.md -------------------------------------------------------------------------------- /docs/source/sycamore/connectors/weaviate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/connectors/weaviate.md -------------------------------------------------------------------------------- /docs/source/sycamore/get_started.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/get_started.rst -------------------------------------------------------------------------------- /docs/source/sycamore/get_started/ai_configuration.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/get_started/ai_configuration.md -------------------------------------------------------------------------------- /docs/source/sycamore/get_started/concepts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/get_started/concepts.md -------------------------------------------------------------------------------- /docs/source/sycamore/get_started/hardware.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/get_started/hardware.md -------------------------------------------------------------------------------- /docs/source/sycamore/query.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/query.rst -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/APIs/conversation_memory.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/APIs/conversation_memory.rst -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/APIs/conversation_memory/functions.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/APIs/conversation_memory/functions.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/APIs/gen: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/APIs/gen -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/architecture.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/architecture.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/imgs/ConversationMemoryMultiAgent.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/imgs/ConversationMemoryMultiAgent.jpg -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/imgs/ConversationMemoryMultiAgent.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/imgs/ConversationMemoryMultiAgent.png -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/imgs/resource-diagram.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/imgs/resource-diagram.png -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/overview.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/overview.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/storage_for_genai_agents.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/storage_for_genai_agents.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/using_with_conversational_search.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/conversation_memory/using_with_conversational_search.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/dedup.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/dedup.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/demo_query_ui.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/demo_query_ui.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/encryption.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/encryption.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/hybrid_search.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/hybrid_search.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/imgs/pipeline-architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/imgs/pipeline-architecture.png -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/imgs/xlarge_DemoUI_FollowUpQuestion.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/imgs/xlarge_DemoUI_FollowUpQuestion.png -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/integrate_your_application.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/integrate_your_application.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/launching_with_Docker.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/launching_with_Docker.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/load_data.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/load_data.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/remote_processors.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/remote_processors.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/reranking.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/reranking.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/running_a_data_preparation_job.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/running_a_data_preparation_job.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/using_jupyter_container.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/using_jupyter_container.md -------------------------------------------------------------------------------- /docs/source/sycamore/querying_data/using_aryn_opensearch_stack/using_rag_pipelines.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/querying_data/using_aryn_opensearch_stack/using_rag_pipelines.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms.rst -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/embed.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/embed.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/explode.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/explode.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/extract_entity.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/extract_entity.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/extract_schema.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/extract_schema.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/filter.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/filter.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/flatmap.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/flatmap.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/llm_query.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/llm_query.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/map.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/map.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/map_batch.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/map_batch.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/materialize.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/materialize.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/merge.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/merge.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/partition.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/partition.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/sketch.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/sketch.md -------------------------------------------------------------------------------- /docs/source/sycamore/transforms/summarize.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/transforms/summarize.md -------------------------------------------------------------------------------- /docs/source/sycamore/tutorials.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/tutorials.rst -------------------------------------------------------------------------------- /docs/source/sycamore/tutorials/conversational_memory_with_langchain.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/tutorials/conversational_memory_with_langchain.md -------------------------------------------------------------------------------- /docs/source/sycamore/tutorials/etl_for_opensearch.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/tutorials/etl_for_opensearch.md -------------------------------------------------------------------------------- /docs/source/sycamore/tutorials/etl_for_weaviate_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/tutorials/etl_for_weaviate_tutorial.md -------------------------------------------------------------------------------- /docs/source/sycamore/tutorials/etl_pinecone_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/tutorials/etl_pinecone_tutorial.md -------------------------------------------------------------------------------- /docs/source/sycamore/tutorials/sycamore_jupyter_dev_example.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/tutorials/sycamore_jupyter_dev_example.md -------------------------------------------------------------------------------- /docs/source/sycamore/using_jupyter.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/docs/source/sycamore/using_jupyter.md -------------------------------------------------------------------------------- /examples/bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bench.py -------------------------------------------------------------------------------- /examples/bigquery-docparse/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/README.md -------------------------------------------------------------------------------- /examples/bigquery-docparse/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/config.py -------------------------------------------------------------------------------- /examples/bigquery-docparse/deploy-cf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/deploy-cf.sh -------------------------------------------------------------------------------- /examples/bigquery-docparse/download-finals.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/download-finals.py -------------------------------------------------------------------------------- /examples/bigquery-docparse/get_status/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/get_status/main.py -------------------------------------------------------------------------------- /examples/bigquery-docparse/get_status/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/get_status/requirements.txt -------------------------------------------------------------------------------- /examples/bigquery-docparse/info.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/info.sh -------------------------------------------------------------------------------- /examples/bigquery-docparse/populate_uris.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/populate_uris.py -------------------------------------------------------------------------------- /examples/bigquery-docparse/queue_async.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/queue_async.py -------------------------------------------------------------------------------- /examples/bigquery-docparse/sleep_until.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/sleep_until.py -------------------------------------------------------------------------------- /examples/bigquery-docparse/stored_procedures.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/stored_procedures.sql -------------------------------------------------------------------------------- /examples/bigquery-docparse/sync_code_with_bigquery.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/bigquery-docparse/sync_code_with_bigquery.py -------------------------------------------------------------------------------- /examples/html_ingest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/html_ingest.py -------------------------------------------------------------------------------- /examples/markdown.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/markdown.py -------------------------------------------------------------------------------- /examples/ndd_debug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/ndd_debug.py -------------------------------------------------------------------------------- /examples/query/ntsb_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/query/ntsb_loader.py -------------------------------------------------------------------------------- /examples/query/ntsb_loader_materialized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/query/ntsb_loader_materialized.py -------------------------------------------------------------------------------- /examples/query/simple_ntsb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/query/simple_ntsb.py -------------------------------------------------------------------------------- /examples/s3_ingest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/s3_ingest.py -------------------------------------------------------------------------------- /examples/simple_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/simple_config.py -------------------------------------------------------------------------------- /examples/simple_duckdb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/simple_duckdb.py -------------------------------------------------------------------------------- /examples/simple_ingest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/simple_ingest.py -------------------------------------------------------------------------------- /examples/simple_neo4j.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/simple_neo4j.py -------------------------------------------------------------------------------- /examples/simple_pinecone.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/simple_pinecone.py -------------------------------------------------------------------------------- /examples/simple_qdrant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/simple_qdrant.py -------------------------------------------------------------------------------- /examples/simple_weaviate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/examples/simple_weaviate.py -------------------------------------------------------------------------------- /lib/import_timer/README.md: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/import_timer/import_timer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/import_timer/import_timer.py -------------------------------------------------------------------------------- /lib/import_timer/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/import_timer/pyproject.toml -------------------------------------------------------------------------------- /lib/poetry-lock/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/poetry-lock/README.md -------------------------------------------------------------------------------- /lib/poetry-lock/poetry-lock-all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/poetry-lock/poetry-lock-all.sh -------------------------------------------------------------------------------- /lib/poetry-lock/poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/poetry-lock/poetry.lock -------------------------------------------------------------------------------- /lib/poetry-lock/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/poetry-lock/pyproject.toml -------------------------------------------------------------------------------- /lib/poetry-lock/sycamore_poetry_lock/noop.py: -------------------------------------------------------------------------------- 1 | pass 2 | -------------------------------------------------------------------------------- /lib/remote-processors/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/Makefile -------------------------------------------------------------------------------- /lib/remote-processors/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/README.md -------------------------------------------------------------------------------- /lib/remote-processors/img/RPS_Architecture.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/img/RPS_Architecture.svg -------------------------------------------------------------------------------- /lib/remote-processors/poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/poetry.lock -------------------------------------------------------------------------------- /lib/remote-processors/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/pyproject.toml -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/__init__.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/processors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/processors/__init__.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/processors/debug_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/processors/debug_processor.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/processors/dedup_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/processors/dedup_processor.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/processors/processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/processors/processor.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/search_request.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/search_request.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/search_response.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/search_response.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/server/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/server/__init__.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/server/pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/server/pipeline.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/server/processor_registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/server/processor_registry.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/server/remote_processor_service.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/server/remote_processor_service.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/integration/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/integration/conftest.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/integration/test_integ_debug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/integration/test_integ_debug.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/resources/configs/malformed/dupe_pipeline_names.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/resources/configs/malformed/dupe_pipeline_names.yml -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/resources/configs/malformed/not_a_list.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/resources/configs/malformed/not_a_list.yml -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/resources/configs/malformed/pipeline_not_a_map.yml: -------------------------------------------------------------------------------- 1 | - debug 2 | -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/resources/configs/malformed/pipeline_with_many_keys.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/resources/configs/malformed/pipeline_with_many_keys.yml -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/resources/configs/valid.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/resources/configs/valid.yml -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/resources/sb_processed.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/resources/sb_processed.jsonl -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/processors/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/processors/test_debug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/unit/processors/test_debug.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/processors/test_dedup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/unit/processors/test_dedup.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/processors/test_library.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/unit/processors/test_library.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/service/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/service/test_pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/unit/service/test_pipeline.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/service/test_processor_registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/unit/service/test_processor_registry.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/service/test_remote_processor_service.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/unit/service/test_remote_processor_service.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/unit/test_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/unit/test_base.py -------------------------------------------------------------------------------- /lib/remote-processors/remote_processors/test/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/remote-processors/remote_processors/test/utils.py -------------------------------------------------------------------------------- /lib/sycamore/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/README.md -------------------------------------------------------------------------------- /lib/sycamore/poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/poetry.lock -------------------------------------------------------------------------------- /lib/sycamore/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/pyproject.toml -------------------------------------------------------------------------------- /lib/sycamore/sycamore/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/README.md -------------------------------------------------------------------------------- /lib/sycamore/sycamore/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/aryn/ArynReader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/aryn/ArynReader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/aryn/ArynWriter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/aryn/ArynWriter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/aryn/client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/aryn/client.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/base_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/base_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/base_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/base_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/common.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/doc_reconstruct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/doc_reconstruct.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/duckdb/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/duckdb/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/duckdb/duckdb_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/duckdb/duckdb_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/duckdb/duckdb_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/duckdb/duckdb_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/elasticsearch/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/elasticsearch/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/elasticsearch/elasticsearch_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/elasticsearch/elasticsearch_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/elasticsearch/elasticsearch_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/elasticsearch/elasticsearch_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/file/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/file/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/file/file_scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/file/file_scan.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/file/file_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/file/file_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/file/file_writer_ray.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/file/file_writer_ray.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/file/materialized_scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/file/materialized_scan.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/iceberg/iceberg_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/iceberg/iceberg_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/neo4j/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/neo4j/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/neo4j/neo4j_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/neo4j/neo4j_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/opensearch/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/opensearch/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/opensearch/opensearch_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/opensearch/opensearch_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/opensearch/opensearch_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/opensearch/opensearch_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/opensearch/sync.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/opensearch/sync.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/opensearch/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/opensearch/utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/pinecone/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/pinecone/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/pinecone/pinecone_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/pinecone/pinecone_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/pinecone/pinecone_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/pinecone/pinecone_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/qdrant/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/qdrant/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/qdrant/qdrant_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/qdrant/qdrant_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/qdrant/qdrant_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/qdrant/qdrant_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/weaviate/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/weaviate/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/weaviate/weaviate_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/weaviate/weaviate_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/connectors/weaviate/weaviate_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/connectors/weaviate/weaviate_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/context.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/context.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/data/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/data/bbox.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/data/bbox.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/data/docid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/data/docid.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/data/document.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/data/document.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/data/element.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/data/element.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/data/metadata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/data/metadata.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/data/table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/data/table.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/decorators.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/decorators.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/docset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/docset.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/data.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/datasets.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/evaluate.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/metrics/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/metrics/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/metrics/generated_answer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/metrics/generated_answer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/metrics/retrieval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/metrics/retrieval.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/ocr/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/ocr/__main__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/ocr/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/ocr/data.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/ocr/llm_ocr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/ocr/llm_ocr.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/ocr/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/ocr/metrics.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/ocr/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/ocr/models.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/pipeline.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/evaluation/subtasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/evaluation/subtasks.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/executor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/basic_filters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/basic_filters.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/chunker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/chunker.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/document.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/document.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/elements.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/elements.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/rabin_karp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/rabin_karp.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/simhash.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/simhash.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/functions/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/functions/tokenizer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/grouped_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/grouped_data.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/anthropic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/anthropic.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/bedrock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/bedrock.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/chained_llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/chained_llm.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/config.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/gemini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/gemini.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/llms.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/llms.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/openai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/openai.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/prompts/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/prompts/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/prompts/default_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/prompts/default_prompts.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/prompts/jinja_fragments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/prompts/jinja_fragments.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/llms/prompts/prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/llms/prompts/prompts.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/materialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/materialize.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/materialize_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/materialize_config.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/plan_nodes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/plan_nodes.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/README.md -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/client.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/execution/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/execution/aggregation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/execution/aggregation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/execution/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/execution/metrics.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/execution/operations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/execution/operations.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/execution/physical_operator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/execution/physical_operator.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/execution/sycamore_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/execution/sycamore_executor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/execution/sycamore_operator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/execution/sycamore_operator.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/logical_plan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/logical_plan.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/basic_filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/basic_filter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/clustering.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/clustering.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/count.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/count.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/field_in.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/field_in.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/groupby.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/groupby.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/limit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/limit.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/llm_extract_entity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/llm_extract_entity.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/llm_filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/llm_filter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/math.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/query_database.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/query_database.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/summarize_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/summarize_data.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/top_k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/top_k.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/operators/unroll.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/operators/unroll.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/planner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/planner.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/planner_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/planner_prompt.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/result.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/schema.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/schema.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/query/strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/query/strategy.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/rules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/rules/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/rules/optimize_resource_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/rules/optimize_resource_args.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/schema.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/schema.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/README.md -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/config.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/conftest.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/aryn/test_aryn_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/aryn/test_aryn_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/aryn/test_aryn_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/aryn/test_aryn_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/aryn/test_client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/aryn/test_client.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/common.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/duckdb/test_duckdb_read.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/duckdb/test_duckdb_read.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/duckdb/test_pdf_to_duckdb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/duckdb/test_pdf_to_duckdb.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/elasticsearch/test_elasticsearch_read.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/elasticsearch/test_elasticsearch_read.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/elasticsearch/test_pdf_to_elasticsearch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/elasticsearch/test_pdf_to_elasticsearch.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/file/test_file_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/file/test_file_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/file/test_file_writer_to_s3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/file/test_file_writer_to_s3.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/neo4j/test_docset_to_neo4j.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/neo4j/test_docset_to_neo4j.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/neo4j/test_neo4j_writer_methods.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/neo4j/test_neo4j_writer_methods.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/opensearch/test_html_to_opensearch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/opensearch/test_html_to_opensearch.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/opensearch/test_opensearch_read.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/opensearch/test_opensearch_read.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/opensearch/test_pdf_to_opensearch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/opensearch/test_pdf_to_opensearch.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/pinecone/test_pdf_to_pinecone.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/pinecone/test_pdf_to_pinecone.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/pinecone/test_pinecone_read.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/pinecone/test_pinecone_read.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/qdrant/test_qdrant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/qdrant/test_qdrant.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/weaviate/test_pdf_to_weaviate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/weaviate/test_pdf_to_weaviate.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/connectors/weaviate/test_weaviate_read.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/connectors/weaviate/test_weaviate_read.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/evaluation/test_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/evaluation/test_datasets.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/evaluation/test_evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/evaluation/test_evaluate.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/evaluation/test_pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/evaluation/test_pipeline.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/functions/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/functions/test_document.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/functions/test_document.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/llms/test_anthropic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/llms/test_anthropic.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/llms/test_bedrock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/llms/test_bedrock.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/llms/test_chained_llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/llms/test_chained_llm.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/llms/test_gemini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/llms/test_gemini.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/llms/test_openai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/llms/test_openai.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/query/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/query/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/query/conftest.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/query/execution/test_operations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/query/execution/test_operations.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/query/execution/test_sycamore_query.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/query/execution/test_sycamore_query.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/query/test_planner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/query/test_planner.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/query/test_query_opensearch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/query/test_query_opensearch.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/test_docset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/test_docset.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/test_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/test_executor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/test_image_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/test_image_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/test_materialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/test_materialize.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/textractor/test_textractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/textractor/test_textractor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/property_extraction/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/property_extraction/test_schema_extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/property_extraction/test_schema_extract.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_aggregation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_aggregation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_base.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_data_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_data_extraction.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_embed.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_llm_filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_llm_filter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_map.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_ocr_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_ocr_models.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_partition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_partition.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_random_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_random_sample.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_rerank.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_rerank.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_summarize_images.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_summarize_images.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_table_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_table_extraction.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/transforms/test_union.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/transforms/test_union.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/integration/utils/test_pdf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/integration/utils/test_pdf.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/manual/pdf2image_memusage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/manual/pdf2image_memusage.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/manual/test_fast_sycamore_import.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/manual/test_fast_sycamore_import.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/manual/test_opensearch_sync.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/manual/test_opensearch_sync.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/pytest.ini: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/docx/aryn_website_sample.docx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/docx/aryn_website_sample.docx -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/htmls/wikipedia_binary_search.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/htmls/wikipedia_binary_search.html -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/imgs/sample-detr-image.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/imgs/sample-detr-image.png -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/imgs/vert_table.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/imgs/vert_table.png -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/json/example.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/json/example.json -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/json/model_server_output_transformer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/json/model_server_output_transformer.json -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/json/model_server_output_transformer_extract_tables.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/json/model_server_output_transformer_extract_tables.json -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/json_writer/3fe9913e-60e2-11ef-90e5-e40d36f1e1ae.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/materialize/json_writer/3fe9913e-60e2-11ef-90e5-e40d36f1e1ae.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/json_writer/materialize.success: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/json_writer/md-9e6e68ee-ad8e-4e39-a2e1-7ef5befc588c.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/materialize/json_writer/md-9e6e68ee-ad8e-4e39-a2e1-7ef5befc588c.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/materialize.clean: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/materialize.success: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-07bgl12pc0intnh2y74po4c.a98b82d885005500fb664fb18283cf80864de0fb6116e5acd9c3060dd91086a7.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-07bgl12pc0intnh2y74po4c.a98b82d885005500fb664fb18283cf80864de0fb6116e5acd9c3060dd91086a7.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-6wi2aqr0b504zojkdqnyybf.97ae3a37a86700c4601f89551892eb79faeaa0c9afe66f26ee20d8b7f996f929.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-6wi2aqr0b504zojkdqnyybf.97ae3a37a86700c4601f89551892eb79faeaa0c9afe66f26ee20d8b7f996f929.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-75qp993ysz87aa1c1tsc5o0.0db762bad4ffb81bdde0f754087a65594f0cc8001986729f6ded86fa7ca7803e.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-75qp993ysz87aa1c1tsc5o0.0db762bad4ffb81bdde0f754087a65594f0cc8001986729f6ded86fa7ca7803e.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-89ww3vta189zsw6ac4vsjem.253ac204a7d81cc730b4a90202afaf3f78dbf27c87a17bcb94a23212b159cce6.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-89ww3vta189zsw6ac4vsjem.253ac204a7d81cc730b4a90202afaf3f78dbf27c87a17bcb94a23212b159cce6.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-a8pg30d1wqbff3zsf6c4l0w.c75fd5cba213cc7888ffe30f52d9fb7b637acd227a728b07ee7e1c50545c884e.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/materialize/llmfilter-ntsb-temp/md-d-a8pg30d1wqbff3zsf6c4l0w.c75fd5cba213cc7888ffe30f52d9fb7b637acd227a728b07ee7e1c50545c884e.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/nested_json/example.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/nested_json/example.json -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/ocr_pdfs/test_simple_ocr.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/ocr_pdfs/test_simple_ocr.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/Ray.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/Ray.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/Ray_page1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/Ray_page1.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/Ray_page11.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/Ray_page11.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/Transformer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/Transformer.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/basic_table.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/basic_table.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/doctor_testimonial.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/doctor_testimonial.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb-report.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb-report.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb0.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb0.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb1.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/ntsb3.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pdfs/visit_aryn.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pdfs/visit_aryn.pdf -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/pptx/design.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/pptx/design.pptx -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/data/texts/Ray.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/data/texts/Ray.txt -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/resources/objects/weaviate/collection_params_b.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/resources/objects/weaviate/collection_params_b.pickle -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/aryn/test_aryn_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/aryn/test_aryn_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/common/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/common/test_base_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/common/test_base_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/common/test_base_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/common/test_base_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/common/test_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/common/test_common.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/duckdb/test_duckdb_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/duckdb/test_duckdb_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/duckdb/test_duckdb_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/duckdb/test_duckdb_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/elasticsearch/test_elasticsearch_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/elasticsearch/test_elasticsearch_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/elasticsearch/test_elasticsearch_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/elasticsearch/test_elasticsearch_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/file/test_file_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/file/test_file_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/iceberg/test_iceberg_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/iceberg/test_iceberg_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/opensearch/test_opensearch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/opensearch/test_opensearch.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/opensearch/test_sync.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/opensearch/test_sync.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/pinecone/test_pinecone_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/pinecone/test_pinecone_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/pinecone/test_pinecone_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/pinecone/test_pinecone_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/qdrant/test_qdrant_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/qdrant/test_qdrant_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/weaviate/test_weaviate_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/weaviate/test_weaviate_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/connectors/weaviate/test_weaviate_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/connectors/weaviate/test_weaviate_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/data/test_bbox.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/data/test_bbox.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/data/test_docid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/data/test_docid.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/data/test_document.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/data/test_document.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/data/test_element.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/data/test_element.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/data/test_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/data/test_table.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/evaluation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/evaluation/test_evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/evaluation/test_evaluate.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/evaluation/test_metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/evaluation/test_metrics.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/functions/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/functions/test_elements.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/functions/test_elements.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/functions/test_field_to_value.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/functions/test_field_to_value.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/functions/test_rabin_karp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/functions/test_rabin_karp.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/functions/test_simhash.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/functions/test_simhash.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/functions/test_text_chunker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/functions/test_text_chunker.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/functions/test_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/functions/test_tokenizer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/inmempyarrowfs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/inmempyarrowfs.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/llms/prompts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/llms/prompts/test_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/llms/prompts/test_prompts.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/llms/test_bedrock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/llms/test_bedrock.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/llms/test_llms.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/llms/test_llms.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/conftest.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/execution/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/execution/test_sycamore_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/execution/test_sycamore_executor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/execution/test_sycamore_operator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/execution/test_sycamore_operator.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/test_node.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/test_node.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/test_operations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/test_operations.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/test_plan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/test_plan.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/test_planner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/test_planner.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/test_result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/test_result.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/test_schema.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/test_schema.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/query/test_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/query/test_strategy.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/scans/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/scans/test_file_scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/scans/test_file_scan.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/scans/test_materialized_scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/scans/test_materialized_scan.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_context.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_context.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_docset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_docset.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_executor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_grouped_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_grouped_data.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_import_speed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_import_speed.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_materialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_materialize.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_node.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_node.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_reader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_reader.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_rewriter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_rewriter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_schema.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_schema.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/test_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/test_writer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/check_partition_impl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/check_partition_impl.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_attribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_attribution.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_extract.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_prompts.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_schema_extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_schema_extract.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_strategy.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_types.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/property_extraction/test_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_aggregation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_aggregation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_aryn_partitioner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_aryn_partitioner.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_assign_doc_properties.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_assign_doc_properties.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_augment_text.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_augment_text.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_base.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_base_llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_base_llm.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_basics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_basics.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_bbox_merge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_bbox_merge.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_clustering.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_clustering.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_detr_partitioner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_detr_partitioner.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_embed.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_explode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_explode.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_extract_document_structure.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_extract_document_structure.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_extract_entity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_extract_entity.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_extract_table_properties.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_extract_table_properties.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_graph_entity_extractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_graph_entity_extractor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_graph_relationship_extractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_graph_relationship_extractor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_llm_filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_llm_filter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_llm_query.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_llm_query.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_mapping.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_mapping.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_merge_elements.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_merge_elements.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_partition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_partition.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_random_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_random_sample.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_regex_replace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_regex_replace.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_resolve_graph_entities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_resolve_graph_entities.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_schema.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_schema.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_similarity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_similarity.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_sketcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_sketcher.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_split_elements.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_split_elements.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_spread_properties.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_spread_properties.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_standardizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_standardizer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_summarize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_summarize.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_summarize_images.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_summarize_images.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_table_extractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_table_extractor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_table_transfomers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_table_transfomers.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_term_frequency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_term_frequency.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/test_union.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/test_union.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/transforms/text_extraction/test_ocr_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/transforms/text_extraction/test_ocr_models.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_bbox_sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_bbox_sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_cache.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_deep_eq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_deep_eq.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_derivation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_derivation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_extract_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_extract_json.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_fileformat_tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_fileformat_tools.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_import_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_import_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_jupyter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_jupyter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_markdown.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_markdown.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_nested.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_nested.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_pdf_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_pdf_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_pyarrow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_pyarrow.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_pydantic_pickling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_pydantic_pickling.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_ray_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_ray_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_rotation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_rotation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_similarity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_similarity.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_strings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_strings.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_sycamore_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_sycamore_logger.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_threading.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_threading.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_time_trace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_time_trace.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_xycut_sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_xycut_sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/unit/utils/test_zip_traverse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/unit/utils/test_zip_traverse.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/tests/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/tests/utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/aggregation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/aggregation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/assign_doc_properties.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/assign_doc_properties.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/augment_text.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/augment_text.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/base.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/base_llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/base_llm.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/basics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/basics.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/bbox_merge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/bbox_merge.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/clustering.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/clustering.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/dataset_scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/dataset_scan.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/detr_partitioner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/detr_partitioner.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/detr_partitioner_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/detr_partitioner_config.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/embed.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/explode.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/explode.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/extract_document_structure.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/extract_document_structure.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/extract_entity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/extract_entity.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/extract_graph_entities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/extract_graph_entities.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/extract_graph_relationships.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/extract_graph_relationships.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/extract_schema.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/extract_schema.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/extract_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/extract_table.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/extract_table_properties.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/extract_table_properties.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/groupby_count.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/groupby_count.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/llm_filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/llm_filter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/llm_query.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/llm_query.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/map.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/mark_misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/mark_misc.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/markdown.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/markdown.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/merge_elements.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/merge_elements.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/partition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/partition.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/attribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/property_extraction/attribution.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/property_extraction/extract.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/merge_schemas.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/property_extraction/merge_schemas.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/property_extraction/prompts.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/property_extraction/strategy.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/property_extraction/types.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/property_extraction/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/property_extraction/utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/query.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/query.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/random_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/random_sample.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/regex_replace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/regex_replace.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/resolve_graph_entities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/resolve_graph_entities.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/similarity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/similarity.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/sketcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/sketcher.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/split_elements.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/split_elements.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/spread_properties.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/spread_properties.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/standardizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/standardizer.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/summarize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/summarize.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/summarize_images.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/summarize_images.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/table_structure/extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/table_structure/extract.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/table_structure/table_transformers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/table_structure/table_transformers.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/term_frequency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/term_frequency.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/text_extraction/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/text_extraction/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/text_extraction/ocr_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/text_extraction/ocr_models.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/text_extraction/pdf_miner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/text_extraction/pdf_miner.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/text_extraction/text_extractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/text_extraction/text_extractor.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/transforms/union.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/transforms/union.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/aryn_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/aryn_config.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/bbox_sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/bbox_sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/cache.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/deep_eq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/deep_eq.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/deprecate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/deprecate.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/derivation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/derivation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/element_sort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/element_sort.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/extract_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/extract_json.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/fileformat_tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/fileformat_tools.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/html_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/html_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/http.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/http.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/image_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/image_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/import_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/import_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/jupyter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/jupyter.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/lineage_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/lineage_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/llm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/llm_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/markdown.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/markdown.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/memory_debugging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/memory_debugging.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/merge_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/merge_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/model_load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/model_load.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/nested.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/nested.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/pdf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/pdf.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/pdf_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/pdf_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/pickle_pydantic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/pickle_pydantic.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/pyarrow/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/pyarrow/__init__.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/pyarrow/fs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/pyarrow/fs.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/pyarrow/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/pyarrow/types.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/pytorch_dir.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/pytorch_dir.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/ray_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/ray_utils.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/rotation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/rotation.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/similarity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/similarity.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/strings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/strings.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/sycamore_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/sycamore_logger.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/thread_local.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/thread_local.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/threading.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/threading.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/time_trace.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/time_trace.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/xycut.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/xycut.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/utils/zip_traverse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/utils/zip_traverse.py -------------------------------------------------------------------------------- /lib/sycamore/sycamore/writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/lib/sycamore/sycamore/writer.py -------------------------------------------------------------------------------- /notebooks/ArynPartitionerExample.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/ArynPartitionerExample.ipynb -------------------------------------------------------------------------------- /notebooks/ArynPartitionerPython.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/ArynPartitionerPython.ipynb -------------------------------------------------------------------------------- /notebooks/ArynPartitionerWithLangchain.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/ArynPartitionerWithLangchain.ipynb -------------------------------------------------------------------------------- /notebooks/EBGaramond-Bold.ttf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/EBGaramond-Bold.ttf -------------------------------------------------------------------------------- /notebooks/OpenAI-logprob.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/OpenAI-logprob.ipynb -------------------------------------------------------------------------------- /notebooks/VisualizePartitioner.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/VisualizePartitioner.ipynb -------------------------------------------------------------------------------- /notebooks/aryn-opensearch-bedrock-rag-example.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/aryn-opensearch-bedrock-rag-example.ipynb -------------------------------------------------------------------------------- /notebooks/default-prep-script.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/default-prep-script.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/minilm-l6-v2_greedy-section-merger_duckdb.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/minilm-l6-v2_greedy-section-merger_duckdb.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/minilm-l6-v2_greedy-section-merger_opensearch.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/minilm-l6-v2_greedy-section-merger_opensearch.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/minilm-l6-v2_greedy-text-element-merger_duckdb.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/minilm-l6-v2_greedy-text-element-merger_duckdb.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/minilm-l6-v2_marked-merger_duckdb.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/minilm-l6-v2_marked-merger_duckdb.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/text-embedding-3-small_greedy-section-merger_duckdb.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/text-embedding-3-small_greedy-section-merger_duckdb.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/text-embedding-3-small_greedy-section-merger_pinecone.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/text-embedding-3-small_greedy-section-merger_pinecone.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/text-embedding-3-small_greedy-text-element-merger_opensearch.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/text-embedding-3-small_greedy-text-element-merger_opensearch.ipynb -------------------------------------------------------------------------------- /notebooks/docprep/text-embedding-3-small_marked-merger_pinecone.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/docprep/text-embedding-3-small_marked-merger_pinecone.ipynb -------------------------------------------------------------------------------- /notebooks/duckdb-writer.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/duckdb-writer.ipynb -------------------------------------------------------------------------------- /notebooks/earnings_calls_notebooks/workshop_nb_0.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/earnings_calls_notebooks/workshop_nb_0.ipynb -------------------------------------------------------------------------------- /notebooks/earnings_calls_notebooks/workshop_nb_1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/earnings_calls_notebooks/workshop_nb_1.ipynb -------------------------------------------------------------------------------- /notebooks/earnings_calls_notebooks/workshop_nb_2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/earnings_calls_notebooks/workshop_nb_2.ipynb -------------------------------------------------------------------------------- /notebooks/earnings_calls_notebooks/workshop_nb_3.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/earnings_calls_notebooks/workshop_nb_3.ipynb -------------------------------------------------------------------------------- /notebooks/earnings_calls_notebooks/workshop_nb_4.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/earnings_calls_notebooks/workshop_nb_4.ipynb -------------------------------------------------------------------------------- /notebooks/elasticsearch-writer.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/elasticsearch-writer.ipynb -------------------------------------------------------------------------------- /notebooks/financial-docs-10k-example.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/financial-docs-10k-example.ipynb -------------------------------------------------------------------------------- /notebooks/jupyter_dev_example.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/jupyter_dev_example.ipynb -------------------------------------------------------------------------------- /notebooks/metadata-extraction.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/metadata-extraction.ipynb -------------------------------------------------------------------------------- /notebooks/ndd_example.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/ndd_example.ipynb -------------------------------------------------------------------------------- /notebooks/ntsb-demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/ntsb-demo.ipynb -------------------------------------------------------------------------------- /notebooks/opensearch-writer.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/opensearch-writer.ipynb -------------------------------------------------------------------------------- /notebooks/opensearch_docs_etl.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/opensearch_docs_etl.ipynb -------------------------------------------------------------------------------- /notebooks/pinecone-writer.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/pinecone-writer.ipynb -------------------------------------------------------------------------------- /notebooks/query-demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/query-demo.ipynb -------------------------------------------------------------------------------- /notebooks/run-notebook-tests.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/run-notebook-tests.sh -------------------------------------------------------------------------------- /notebooks/subtask-sample.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/subtask-sample.ipynb -------------------------------------------------------------------------------- /notebooks/sycamore-tutorial-intermediate-etl.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/sycamore-tutorial-intermediate-etl.ipynb -------------------------------------------------------------------------------- /notebooks/sycamore_demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/sycamore_demo.ipynb -------------------------------------------------------------------------------- /notebooks/tutorial.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/tutorial.ipynb -------------------------------------------------------------------------------- /notebooks/unpickle_query.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/unpickle_query.ipynb -------------------------------------------------------------------------------- /notebooks/weaviate-writer.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/notebooks/weaviate-writer.ipynb -------------------------------------------------------------------------------- /poetry.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/poetry.lock -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/aryn-ai/sycamore/HEAD/pyproject.toml --------------------------------------------------------------------------------