├── .gitattributes
├── .github
    └── workflows
    │   ├── build_docs.yml
    │   ├── doc-tests.yml
    │   └── pypi-auto-deploy.yml
├── .gitignore
├── LICENSE
├── MANIFEST.in
├── README.md
├── Rlibs.R
├── besca
    ├── Import
    │   ├── __init__.py
    │   ├── _labelings.py
    │   └── _read.py
    ├── README.md
    ├── Rlibs.R
    ├── __init__.py
    ├── _helper.py
    ├── _logging.py
    ├── _notebook.py
    ├── _version.py
    ├── datasets
    │   ├── __init__.py
    │   ├── _datasets.py
    │   ├── _helper.py
    │   ├── _mito.py
    │   ├── data
    │   │   └── __init__.py
    │   ├── genesets
    │   │   ├── CellNames_scseqCMs6_Extrasigs.gmt
    │   │   ├── CellNames_scseqCMs6_Extrasigs.mouse.gmt
    │   │   ├── CellNames_scseqCMs6_config.mouse.png
    │   │   ├── CellNames_scseqCMs6_config.mouse.tsv
    │   │   ├── CellNames_scseqCMs6_config.png
    │   │   ├── CellNames_scseqCMs6_config.tsv
    │   │   ├── CellNames_scseqCMs6_sigs.gmt
    │   │   ├── CellNames_scseqCMs6_sigs.mouse.gmt
    │   │   ├── CryptScoreParikh2019.gmt
    │   │   ├── HumanCD45p_scseqCMs6.gmt
    │   │   ├── Immune.gmt
    │   │   └── __init__.py
    │   ├── homologs
    │   │   ├── MGItoHGNC.tsv
    │   │   └── __init__.py
    │   ├── mito_files
    │   │   ├── __init__.py
    │   │   ├── cyno.mito.tsv
    │   │   ├── cynomolgus.mito.tsv
    │   │   ├── human.mito.tsv
    │   │   ├── human.ribosomal.tsv
    │   │   ├── mouse.mito.ensembl.list
    │   │   ├── mouse.mito.tsv
    │   │   ├── pig.mito.tsv
    │   │   ├── rat.mito.tsv
    │   │   └── test.mito.tsv
    │   └── nomenclature
    │   │   ├── CellTypes_v1.tsv
    │   │   └── __init__.py
    ├── examples
    │   ├── example_function.py
    │   ├── example_gallery.py
    │   ├── example_include_plot_in_documentation.py
    │   └── gallery_examples
    │   │   ├── README.txt
    │   │   ├── plotting
    │   │       ├── README.txt
    │   │       ├── plot_celltype_quantification.py
    │   │       ├── plot_filtering.py
    │   │       ├── plot_qc.py
    │   │       ├── plot_riverplot.py
    │   │       └── plot_split_gene_expression.py
    │   │   ├── preprocessing
    │   │       ├── README.txt
    │   │       ├── plot_example_filtering.py
    │   │       └── plot_pca_neighbors_clustering.py
    │   │   ├── tools
    │   │       ├── README.txt
    │   │       └── plot_reclustering_function.py
    │   │   └── workflows
    │   │       ├── README.txt
    │   │       └── plot_celltype_annotation.py
    ├── export
    │   ├── __init__.py
    │   └── _export.py
    ├── pl
    │   ├── __init__.py
    │   ├── _celltype_quantification.py
    │   ├── _crispr_plots.py
    │   ├── _dot_heatmap.py
    │   ├── _filter_threshold_plots.py
    │   ├── _general.py
    │   ├── _nomenclature_network.py
    │   ├── _qc_plots.py
    │   ├── _riverplot.py
    │   ├── _split_gene_expression.py
    │   └── _update_palette.py
    ├── pp
    │   ├── __init__.py
    │   ├── _crispr_pp.py
    │   ├── _filtering.py
    │   ├── _fraction_counts.py
    │   ├── _fraction_pos.py
    │   ├── _normalization.py
    │   └── _wrapper_Rfuncs.py
    ├── st
    │   ├── _FAIR_export.py
    │   ├── __init__.py
    │   ├── _qc_report.py
    │   ├── _setup_funcs.py
    │   ├── _wrapper_Rfuncs.py
    │   ├── _wrapper_funcs.py
    │   └── style.css
    └── tl
    │   ├── README.md
    │   ├── __init__.py
    │   ├── _annot_compare.py
    │   ├── _annotate_cellnames.py
    │   ├── _count_occurrences.py
    │   ├── auto_annot
    │       ├── __init__.py
    │       └── _auto_annot.py
    │   ├── bcor
    │       ├── __init__.py
    │       └── _mnnpy_batchcorrection.py
    │   ├── crispr
    │       ├── __init__.py
    │       └── _crispr_tools.py
    │   ├── dge
    │       ├── __init__.py
    │       └── _dge.py
    │   ├── rc
    │       ├── __init__.py
    │       └── _reclustering.py
    │   └── sig
    │       ├── __init__.py
    │       ├── _annot.py
    │       ├── _gems_link.py
    │       ├── _helper.py
    │       ├── _io_sig.py
    │       ├── _metrics.py
    │       ├── _sig.py
    │       └── _silhouette.py
├── devtools
    ├── README.md
    ├── install_besca_editable.bash
    ├── requirements.txt
    └── run_workbooks.bash
├── docs
    ├── Makefile
    └── source
    │   ├── _images
    │       ├── Thumbs.db
    │       └── besca_outline.jpg
    │   ├── _static
    │       └── css
    │       │   └── custom.css
    │   ├── adding_new_functions.rst
    │   ├── auto_examples
    │       ├── index.rst
    │       ├── plotting
    │       │   ├── images
    │       │   │   ├── sphx_glr_filtering_plots_001.png
    │       │   │   ├── sphx_glr_plot_celltype_quantification_001.png
    │       │   │   ├── sphx_glr_plot_celltype_quantification_002.png
    │       │   │   ├── sphx_glr_plot_celltype_quantification_003.png
    │       │   │   ├── sphx_glr_plot_celltype_quantification_004.png
    │       │   │   ├── sphx_glr_plot_filtering_001.png
    │       │   │   ├── sphx_glr_plot_qc_001.png
    │       │   │   ├── sphx_glr_plot_qc_002.png
    │       │   │   ├── sphx_glr_plot_qc_003.png
    │       │   │   ├── sphx_glr_plot_qc_004.png
    │       │   │   ├── sphx_glr_plot_qc_005.png
    │       │   │   ├── sphx_glr_plot_split_gene_expression_001.png
    │       │   │   ├── sphx_glr_plot_split_gene_expression_002.png
    │       │   │   ├── sphx_glr_plot_split_gene_expression_003.png
    │       │   │   └── thumb
    │       │   │   │   ├── sphx_glr_filtering_plots_thumb.png
    │       │   │   │   ├── sphx_glr_plot_celltype_quantification_thumb.png
    │       │   │   │   ├── sphx_glr_plot_filtering_thumb.png
    │       │   │   │   ├── sphx_glr_plot_qc_thumb.png
    │       │   │   │   └── sphx_glr_plot_split_gene_expression_thumb.png
    │       │   ├── plot_celltype_quantification.ipynb
    │       │   ├── plot_celltype_quantification.py
    │       │   ├── plot_celltype_quantification.py.md5
    │       │   ├── plot_celltype_quantification.rst
    │       │   ├── plot_filtering.ipynb
    │       │   ├── plot_filtering.py
    │       │   ├── plot_filtering.py.md5
    │       │   ├── plot_filtering.rst
    │       │   ├── plot_qc.ipynb
    │       │   ├── plot_qc.py
    │       │   ├── plot_qc.py.md5
    │       │   ├── plot_qc.rst
    │       │   ├── plot_riverplot.ipynb
    │       │   ├── plot_riverplot.py
    │       │   ├── plot_riverplot.py.md5
    │       │   ├── plot_riverplot.rst
    │       │   ├── plot_split_gene_expression.ipynb
    │       │   ├── plot_split_gene_expression.py
    │       │   ├── plot_split_gene_expression.py.md5
    │       │   ├── plot_split_gene_expression.rst
    │       │   └── sg_execution_times.rst
    │       ├── preprocessing
    │       │   ├── images
    │       │   │   ├── sphx_glr_plot_example_filtering_001.png
    │       │   │   ├── sphx_glr_plot_example_filtering_002.png
    │       │   │   ├── sphx_glr_plot_example_filtering_003.png
    │       │   │   ├── sphx_glr_plot_pca_neighbors_clustering_001.png
    │       │   │   ├── sphx_glr_plot_pca_neighbors_clustering_002.png
    │       │   │   ├── sphx_glr_plot_pca_neighbors_clustering_003.png
    │       │   │   ├── sphx_glr_plot_pca_neighbors_clustering_004.png
    │       │   │   ├── sphx_glr_plot_pca_neighbors_clustering_005.png
    │       │   │   └── thumb
    │       │   │   │   ├── sphx_glr_filtering_thumb.png
    │       │   │   │   ├── sphx_glr_plot_example_filtering_thumb.png
    │       │   │   │   └── sphx_glr_plot_pca_neighbors_clustering_thumb.png
    │       │   ├── plot_example_filtering.ipynb
    │       │   ├── plot_example_filtering.py
    │       │   ├── plot_example_filtering.py.md5
    │       │   ├── plot_example_filtering.rst
    │       │   ├── plot_pca_neighbors_clustering.ipynb
    │       │   ├── plot_pca_neighbors_clustering.py
    │       │   ├── plot_pca_neighbors_clustering.py.md5
    │       │   ├── plot_pca_neighbors_clustering.rst
    │       │   └── sg_execution_times.rst
    │       ├── tools
    │       │   ├── images
    │       │   │   ├── sphx_glr_plot_reclustering_function_001.png
    │       │   │   └── thumb
    │       │   │   │   ├── sphx_glr_plot_reclustering_function_thumb.png
    │       │   │   │   ├── sphx_glr_plot_simple_example_thumb.png
    │       │   │   │   └── sphx_glr_simple_example_thumb.png
    │       │   ├── plot_reclustering_function.ipynb
    │       │   ├── plot_reclustering_function.py
    │       │   ├── plot_reclustering_function.py.md5
    │       │   ├── plot_reclustering_function.rst
    │       │   ├── sg_execution_times.rst
    │       │   └── tt_plot_reclustering_function.py
    │       └── workflows
    │       │   ├── images
    │       │       ├── sphx_glr_plot_celltype_annotation_001.png
    │       │       ├── sphx_glr_plot_celltype_annotation_002.png
    │       │       ├── sphx_glr_plot_celltype_annotation_003.png
    │       │       ├── sphx_glr_plot_celltype_annotation_004.png
    │       │       ├── sphx_glr_plot_celltype_annotation_005.png
    │       │       ├── sphx_glr_plot_celltype_annotation_006.png
    │       │       ├── sphx_glr_plot_celltype_annotation_007.png
    │       │       ├── sphx_glr_plot_celltype_annotation_008.png
    │       │       ├── sphx_glr_plot_celltype_annotation_009.png
    │       │       ├── sphx_glr_plot_celltype_annotation_010.png
    │       │       └── thumb
    │       │       │   ├── sphx_glr_annotate_celltypes_thumb.png
    │       │       │   ├── sphx_glr_plot_celltype_annotation_thumb.png
    │       │       │   └── sphx_glr_plot_celltype_quantification_thumb.png
    │       │   ├── plot_celltype_annotation.ipynb
    │       │   ├── plot_celltype_annotation.py
    │       │   ├── plot_celltype_annotation.py.md5
    │       │   ├── plot_celltype_annotation.rst
    │       │   ├── plot_celltype_quantification.ipynb
    │       │   ├── plot_celltype_quantification.py
    │       │   ├── plot_celltype_quantification.py.md5
    │       │   ├── plot_celltype_quantification.rst
    │       │   └── sg_execution_times.rst
    │   ├── bc.rst
    │   ├── bcor
    │       ├── besca.tl.bcor.batch_correct.rst
    │       └── besca.tl.bcor.postprocess_mnnpy.rst
    │   ├── besca.rst
    │   ├── besca
    │       ├── besca.Import.add_cell_labeling.rst
    │       ├── besca.Import.assert_adata.rst
    │       ├── besca.Import.read_mtx.rst
    │       ├── besca.export.X_to_mtx.rst
    │       ├── besca.export.analysis_metadata.rst
    │       ├── besca.export.clustering.rst
    │       ├── besca.export.generate_gep.rst
    │       ├── besca.export.labeling.rst
    │       ├── besca.export.labeling_info.rst
    │       ├── besca.export.pseudobulk.rst
    │       ├── besca.export.ranked_genes.rst
    │       ├── besca.export.raw_to_mtx.rst
    │       ├── besca.pl.box_per_ind.rst
    │       ├── besca.pl.celllabel_quant_boxplot.rst
    │       ├── besca.pl.celllabel_quant_stackedbar.rst
    │       ├── besca.pl.detected_genes.rst
    │       ├── besca.pl.dot_heatmap.rst
    │       ├── besca.pl.dot_heatmap_split.rst
    │       ├── besca.pl.dot_heatmap_split_greyscale.rst
    │       ├── besca.pl.dropouts.rst
    │       ├── besca.pl.gene_expr_split.rst
    │       ├── besca.pl.gene_expr_split_stacked.rst
    │       ├── besca.pl.kp_cells.rst
    │       ├── besca.pl.kp_counts.rst
    │       ├── besca.pl.kp_genes.rst
    │       ├── besca.pl.library_size.rst
    │       ├── besca.pl.librarysize_overview.rst
    │       ├── besca.pl.max_counts.rst
    │       ├── besca.pl.max_genes.rst
    │       ├── besca.pl.max_mito.rst
    │       ├── besca.pl.nomenclature_network.rst
    │       ├── besca.pl.riverplot_2categories.rst
    │       ├── besca.pl.stacked_split_violin.rst
    │       ├── besca.pl.top_genes_counts.rst
    │       ├── besca.pl.transcript_capture_efficiency.rst
    │       ├── besca.pl.update_qualitative_palette.rst
    │       ├── besca.pp.filter.rst
    │       ├── besca.pp.filter_gene_list.rst
    │       ├── besca.pp.frac_pos.rst
    │       ├── besca.pp.frac_reads.rst
    │       ├── besca.pp.fraction_counts.rst
    │       ├── besca.pp.mean_expr.rst
    │       ├── besca.pp.normalize_geometric.rst
    │       ├── besca.pp.top_counts_genes.rst
    │       ├── besca.pp.top_expressed_genes.rst
    │       ├── besca.st.additional_labeling.rst
    │       ├── besca.st.celltype_labeling.rst
    │       ├── besca.st.export_celltype.rst
    │       ├── besca.st.export_clustering.rst
    │       ├── besca.st.export_cp10k.rst
    │       ├── besca.st.export_metadata.rst
    │       ├── besca.st.export_rank.rst
    │       ├── besca.st.export_regressedOut.rst
    │       ├── besca.st.filtering_cells_genes_min.rst
    │       ├── besca.st.filtering_mito_genes_max.rst
    │       ├── besca.st.read_matrix.rst
    │       ├── besca.tl.annotate_cells_clustering.rst
    │       ├── besca.tl.bcor.batch_correct.rst
    │       ├── besca.tl.bcor.postprocess_mnnpy.rst
    │       ├── besca.tl.count_occurrence.rst
    │       ├── besca.tl.count_occurrence_subset.rst
    │       ├── besca.tl.count_occurrence_subset_conditions.rst
    │       ├── besca.tl.dge.get_de.rst
    │       ├── besca.tl.dge.perform_dge.rst
    │       ├── besca.tl.dge.plot_interactive_volcano.rst
    │       ├── besca.tl.rc.annotate_new_cellnames.rst
    │       └── besca.tl.rc.recluster.rst
    │   ├── besca_standard_pipeline.rst
    │   ├── conf.py
    │   ├── dge
    │       ├── besca.tl.dge.get_de.rst
    │       ├── besca.tl.dge.perform_dge.rst
    │       └── besca.tl.dge.plot_interactive_volcano.rst
    │   ├── export
    │       ├── besca.export.X_to_mtx.rst
    │       ├── besca.export.analysis_metadata.rst
    │       ├── besca.export.clustering.rst
    │       ├── besca.export.generate_gep.rst
    │       ├── besca.export.labeling.rst
    │       ├── besca.export.labeling_info.rst
    │       ├── besca.export.pseudobulk.rst
    │       ├── besca.export.ranked_genes.rst
    │       └── besca.export.raw_to_mtx.rst
    │   ├── helper_functions
    │       ├── besca.concate_adata.rst
    │       ├── besca.convert_ensembl_to_symbol.rst
    │       ├── besca.convert_symbol_to_ensembl.rst
    │       ├── besca.get_ameans.rst
    │       ├── besca.get_means.rst
    │       ├── besca.get_raw.rst
    │       └── besca.subset_adata.rst
    │   ├── import
    │       ├── besca.Import.add_cell_labeling.rst
    │       ├── besca.Import.assert_adata.rst
    │       └── besca.Import.read_mtx.rst
    │   ├── index.rst
    │   ├── plotting
    │       ├── besca.pl.box_per_ind.rst
    │       ├── besca.pl.celllabel_quant_boxplot.rst
    │       ├── besca.pl.celllabel_quant_stackedbar.rst
    │       ├── besca.pl.detected_genes.rst
    │       ├── besca.pl.dot_heatmap.rst
    │       ├── besca.pl.dot_heatmap_split.rst
    │       ├── besca.pl.dot_heatmap_split_greyscale.rst
    │       ├── besca.pl.dropouts.rst
    │       ├── besca.pl.gene_expr_split.rst
    │       ├── besca.pl.gene_expr_split_stacked.rst
    │       ├── besca.pl.kp_cells.rst
    │       ├── besca.pl.kp_counts.rst
    │       ├── besca.pl.kp_genes.rst
    │       ├── besca.pl.library_size.rst
    │       ├── besca.pl.librarysize_overview.rst
    │       ├── besca.pl.max_counts.rst
    │       ├── besca.pl.max_genes.rst
    │       ├── besca.pl.max_mito.rst
    │       ├── besca.pl.nomenclature_network.rst
    │       ├── besca.pl.riverplot_2categories.rst
    │       ├── besca.pl.stacked_split_violin.rst
    │       ├── besca.pl.top_genes_counts.rst
    │       ├── besca.pl.transcript_capture_efficiency.rst
    │       └── besca.pl.update_qualitative_palette.rst
    │   ├── preprocessing
    │       ├── besca.pp.filter.rst
    │       ├── besca.pp.filter_gene_list.rst
    │       ├── besca.pp.frac_pos.rst
    │       ├── besca.pp.frac_reads.rst
    │       ├── besca.pp.fraction_counts.rst
    │       ├── besca.pp.mean_expr.rst
    │       ├── besca.pp.normalize_geometric.rst
    │       ├── besca.pp.top_counts_genes.rst
    │       └── besca.pp.top_expressed_genes.rst
    │   ├── reclustering
    │       ├── besca.tl.rc.annotate_new_cellnames.rst
    │       └── besca.tl.rc.recluster.rst
    │   ├── scripts
    │       ├── environment_besca.yml
    │       ├── environment_besca_test.yml
    │       ├── example_structure_environment.yml
    │       ├── example_structure_environment_combined.yml
    │       ├── example_structure_environment_pip.yml
    │       ├── gallery_package_structure.txt
    │       ├── python_minimal_package_structure.txt
    │       └── python_package_structure.txt
    │   ├── sig
    │       ├── besca.tl.sig.add_anno.rst
    │       ├── besca.tl.sig.combined_signature_score.rst
    │       ├── besca.tl.sig.compute_signed_score.rst
    │       ├── besca.tl.sig.export_annotconfig.rst
    │       ├── besca.tl.sig.filter_siggenes.rst
    │       ├── besca.tl.sig.get_gems.rst
    │       ├── besca.tl.sig.get_similar_geneset.rst
    │       ├── besca.tl.sig.getset.rst
    │       ├── besca.tl.sig.insert_gems.rst
    │       ├── besca.tl.sig.make_anno.rst
    │       ├── besca.tl.sig.match_cluster.rst
    │       ├── besca.tl.sig.obtain_dblabel.rst
    │       ├── besca.tl.sig.read_GMT_sign.rst
    │       ├── besca.tl.sig.read_annotconfig.rst
    │       └── besca.tl.sig.score_mw.rst
    │   ├── standardworkflow
    │       ├── besca.st.additional_labeling.rst
    │       ├── besca.st.celltype_labeling.rst
    │       ├── besca.st.export_celltype.rst
    │       ├── besca.st.export_clustering.rst
    │       ├── besca.st.export_cp10k.rst
    │       ├── besca.st.export_metadata.rst
    │       ├── besca.st.export_rank.rst
    │       ├── besca.st.export_regressedOut.rst
    │       ├── besca.st.filtering_cells_genes_min.rst
    │       ├── besca.st.filtering_mito_genes_max.rst
    │       └── besca.st.read_matrix.rst
    │   ├── tools
    │       ├── besca.tl.annotate_cells_clustering.rst
    │       ├── besca.tl.count_occurrence.rst
    │       ├── besca.tl.count_occurrence_subset.rst
    │       └── besca.tl.count_occurrence_subset_conditions.rst
    │   ├── tutorials.rst
    │   ├── tutorials
    │       ├── adata_to_eset.ipynb
    │       ├── auto_annot_tutorial.ipynb
    │       ├── bescape_tutorial.ipynb
    │       ├── notebook1_data_processing_pbmc3k.ipynb
    │       ├── notebook2_celltype_annotation_pbmc3k.ipynb
    │       ├── notebook3_batch_correction.ipynb
    │       ├── scRNAseq_tutorial.ipynb
    │       └── scRNAseq_tutorial.umap_comparison_figure.png
    │   └── tutorials_html
    │       ├── adata_to_eset.html
    │       ├── bescape_tutorial.html
    │       └── generate_tutorialHtml.sh
├── environment.lock.yml
├── environment.yml
├── pytest.ini
├── requirements.txt
├── setup.cfg
├── setup.py
├── tests
    ├── __init__.py
    ├── data
    │   └── st
    │   │   └── wrapper_funcs
    │   │       └── labeling_test_CTL_OLD
    │   │           └── labelings
    │   │               └── celltype
    │   │                   ├── WilxRank.gct
    │   │                   ├── WilxRank.logFC.gct
    │   │                   ├── WilxRank.pvalues.gct
    │   │                   ├── average.gct
    │   │                   ├── cell2labels.tsv
    │   │                   ├── celltype_labelinfo.tsv
    │   │                   ├── fract_pos.gct
    │   │                   └── labelinfo.tsv
    └── test_wrapper_funcs.py
├── versioneer.py
└── workbooks
    ├── README.md
    ├── Signature_exports.ipynb
    ├── celltype_annotation_besca.ipynb
    ├── minimal_notebook.ipynb
    └── standard_workflow_besca2.ipynb


/.gitattributes:
--------------------------------------------------------------------------------
1 | # Set the default behavior, in case people don't have core.autocrlf set.
2 | * text eol=lf
3 | # Denote all files that are truly binary and should not be modified.
4 | *.png binary
5 | *.jpg binary
6 | *.h5ad binary
7 | besca/_version.py export-subst
8 | 


--------------------------------------------------------------------------------
/.github/workflows/build_docs.yml:
--------------------------------------------------------------------------------
 1 | name: Build Sphinx Documentation
 2 | on:
 3 |   workflow_dispatch:
 4 | 
 5 | jobs:
 6 |   cached-job:
 7 |     name: Cached (${{ matrix.python-version }}, ${{ matrix.os }})
 8 |     runs-on: ${{ matrix.os }}
 9 |     strategy:
10 |       fail-fast: false
11 |       matrix:
12 |         os: ["ubuntu-latest"]
13 |         python-version: ["3.8"]
14 |     steps:
15 |       - name: Check out the repo and use mamba
16 |         uses: actions/checkout@v3
17 |       - uses: conda-incubator/setup-miniconda@v2
18 |         with:
19 |             miniforge-variant: Mambaforge
20 |             miniforge-version: latest
21 |             activate-environment: besca_create_docu
22 |             use-mamba: true
23 |       - name: Cache conda packages
24 |         id: cache-conda
25 |         uses: actions/cache@v3
26 |         env:
27 |           cache-name: cache-conda-packages
28 |         with:
29 |           path: ~/
30 |           key: ${{ runner.os }}-build-${{ env.cache-name }}-${{ hashFiles('**/docs/environment.lock.yml') }}
31 |           restore-keys: |
32 |             ${{ runner.os }}-build-${{ env.cache-name }}-${{ hashFiles('**/docs/environment.lock.yml') }}
33 |          
34 |       - name: Get Date
35 |         id: get-date
36 |         run: echo "::set-output name=today::$(/bin/date -u '+%Y%m%d')"
37 |         shell: bash
38 | 
39 |       - name: Cache conda env
40 |         uses: actions/cache@v3
41 |         with:
42 |           path: ${{ env.CONDA }}/envs
43 |           key: conda-${{ runner.os }}--${{ runner.arch }}--${{ steps.get-date.outputs.today }}-${{ hashFiles('**/docs/environment.lock.yml') }}-${{ env.CACHE_NUMBER }}
44 |         env:
45 |           # Increase this value to reset cache if etc/example-environment.yml has not changed
46 |           CACHE_NUMBER: 0
47 |         id: cache
48 | 
49 |       - name: Update environment
50 |         run: |
51 |           pwd
52 |           ls
53 |           cd docs
54 |           head environment.lock.yml
55 |           mamba env update -n besca_create_docu -f docs/environment.lock.yml
56 |         if: steps.cache.outputs.cache-hit != 'true'
57 | 
58 |       - name: Run Sphinx
59 |         run: |
60 |           mamba init
61 |           source ~/.bashrc
62 |           mamba activate besca_create_docu
63 |           cd docs
64 |           make html
65 | 


--------------------------------------------------------------------------------
/.github/workflows/doc-tests.yml:
--------------------------------------------------------------------------------
 1 | name: Run doctests
 2 | 
 3 | on: [release]
 4 | 
 5 | jobs:
 6 |   doc-test-job:
 7 |     name: Doctests
 8 |     runs-on: ubuntu-latest
 9 |     steps:
10 |       - name: Check out the repo
11 |         uses: actions/checkout@v3
12 |       - uses: conda-incubator/setup-miniconda@v2
13 |         with:
14 |           miniconda-version: "latest"
15 |       - name: Bash
16 |         shell: bash -l {0}
17 |         run: |
18 |           conda install -c conda-forge mamba
19 |           mamba init
20 |           source ~/.bashrc
21 |           mamba env create -f environment.yml
22 |           mamba activate besca_dev
23 |           pip install pytest
24 |           cd besca
25 |           export PYTHONDONTWRITEBYTECODE=1
26 |           pytest --doctest-modules -W ignore::PendingDeprecationWarning --durations=0
27 |           cd ..
28 |           pytest
29 | 


--------------------------------------------------------------------------------
/.github/workflows/pypi-auto-deploy.yml:
--------------------------------------------------------------------------------
  1 | name: Publish Python 🐍 distribution 📦 to PyPI and TestPyPI
  2 | 
  3 | on: push
  4 | 
  5 | jobs:
  6 |   build:
  7 |     name: Build distribution 📦
  8 |     runs-on: ubuntu-latest
  9 | 
 10 |     steps:
 11 |     - uses: actions/checkout@v4
 12 |     - name: Set up Python
 13 |       uses: actions/setup-python@v5
 14 |       with:
 15 |         python-version: "3.8"
 16 |     - name: Install pypa/build
 17 |       run: >-
 18 |         python3 -m
 19 |         pip install
 20 |         setuptools wheel
 21 |         --user
 22 |     - name: Build a binary wheel and a source tarball
 23 |       run: python3 setup.py sdist bdist_wheel
 24 |     - name: Store the distribution packages
 25 |       uses: actions/upload-artifact@v4
 26 |       with:
 27 |         name: python-package-distributions
 28 |         path: dist/
 29 | 
 30 |   publish-to-pypi:
 31 |     name: >-
 32 |       Publish Python 🐍 distribution 📦 to PyPI
 33 |     if: startsWith(github.ref, 'refs/tags/')  # only publish to PyPI on tag pushes
 34 |     needs:
 35 |     - build
 36 |     runs-on: ubuntu-latest
 37 |     environment:
 38 |       name: publishing
 39 |       url: https://pypi.org/p/besca
 40 |     permissions:
 41 |       id-token: write  # IMPORTANT: mandatory for trusted publishing
 42 | 
 43 |     steps:
 44 |     - name: Download all the dists
 45 |       uses: actions/download-artifact@v4
 46 |       with:
 47 |         name: python-package-distributions
 48 |         path: dist/
 49 |     - name: Publish distribution 📦 to PyPI
 50 |       uses: pypa/gh-action-pypi-publish@release/v1
 51 | 
 52 |   github-release:
 53 |     name: >-
 54 |       Sign the Python 🐍 distribution 📦 with Sigstore
 55 |       and upload them to GitHub Release
 56 |     needs:
 57 |     - publish-to-pypi
 58 |     runs-on: ubuntu-latest
 59 | 
 60 |     permissions:
 61 |       contents: write  # IMPORTANT: mandatory for making GitHub Releases
 62 |       id-token: write  # IMPORTANT: mandatory for sigstore
 63 | 
 64 |     steps:
 65 |     - name: Download all the dists
 66 |       uses: actions/download-artifact@v4
 67 |       with:
 68 |         name: python-package-distributions
 69 |         path: dist/
 70 |     - name: Sign the dists with Sigstore
 71 |       uses: sigstore/gh-action-sigstore-python@v2.1.1
 72 |       with:
 73 |         inputs: >-
 74 |           ./dist/*.tar.gz
 75 |           ./dist/*.whl
 76 |     - name: Create GitHub Release
 77 |       env:
 78 |         GITHUB_TOKEN: ${{ github.token }}
 79 |       run: >-
 80 |         gh release create
 81 |         '${{ github.ref_name }}'
 82 |         --repo '${{ github.repository }}'
 83 |         --notes ""
 84 |     - name: Upload artifact signatures to GitHub Release
 85 |       env:
 86 |         GITHUB_TOKEN: ${{ github.token }}
 87 |       # Upload to GitHub Release using the `gh` CLI.
 88 |       # `dist/` contains the built packages, and the
 89 |       # sigstore-produced signatures and certificates.
 90 |       run: >-
 91 |         gh release upload
 92 |         '${{ github.ref_name }}' dist/**
 93 |         --repo '${{ github.repository }}'
 94 | 
 95 |   # publish-to-testpypi:
 96 |   #   name: Publish Python 🐍 distribution 📦 to TestPyPI
 97 |   #   needs:
 98 |   #   - build
 99 |   #   runs-on: ubuntu-latest
100 | 
101 |   #   environment:
102 |   #     name: publishing
103 |   #     url: https://test.pypi.org/p/besca
104 | 
105 |   #   permissions:
106 |   #     id-token: write  # IMPORTANT: mandatory for trusted publishing
107 | 
108 |   #   steps:
109 |   #   - name: Download all the dists
110 |   #     uses: actions/download-artifact@v4
111 |   #     with:
112 |   #       name: python-package-distributions
113 |   #       path: dist/
114 |   #   - name: Publish distribution 📦 to TestPyPI
115 |   #     uses: pypa/gh-action-pypi-publish@release/v1
116 |   #     with:
117 |   #       repository-url: https://test.pypi.org/legacy/
118 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | __pycache__/
 2 | besca.egg-info/
 3 | .ipynb_checkpoints
 4 | cache/
 5 | workbooks/test.ipynb
 6 | workbooks/analyzed
 7 | workbooks/standard_workflow_besca2-requirements.txt
 8 | workbooks/*nbconvert.ipynb
 9 | workbooks/*requirements.txt
10 | figures_testing/
11 | *~
12 | *.swp
13 | 
14 | build
15 | pip
16 | *.pyc
17 | 
18 | README.private.md
19 | *_venv
20 | *.h5ad
21 | *.html
22 | besca_test
23 | *.gmtx
24 | dist
25 | 
26 | .DS_Store
27 | 
28 | # Unit test / coverage reports
29 | htmlcov/
30 | .tox/
31 | .coverage
32 | .coverage.*
33 | .cache
34 | junit.xml
35 | nosetests.xml
36 | coverage.xml
37 | *,cover
38 | 
39 | # Sphinx documentation
40 | docs/_build/
41 | 
42 | .vscode


--------------------------------------------------------------------------------
/MANIFEST.in:
--------------------------------------------------------------------------------
1 | include versioneer.py
2 | include besca/_version.py
3 | 


--------------------------------------------------------------------------------
/Rlibs.R:
--------------------------------------------------------------------------------
 1 | # Install the R packages listed below into a user-supplied library directory.
 2 | # Usage: Rscript Rlibs.R <library-directory>
 3 | args = commandArgs(trailingOnly=TRUE)
 4 | if (length(args) < 1) stop("Usage: Rscript Rlibs.R <library-directory>")
 5 | libloc <-  args[1]
 6 | reposloc<-"https://cloud.r-project.org/" #consider args[2]
 7 | # Stay quiet if the library already exists and create missing parent directories.
 8 | dir.create(libloc, showWarnings = FALSE, recursive = TRUE)
 9 | 
10 | .libPaths(libloc)
11 | if (!require("devtools")) install.packages("devtools", lib = libloc, repos = reposloc)
12 | if (!require("remotes")) install.packages("remotes", lib = libloc, repos = reposloc)
13 | if (!require("withr")) install.packages("withr", lib = libloc, repos = reposloc)
14 | if (!require("vctrs")) install.packages("vctrs", lib = libloc, repos = reposloc)
15 | # Namespace-qualified: install.packages() above does not attach withr, so a bare
16 | # with_libpaths() would be undefined when withr had to be installed first.
17 | if (!require("patchwork")) withr::with_libpaths(new = libloc, devtools::install_github("thomasp85/patchwork"))
18 | if (!require("dsb")) install.packages("dsb", lib = libloc, repos = reposloc) #to verify if same
19 | if (!require("tidyverse")) install.packages("tidyverse", lib = libloc, repos = reposloc)
20 | if (!require("magrittr")) install.packages("magrittr", lib = libloc, repos = reposloc)
21 | if (!require("data.table")) install.packages("data.table", lib = libloc, repos = reposloc)
22 | if (!require("Matrix")) install.packages("Matrix", lib = libloc, repos = reposloc)
23 | if (!require("ggplot2")) install.packages("ggplot2", lib = libloc, repos = reposloc)
24 | if (!require("readr")) install.packages("readr", lib = libloc, repos = reposloc)
25 | if (!require("Seurat")) install.packages("Seurat", lib = libloc, repos = reposloc)
26 | if (!require("intrinsicDimension")) install.packages("intrinsicDimension", lib = libloc, repos = reposloc)
27 | if (!requireNamespace("BiocManager", quietly = TRUE))
28 |     install.packages("BiocManager",lib = libloc, repos = reposloc)
29 | # scater is distributed through Bioconductor, not CRAN, so it is installed via BiocManager.
30 | if (!require("scater")) BiocManager::install("scater", lib = libloc)
31 | if (!require("DropletUtils")) BiocManager::install("DropletUtils", lib = libloc)
32 | if (!require("scry")) BiocManager::install("scry", lib = libloc) #requires R >=4.0.3
33 | 


--------------------------------------------------------------------------------
/besca/Import/__init__.py:
--------------------------------------------------------------------------------
1 | from besca.Import._read import read_mtx, assert_adata
2 | from besca.Import._labelings import add_cell_labeling
3 | 
4 | __all__ = ["read_mtx", "add_cell_labeling", "assert_adata"]
5 | 


--------------------------------------------------------------------------------
/besca/Import/_labelings.py:
--------------------------------------------------------------------------------
 1 | from pandas import read_csv
 2 | from os.path import join as pathjoin
 3 | 
 4 | 
 5 | def add_cell_labeling(adata, filepath, label="celltype"):
 6 |     """add a labeling written out in the FAIR formatting to adata.obs
 7 | 
 8 |     A labeling contained in the FAIR compliant cell2labels.tsv is added to adata.obs. The string supplied
 9 |     in the parameter label is used to name the column in adata.obs that contains the imported labeling.
10 | 
11 |     All cells that are not labeled in the cell2labels.tsv will be annotated with 'not labeled'.
12 | 
13 |     parameters
14 |     ----------
15 |     adata: `AnnData`
16 |         the AnnData object whose obs should be updated
17 |     filepath: `str`
18 |         filepath to the cell2labels.tsv that is to be appended to adata.obs
19 |     label: `str` | default = 'celltype'
20 |         string indicating the label that is to be added to the annotation that is being imported
21 | 
22 |     returns
23 |     -------
24 |     None
25 |         updates the supplied AnnData object
26 | 
27 |     """
28 | 
29 |     labeling = read_csv(pathjoin(filepath, "cell2labels.tsv"), sep="\t", index_col=0)
30 |     labeling.rename(columns={"LABEL": label}, inplace=True)
31 | 
32 |     adata.obs[label] = "not labeled"
33 |     adata.obs.update(labeling)
34 | 
35 |     return None
36 | 


--------------------------------------------------------------------------------
/besca/README.md:
--------------------------------------------------------------------------------
 1 | # Overview of Abbreviations
 2 | 
 3 | pp = preprocessing   
 4 | tl = tools  
 5 | pl = plotting  
 6 | st = standardpipeline  
 7 | Import = importing functions (note that the module is not named `import`
 8 | because `import` is a reserved keyword in Python)  
 9 | export = exporting functions
10 | 


--------------------------------------------------------------------------------
/besca/Rlibs.R:
--------------------------------------------------------------------------------
 1 | # Install the R packages required by besca into a dedicated library directory.
 2 | # Usage: Rscript Rlibs.R <library_directory>
 3 | args <- commandArgs(trailingOnly = TRUE)
 4 | if (length(args) < 1) stop("usage: Rscript Rlibs.R <library_directory>")
 5 | libloc <- args[1]
 6 | 
 7 | # the directory may already exist from an earlier run; do not warn about that
 8 | dir.create(libloc, showWarnings = FALSE, recursive = TRUE)
 9 | 
10 | .libPaths(libloc)
11 | 
12 | # non-interactive sessions may have no CRAN mirror configured ("@CRAN@"), which
13 | # makes install.packages() fail; fall back to the CRAN cloud mirror in that case
14 | reposloc <- getOption("repos")
15 | if (is.null(reposloc) || identical(unname(reposloc["CRAN"]), "@CRAN@")) {
16 |     reposloc["CRAN"] <- "https://cloud.r-project.org"
17 | }
18 | 
19 | if (!require("devtools")) install.packages("devtools", lib = libloc, repos = reposloc)
20 | if (!require("withr")) install.packages("withr", lib = libloc, repos = reposloc)
21 | if (!require("vctrs")) install.packages("vctrs", lib = libloc, repos = reposloc)
22 | if (!require("patchwork")) install.packages("patchwork", lib = libloc, repos = reposloc)
23 | # withr/devtools are called through their namespace: a package that was only just
24 | # installed above is not attached, so the bare function names would not be found
25 | if (!require("dsb")) withr::with_libpaths(new = libloc, devtools::install_github("MattPM/dsb"))
26 | if (!require("tidyverse")) install.packages("tidyverse", lib = libloc, repos = reposloc)
27 | if (!require("magrittr")) install.packages("magrittr", lib = libloc, repos = reposloc)
28 | if (!require("data.table")) install.packages("data.table", lib = libloc, repos = reposloc)
29 | if (!require("Matrix")) install.packages("Matrix", lib = libloc, repos = reposloc)
30 | if (!require("DropletUtils")) withr::with_libpaths(new = libloc, devtools::install_github("MarioniLab/DropletUtils"))
31 | if (!require("BiocManager")) install.packages("BiocManager", lib = libloc, repos = reposloc)
32 | if (!require("scater")) BiocManager::install("scater", lib = libloc)
33 | 
34 | 


--------------------------------------------------------------------------------
/besca/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca import pl
 2 | from besca import tl
 3 | from besca import pp
 4 | from besca import st
 5 | from besca import datasets
 6 | from besca import export
 7 | from besca import Import
 8 | 
 9 | 
10 | from besca._helper import (
11 |     subset_adata,
12 |     convert_ensembl_to_symbol,
13 |     convert_symbol_to_ensembl,
14 |     get_raw,
15 |     get_ameans,
16 |     get_means,
17 |     concate_adata,
18 |     get_singlegenedf,
19 |     print_software_versions
20 | )
21 | 
22 | from besca._notebook import (
23 |     save_notebook,
24 |     save_notebook_return_path,
25 |     convert_notebook_to_HTML
26 | )
27 | 
28 | __all__ = [
29 |     "pl",
30 |     "tl",
31 |     "pp",
32 |     "st",
33 |     "datasets",
34 |     "export",
35 |     "subset_adata",
36 |     "import",
37 |     "convert_ensembl_to_symbol",
38 |     "convert_symbol_to_ensembl",
39 |     "get_raw",
40 |     "get_ameans",
41 |     "get_means",
42 |     "concate_adata",
43 |     "get_singlegenedf",
44 |     "print_software_versions",
45 |     "convert_notebook_to_HTML"
46 | ]
47 | 
48 | from besca._version import get_versions
49 | 
50 | __version__ = get_versions()["version"]
51 | del get_versions
52 | 
53 | from . import _version
54 | __version__ = _version.get_versions()['version']
55 | 


--------------------------------------------------------------------------------
/besca/_logging.py:
--------------------------------------------------------------------------------
 1 | import logging
 2 | import os
 3 | import datetime
 4 | 
 5 | 
 6 | def initialize_logger(log_file):
 7 |     logger = logging.getLogger()
 8 |     logger.setLevel(logging.INFO)
 9 | 
10 |     # create standard log file handler and set level to info
11 |     handler = logging.FileHandler(log_file, "a", encoding=None, delay="true")
12 |     handler.setLevel(logging.INFO)
13 |     formatter = logging.Formatter("%(message)s")
14 |     handler.setFormatter(formatter)
15 |     logger.addHandler(handler)
16 | 
17 |     # create console handler and set level to info
18 |     handler = logging.StreamHandler()
19 |     handler.setLevel(logging.INFO)
20 |     formatter = logging.Formatter("LOG MESSAGE: %(message)s")
21 |     handler.setFormatter(formatter)
22 |     logger.addHandler(handler)
23 | 
24 | 
25 | def initialize_log_file(
26 |     analysis_name,
27 |     root_path,
28 |     species,
29 |     batch_to_correct,
30 |     standard_min_genes,
31 |     standard_min_cells,
32 |     standard_min_counts,
33 |     standard_n_genes,
34 |     standard_percent_mito,
35 |     standard_max_counts,
36 |     version,
37 | ):
38 | 
39 |     logging.info("Standard Pipeline Version " + version + " used")
40 |     logging.info(datetime.datetime.today().strftime("%Y-%m-%d"))
41 |     logging.info(
42 |         "Analysis '" + analysis_name + "' on data located in'" + root_path + "'"
43 |     )
44 |     logging.info("species: " + species)
45 |     logging.info("Batch effect to correct: " + batch_to_correct)
46 |     logging.info("Parameters:")
47 |     logging.info("\tstandard_min_genes = " + str(standard_min_genes))
48 |     logging.info("\tstandard_min_cells = " + str(standard_min_cells))
49 |     logging.info("\tstandard_min_counts = " + str(standard_min_counts))
50 |     logging.info("\tstandard_n_genes = " + str(standard_n_genes))
51 |     logging.info("\tstandard_max_counts = " + str(standard_max_counts))
52 |     logging.info("\tstandard_percent_mito = " + str(standard_percent_mito))
53 | 


--------------------------------------------------------------------------------
/besca/_notebook.py:
--------------------------------------------------------------------------------
 1 | """Helper functions for working with notebooks"""
 2 | 
 3 | from IPython.display import display, Javascript
 4 | from glob import glob
 5 | import os
 6 | import subprocess
 7 | import logging
 8 | 
 9 | def save_notebook():
10 |     """Use JavaScript to simulate saving notebook, which makes sure
11 |        that the current notebook is the last one in the current directory
12 |        that is modified"""
13 | 
14 |     display(Javascript(
15 |         "document.body.dispatchEvent("
16 |         "new KeyboardEvent('keydown', {key:'s', keyCode: 83, ctrlKey: true}"
17 |         "))"
18 |     ))
19 | 
20 | 
21 | def save_notebook_return_path():
22 |     """Save the current notebook and return its full path"""
23 | 
24 |     save_notebook()
25 |     ipynbs = glob("*.ipynb")
26 |     curr_dir = os.getcwd()
27 |     max_file = None
28 |     max_mtime = 0
29 |     for fname in ipynbs:
30 |         full_path = os.path.join(curr_dir, fname)
31 |         mtime = os.stat(full_path).st_mtime
32 |         if mtime > max_mtime:
33 |             max_mtime = mtime
34 |             max_file = full_path
35 |     return max_file
36 | 
37 | 
38 | def convert_notebook_to_HTML():
39 |     """Convert the current notebook to HTML"""
40 | 
41 |     current = save_notebook_return_path()
42 |     if current is not None:
43 |         res = subprocess.run(['jupyter', 'nbconvert',
44 |                               '--to', 'html', current],
45 |                              shell=False, capture_output=True)
46 |     else:
47 |         res = None
48 |         logging.warning('No notebook is found - no conversion is done')
49 |     
50 |     return(res)
51 | 


--------------------------------------------------------------------------------
/besca/datasets/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.datasets._datasets import (
 2 |     Baron2016_processed,
 3 |     Baron2016_raw,
 4 |     Granja2019_citeSeq,
 5 |     Granja2019_processed,
 6 |     Granja2019_raw,
 7 |     Haber2017_processed,
 8 |     Haber2017_raw,
 9 |     Kotliarov2020_processed,
10 |     Kotliarov2020_raw,
11 |     Kotliarov2020_citeSeq,
12 |     Lee2020_processed,
13 |     Lee2020_raw,
14 |     Martin2019_processed,
15 |     Martin2019_raw,
16 |     Peng2019_processed,
17 |     Peng2019_raw,
18 |     Segerstolpe2016_processed,
19 |     Smillie2019_processed,
20 |     Smillie2019_raw,
21 |     crispr_10x_filtered,
22 |     crispr_10x_unfiltered,
23 |     load_immune_signatures,
24 |     pbmc3k_filtered,
25 |     pbmc3k_processed,
26 |     pbmc3k_raw,
27 | )
28 | from besca.datasets._mito import get_mito_genes
29 | from besca.datasets._helper import (
30 |     simulated_pbmc3k_raw,
31 |     simulated_Kotliarov2020_processed,
32 |     simulated_pbmc3k_processed, 
33 |     simulated_Haber2017_processed,
34 |     simulated_Baron2016_processed
35 | )
36 | 
37 | __all__ = [
38 |     "pbmc3k_raw",
39 |     "pbmc3k_filtered",
40 |     "pbmc3k_processed",
41 |     "Smillie2019_raw",
42 |     "Smillie2019_processed",
43 |     "crispr_10x_filtered",
44 |     "crispr_10x_unfiltered",
45 |     "Martin2019_raw",
46 |     "Martin2019_processed",
47 |     "Haber2017_raw",
48 |     "Haber2017_processed",
49 |     "Granja2019_citeSeq",
50 |     "Granja2019_processed",
51 |     "Granja2019_raw",
52 |     "get_mito_genes",
53 |     "Kotliarov2020_raw",
54 |     "Kotliarov2020_citeSeq",
55 |     "Kotliarov2020_processed",
56 |     "Baron2016_raw",
57 |     "Baron2016_processed",
58 |     "Lee2020_raw",
59 |     "Lee2020_processed",
60 |     "Peng2019_raw",
61 |     "Peng2019_processed",
62 |     "Segerstolpe2016_processed",
63 |     "load_immune_signatures",
64 |     "simulated_pbmc3k_raw",
65 |     "simulated_Kotliarov2020_processed",
66 |     "simulated_pbmc3k_processed",
67 |     "simulated_Haber2017_processed",
68 |     "simulated_Baron2016_processed"
69 | ]
70 | 


--------------------------------------------------------------------------------
/besca/datasets/_mito.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | import pytest
 3 | from pandas import read_csv
 4 | 
 5 | 
 6 | def get_mito_genes(species: str = "human", annotation_type: str = "ENSEMBL"):
 7 |     """Returns the array of genes annotated as mitochondrial in species.
 8 |     Parameters
 9 |     ----------
10 |     species:`str`| default = human ; species of the datasets.
11 |     Accepted: cyno, cynomolgus, human, mouse, rat, pig
12 |     annotation_type:`str`| default = ENSEMBL.  ENSEMBL or SYMBOL accepted
13 | 
14 |     Returns
15 |     -------
16 |     mito_genes : array of str
17 | 
18 |     Example
19 |     -------
20 |     >>> pytest.skip('Test will be skipped, because slow downloading of file in the github action job can occur a timeout')
21 |     >>> import besca as bc
22 |     >>> mito_genes = bc.datasets.get_mito_genes('human')
23 |     >>> mito_genes
24 |     ['ENSG00000198695', 'ENSG00000198712', 'ENSG00000198727', 'ENSG00000198763', 'ENSG00000198786', 'ENSG00000198804', 'ENSG00000198840', 'ENSG00000198886', 'ENSG00000198888', 'ENSG00000198899', 'ENSG00000198938', 'ENSG00000212907', 'ENSG00000228253']
25 | 
26 |     """
27 |     valid = {"cyno", "cynomolgus", "human", "mouse", "rat", "pig"}
28 |     if species not in valid:
29 |         raise ValueError("species must be one of %s." % valid)
30 |     ref_mito_file = os.path.dirname(__file__) + "/mito_files/" + species + ".mito.tsv"
31 |     # ENS_GENE_ID  GENE_SYMBOL (2 cols)
32 |     if annotation_type == "SYMBOL":
33 |         mito_list = list(read_csv(ref_mito_file, header=None, sep="\t")[1])
34 |     elif annotation_type == "ENSEMBL":
35 |         mito_list = list(read_csv(ref_mito_file, header=None, sep="\t")[0])
36 |     else:
37 |         raise ValueError("annotation_type must be either SYMBOL or ENSEMBL")
38 |     return mito_list
39 | 


--------------------------------------------------------------------------------
/besca/datasets/data/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/besca/datasets/data/__init__.py


--------------------------------------------------------------------------------
/besca/datasets/genesets/CellNames_scseqCMs6_config.mouse.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/besca/datasets/genesets/CellNames_scseqCMs6_config.mouse.png


--------------------------------------------------------------------------------
/besca/datasets/genesets/CellNames_scseqCMs6_config.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/besca/datasets/genesets/CellNames_scseqCMs6_config.png


--------------------------------------------------------------------------------
/besca/datasets/genesets/CryptScoreParikh2019.gmt:
--------------------------------------------------------------------------------
1 | CryptScoreParikh2019	Crypt score as defined in [Parikh et al. Nature. 2019]:From stem cells (low score) to undifferentiated cells to differentiated top crypt cells (high score)	SELENOP	CEACAM7	PLAC8	CEACAM1	TSPAN1	CEACAM5	CEACAM6	IFI27	DHRS9	KRT20	RHOC	CD177	PKIB	HPGD	LYPD8
2 | 


--------------------------------------------------------------------------------
/besca/datasets/genesets/Immune.gmt:
--------------------------------------------------------------------------------
 1 | lymphocyte		PTPRC
 2 | myeloid		S100A8	S100A9	CST3
 3 | Bcell		CD19	CD79A	MS4A1
 4 | Tcells		CD3E	CD3G	CD3D
 5 | CD4		CD4
 6 | CD8		CD8A	CD8B
 7 | NKcell		NKG7	GNLY	NCAM1
 8 | monocyte		CST3	CSF1R	ITGAM	CD14	FCGR3A	FCGR3B
 9 | macrophage		CD14	IL1B	LYZ	CD163	ITGAX	CD68	CSF1R	FCGR3A
10 | 


--------------------------------------------------------------------------------
/besca/datasets/genesets/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/besca/datasets/genesets/__init__.py


--------------------------------------------------------------------------------
/besca/datasets/homologs/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/besca/datasets/homologs/__init__.py


--------------------------------------------------------------------------------
/besca/datasets/mito_files/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/besca/datasets/mito_files/__init__.py


--------------------------------------------------------------------------------
/besca/datasets/mito_files/cyno.mito.tsv:
--------------------------------------------------------------------------------
 1 | ENSMFAG00000046415	ND1
 2 | ENSMFAG00000046416	ND2
 3 | ENSMFAG00000046417	COX1
 4 | ENSMFAG00000046418	COX2
 5 | ENSMFAG00000046419	ATP8
 6 | ENSMFAG00000046420	ATP6
 7 | ENSMFAG00000046421	COX3
 8 | ENSMFAG00000046422	ND3
 9 | ENSMFAG00000046423	ND4L
10 | ENSMFAG00000046424	ND4
11 | ENSMFAG00000046425	ND5
12 | ENSMFAG00000046426	ND6
13 | ENSMFAG00000046427	CYTB
14 | 


--------------------------------------------------------------------------------
/besca/datasets/mito_files/cynomolgus.mito.tsv:
--------------------------------------------------------------------------------
 1 | ENSMFAG00000046415	ND1
 2 | ENSMFAG00000046416	ND2
 3 | ENSMFAG00000046417	COX1
 4 | ENSMFAG00000046418	COX2
 5 | ENSMFAG00000046419	ATP8
 6 | ENSMFAG00000046420	ATP6
 7 | ENSMFAG00000046421	COX3
 8 | ENSMFAG00000046422	ND3
 9 | ENSMFAG00000046423	ND4L
10 | ENSMFAG00000046424	ND4
11 | ENSMFAG00000046425	ND5
12 | ENSMFAG00000046426	ND6
13 | ENSMFAG00000046427	CYTB
14 | 


--------------------------------------------------------------------------------
/besca/datasets/mito_files/human.mito.tsv:
--------------------------------------------------------------------------------
 1 | ENSG00000198695	MT-ND6
 2 | ENSG00000198712	MT-CO2
 3 | ENSG00000198727	MT-CYB
 4 | ENSG00000198763	MT-ND2
 5 | ENSG00000198786	MT-ND5
 6 | ENSG00000198804	MT-CO1
 7 | ENSG00000198840	MT-ND3
 8 | ENSG00000198886	MT-ND4
 9 | ENSG00000198888	MT-ND1
10 | ENSG00000198899	MT-ATP6
11 | ENSG00000198938	MT-CO3
12 | ENSG00000212907	MT-ND4L
13 | ENSG00000228253	MT-ATP8
14 | 


--------------------------------------------------------------------------------
/besca/datasets/mito_files/mouse.mito.ensembl.list:
--------------------------------------------------------------------------------
 1 | ENSMUSG00000102011
 2 | ENSMUSG00000100246
 3 | ENSMUSG00000100533
 4 | ENSMUSG00000096178
 5 | ENSMUSG00000100964
 6 | ENSMUSG00000099619
 7 | ENSMUSG00000099399
 8 | ENSMUSG00000095134
 9 | ENSMUSG00000095366
10 | ENSMUSG00000096768
11 | ENSMUSG00000099871
12 | ENSMUSG00000096850
13 | ENSMUSG00000064336
14 | ENSMUSG00000064337
15 | ENSMUSG00000064338
16 | ENSMUSG00000064339
17 | ENSMUSG00000064340
18 | ENSMUSG00000064341
19 | ENSMUSG00000064342
20 | ENSMUSG00000064343
21 | ENSMUSG00000064344
22 | ENSMUSG00000064345
23 | ENSMUSG00000064346
24 | ENSMUSG00000064347
25 | ENSMUSG00000064348
26 | ENSMUSG00000064349
27 | ENSMUSG00000064350
28 | ENSMUSG00000064351
29 | ENSMUSG00000064352
30 | ENSMUSG00000064353
31 | ENSMUSG00000064354
32 | ENSMUSG00000064355
33 | ENSMUSG00000064356
34 | ENSMUSG00000064357
35 | ENSMUSG00000064358
36 | ENSMUSG00000064359
37 | ENSMUSG00000064360
38 | ENSMUSG00000064361
39 | ENSMUSG00000065947
40 | ENSMUSG00000064363
41 | ENSMUSG00000064364
42 | ENSMUSG00000064365
43 | ENSMUSG00000064366
44 | ENSMUSG00000064367
45 | ENSMUSG00000064368
46 | ENSMUSG00000064369
47 | ENSMUSG00000064370
48 | ENSMUSG00000064371
49 | ENSMUSG00000064372
50 | 


--------------------------------------------------------------------------------
/besca/datasets/mito_files/mouse.mito.tsv:
--------------------------------------------------------------------------------
 1 | ENSMUSG00000064341	mt-Nd1
 2 | ENSMUSG00000064345	mt-Nd2
 3 | ENSMUSG00000064351	mt-Co1
 4 | ENSMUSG00000064354	mt-Co2
 5 | ENSMUSG00000064356	mt-Atp8
 6 | ENSMUSG00000064357	mt-Atp6
 7 | ENSMUSG00000064358	mt-Co3
 8 | ENSMUSG00000064360	mt-Nd3
 9 | ENSMUSG00000065947	mt-Nd4l
10 | ENSMUSG00000064363	mt-Nd4
11 | ENSMUSG00000064367	mt-Nd5
12 | ENSMUSG00000064368	mt-Nd6
13 | ENSMUSG00000064370	mt-Cytb
14 | 


--------------------------------------------------------------------------------
/besca/datasets/mito_files/pig.mito.tsv:
--------------------------------------------------------------------------------
 1 | ENSSSCG00000018080	ATP8
 2 | ENSSSCG00000018075	COX1
 3 | ENSSSCG00000018078	COX2
 4 | ENSSSCG00000018082	COX3
 5 | ENSSSCG00000018094	CYTB
 6 | ENSSSCG00000018069	ND2
 7 | ENSSSCG00000018084	ND3
 8 | ENSSSCG00000018086	ND4L
 9 | ENSSSCG00000018091	ND5
10 | ENSSSCG00000018092	ND6
11 | 


--------------------------------------------------------------------------------
/besca/datasets/mito_files/rat.mito.tsv:
--------------------------------------------------------------------------------
 1 | ENSRNOG00000029042	Mt-nd6
 2 | ENSRNOG00000029707	Mt-nd4
 3 | ENSRNOG00000029971	Mt-nd5
 4 | ENSRNOG00000030371	Mt-co2
 5 | ENSRNOG00000030644	Mt-nd1
 6 | ENSRNOG00000030700	Mt-cox3
 7 | ENSRNOG00000031033	Mt-nd2
 8 | ENSRNOG00000031053	Mt-nd4l
 9 | ENSRNOG00000031766	Mt-cyb
10 | ENSRNOG00000031979	Mt-atp6
11 | ENSRNOG00000033299	Mt-atp8
12 | ENSRNOG00000033615	Mt-nd3
13 | ENSRNOG00000034234	Mt-co1
14 | 


--------------------------------------------------------------------------------
/besca/datasets/mito_files/test.mito.tsv:
--------------------------------------------------------------------------------
1 | ENSMUSG00000064341	Gene_1
2 | ENSMUSG00000064345	Gene_2
3 | ENSMUSG00000064351	Gene_3
4 | ENSMUSG00000064354	Gene_4
5 | ENSMUSG00000064356	Gene_5
6 | ENSMUSG00000064357	Gene_6
7 | 


--------------------------------------------------------------------------------
/besca/datasets/nomenclature/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/besca/datasets/nomenclature/__init__.py


--------------------------------------------------------------------------------
/besca/examples/example_function.py:
--------------------------------------------------------------------------------
 1 | def function_name(
 2 |     param1="default_value1", param2="default_value2", param3="default_value3"
 3 | ):
 4 |     """one-line function description that shows up in summaries.
 5 | 
 6 |     more extensive multi line function description explaining exactly what the function
 7 |     does and is intended for. Examples for code execution of the function can also be
 8 |     provided here
 9 | 
10 |     Parameters
11 |     ----------
12 |     param1: `type` | default = default_value1
13 |         brief description of what param1 controls and to what it should be set
14 |     param2: `type` | default = default_value2
15 |         brief description of what param2 controls and to what it should be set
16 |     param3: `type` | default = default_value3
17 |         brief description of what param3 controls and to what it should be set
18 | 
19 |     Returns
20 |     -------
21 |     Type
22 |         Information on what the function returns
23 | 
24 |     Example
25 |     -------
26 | 
27 |     >>> #insert example code here
28 |     >>> 1 + 1
29 |     2
30 |     
31 |     # this code is only displayed not executed
32 | 
33 |     """
34 | 
35 |     # function body
36 |     # do something here
37 | 


--------------------------------------------------------------------------------
/besca/examples/example_gallery.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Title of example
 3 | ================
 4 | 
 5 | Here goes your description of the example
 6 | """
 7 | 
 8 | # start writing some code
 9 | 
10 | ###############################################################################
11 | # sub heading
12 | # -----------
13 | #
14 | # Here you add additional text you want to include
15 | # there is no need to finish this section with any specific syntax
16 | # just leave a line empty after this comment
17 | 
18 | # more code
19 | 
20 | ###############################################################################
21 | # this is an additional text comment without a heading
22 | # this is more of that comment
23 | 
24 | # more code
25 | 


--------------------------------------------------------------------------------
/besca/examples/example_include_plot_in_documentation.py:
--------------------------------------------------------------------------------
 1 | """
 2 | ...
 3 | 
 4 | Example
 5 | -------
 6 | 
 7 | Description of your example.
 8 | 
 9 | >>> # this is code that will be displayed but not executed
10 | >>> # it should be a duplicate of the code used to generate the plot,
11 | >>> # otherwise people will not be able to see how you generated the plot
12 | >>> ## plotting code 1
13 | >>> ## plotting code 2
14 | 
15 | .. plot:: 
16 | 
17 |     >>> # this is the code that is used to generate the plot
18 |     >>> # the displayed code above should be a duplicate of it,
19 |     >>> # otherwise people will not be able to see how you generated the plot
20 |     >>> ## plotting code 1
21 |     >>> ## plotting code 2
22 |     
23 | """
24 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/README.txt:
--------------------------------------------------------------------------------
1 | Code Examples
2 | =============
3 | 
4 | .. toctree::
5 |    :maxdepth: 4


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/plotting/README.txt:
--------------------------------------------------------------------------------
1 | Plotting examples
2 | -----------------
3 | 
4 | This is a gallery containing some plotting examples.
5 | 
6 | 
7 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/plotting/plot_celltype_quantification.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Visualize cell fractions
 3 | ========================
 4 | 
 5 | This example demonstrates how to generate celltype quantification plots. These types of plots 
 6 | can be used to visually represent the number of cells that belong to a certain subset or condition.
 7 | 
 8 | """
 9 | 
10 | import besca as bc
11 | import pytest
12 | pytest.skip('Test is only for here as example and should not be executed')
13 | 
14 | # import dataset to work with
15 | adata = bc.datasets.Peng2019_processed()
16 | 
17 | #####################
18 | # quantify specific cell labels as a stacked barplot
19 | 
20 | bc.pl.celllabel_quant_stackedbar(
21 |     adata, count_variable="Cell_type", subset_variable="Patient"
22 | )
23 | 
24 | 
25 | #####################
26 | # quantify the number of cells belonging to each condition in a specific subset
27 | #
28 | # here each dot represents one Patient, the boxplots are grouped according to tissue type (Normal or Tumoral)
29 | bc.pl.celllabel_quant_boxplot(
30 |     adata,
31 |     count_variable="Cell_type",
32 |     subset_variable="Patient",
33 |     condition_identifier="Type",
34 |     plot_percentage=True,
35 | )
36 | 
37 | #####################
38 | # here you can also choose to plot total counts instead of percentages
39 | bc.pl.celllabel_quant_boxplot(
40 |     adata,
41 |     count_variable="Cell_type",
42 |     subset_variable="Patient",
43 |     condition_identifier="Type",
44 |     plot_percentage=False,
45 | )
46 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/plotting/plot_filtering.py:
--------------------------------------------------------------------------------
 1 | """
 2 | filtering functions
 3 | ===================
 4 | 
 5 | This example shows you how to generate plots to visualize the chosen filter threshold.
 6 | This way you can easily check (visually) if your chosen threshold is a good one.
 7 | 
 8 | """
 9 | 
10 | import besca as bc
11 | import matplotlib.pyplot as plt
12 | import pytest
13 | pytest.skip('Test is only for here as example and should not be executed')
14 | adata = bc.datasets.pbmc3k_raw()
15 | 
16 | # define thresholds
17 | min_genes = 600
18 | min_cells = 2
19 | min_UMI = 600
20 | max_UMI = 6500
21 | max_mito = 0.05
22 | max_genes = 1900
23 | 
24 | # Visualize filtering thresholds
25 | fig, ((ax1, ax2, ax3), (ax4, ax5, ax6)) = plt.subplots(ncols=3, nrows=2)
26 | fig.set_figwidth(15)
27 | fig.set_figheight(8)
28 | fig.tight_layout(pad=4.5)
29 | 
30 | bc.pl.kp_genes(adata, min_genes=min_genes, ax=ax1)
31 | bc.pl.kp_cells(adata, min_cells=min_cells, ax=ax2)
32 | bc.pl.kp_counts(adata, min_counts=min_UMI, ax=ax3)
33 | bc.pl.max_counts(adata, max_counts=max_UMI, ax=ax4)
34 | bc.pl.max_mito(
35 |     adata, max_mito=max_mito, annotation_type="SYMBOL", species="human", ax=ax5
36 | )
37 | bc.pl.max_genes(adata, max_genes=max_genes)
38 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/plotting/plot_qc.py:
--------------------------------------------------------------------------------
 1 | """
 2 | quality control plots
 3 | =====================
 4 | 
 5 | This example shows you the inbuilt quality control plots from besca.
 6 | 
 7 | """
 8 | 
 9 | # import libraries
10 | import besca as bc
11 | import matplotlib.pyplot as plt
12 | import pytest
13 | pytest.skip('Test is only for here as example and should not be executed')
14 | ###############################################################################
15 | #
16 | # Before beginning any analysis it is useful to take a detailed look at your dataset
17 | # to get an understanding of its characteristics.
18 | 
19 | # import data
20 | adata = bc.datasets.pbmc3k_raw()
21 | 
22 | ###############################################################################
23 | # transcript capture efficiency
24 | # -----------------------------
25 | #
26 | # Plotting the transcript capture efficiency will give you an overview of the expression
27 | # of genes within cells relative to the total UMI counts.
28 | 
29 | # transcript capture efficiency
30 | fig, ax = plt.subplots(1)
31 | fig.set_figwidth(8)
32 | fig.set_figheight(5)
33 | fig.tight_layout()
34 | 
35 | bc.pl.transcript_capture_efficiency(adata, ax=ax)
36 | 
37 | ###############################################################################
38 | # overview of library size unprocessed
39 | # ------------------------------------
40 | #
41 | # This gives you an overview of the read distribution per cell. High quality cells
42 | # will have a larger number of reads per cell and this is a parameter you can use to
43 | # filter out low quality cells. The number of reads you would expect per cell is strongly
44 | # dependent on the single-cell sequencing method you used.
45 | 
46 | bc.pl.librarysize_overview(adata)
47 | 
48 | ###############################################################################
49 | # most strongly expressed transcripts
50 | # -----------------------------------
51 | #
52 | # This will let you identify the genes which dominate your experiment
53 | # (generally you would expect mitochondrial and ribosomal genes,
54 | # in this dataset these genes have been removed beforehand).
55 | 
56 | bc.pl.top_genes_counts(adata=adata, top_n=25)
57 | 
58 | ###############################################################################
59 | # visualize the processed dataset
60 | # -------------------------------
61 | #
62 | # After performing your filtering it is generally a good idea to take another look
63 | # at your dataset to ensure that the filtering parameters used were reasonable.
64 | 
65 | adata = bc.datasets.pbmc3k_processed()
66 | 
67 | ###############################################################################
68 | #
69 | # Please note that the displayed counts have already been scaled. You would now expect
70 | # a more or less normal distribution of library size within your dataset.
71 | 
72 | bc.pl.librarysize_overview(adata)
73 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/plotting/plot_riverplot.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Comparing categorical variables
 3 | ===============================
 4 | 
 5 | This example shows you how to generate riverplots to compare categorical columns,
 6 | for example to compare multiple annotations.
 7 | This way you can easily check (visually) for discrepancies.
 8 | 
 9 | """
10 | 
11 | 
12 | import besca as bc
13 | import pytest
14 | pytest.skip('Test is only for here as example and should not be executed')
15 | # import data
16 | adata = bc.datasets.Baron2016_processed()
17 | 
18 | ###############################################################################
19 | # compare two categories: annotations made by different annotators
20 | # ----------------------------------------------------------------
21 | 
22 | 
23 | bc.pl.riverplot_2categories(adata, ["assigned_cluster", "celltype2"])
24 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/plotting/plot_split_gene_expression.py:
--------------------------------------------------------------------------------
# TODO: marker carried over from the original docstring; the outstanding task
# is not specified. It lives here so that the docstring starts with its title.
"""
plotting gene expression
========================

This example shows you some of the different plots you can use to plot gene expression.

"""
import besca as bc
import pytest
# Raising pytest's skip at import time stops execution of this module here.
pytest.skip('Test is only for here as example and should not be executed')
# import data
adata = bc.datasets.Haber2017_processed()

###############################################################################
# compare two conditions
# ----------------------
#
# You can use the split violin plot to compare gene expression for two different conditions.

bc.pl.gene_expr_split(adata, genes=["Defa24", "Gm15284"], split_variable="donor")

###############################################################################
#
# Use a stacked split violin plot to compare this for several genes at the same time.

bc.pl.gene_expr_split_stacked(
    adata=adata,
    genes=["Defa24", "Gm15284"],
    split_variable="donor",
    subset_variable="region_x",
)
33 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/preprocessing/README.txt:
--------------------------------------------------------------------------------
1 | Preprocessing
2 | -------------
3 | 
4 | This section highlights some of the features of the preprocessing functions included within BESCA.


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/preprocessing/plot_example_filtering.py:
--------------------------------------------------------------------------------
 1 | """
 2 | performing filtering using besca
 3 | ================================
 4 | 
 5 | This example demonstrates the entire process of filtering out cells/genes ob subpar quality
 6 | before proceeding with analysis. 
 7 | 
 8 | """
 9 | 
10 | import besca as bc
11 | import scanpy as sc
12 | import matplotlib.pyplot as plt
13 | import pytest
14 | pytest.skip('Test is only for here as example and should not be executed')
15 | # load example dataset
16 | adata = bc.datasets.pbmc3k_raw()
17 | 
18 | # set standard filtering parameters
19 | min_genes = 600
20 | min_cells = 2
21 | min_UMI = 600
22 | max_UMI = 6500
23 | max_mito = 0.05
24 | max_genes = 1900
25 | 
26 | ###############################################################################
27 | # visualization of thresholds
28 | # ---------------------------
29 | #
30 | # First the chosen thresholds are visualized to ensure that a suitable cutoff has been chosen.
31 | 
32 | # Visualize filtering thresholds
33 | fig, ((ax1, ax2, ax3), (ax4, ax5, ax6)) = plt.subplots(ncols=3, nrows=2)
34 | fig.set_figwidth(15)
35 | fig.set_figheight(8)
36 | fig.tight_layout(pad=4.5)
37 | 
38 | bc.pl.kp_genes(adata, min_genes=min_genes, ax=ax1)
39 | bc.pl.kp_cells(adata, min_cells=min_cells, ax=ax2)
40 | bc.pl.kp_counts(adata, min_counts=min_UMI, ax=ax3)
41 | bc.pl.max_counts(adata, max_counts=max_UMI, ax=ax4)
42 | bc.pl.max_mito(
43 |     adata, max_mito=max_mito, annotation_type="SYMBOL", species="human", ax=ax5
44 | )
45 | bc.pl.max_genes(adata, max_genes=max_genes)
46 | 
47 | ###############################################################################
48 | # application of filtering thresholds
49 | # -----------------------------------
50 | #
51 | # Using the chosen thresholds the data is filtered. Before and after filtering results are depicted to compare.
52 | 
53 | # visualize data before filtering
54 | sc.pl.violin(
55 |     adata, ["n_counts", "n_genes", "percent_mito"], multi_panel=True, jitter=0.4
56 | )
57 | 
58 | print(
59 |     "The AnnData object currently contains:",
60 |     str(adata.shape[0]),
61 |     "cells and",
62 |     str(adata.shape[1]),
63 |     "genes",
64 | )
65 | print(adata)
66 | 
67 | # perform filtering
68 | adata = bc.pp.filter(
69 |     adata,
70 |     max_counts=max_UMI,
71 |     max_genes=max_genes,
72 |     max_mito=max_mito,
73 |     min_genes=min_genes,
74 |     min_counts=min_UMI,
75 |     min_cells=min_cells,
76 | )
77 | 
78 | # visualize data after filtering
79 | sc.pl.violin(
80 |     adata, ["n_counts", "n_genes", "percent_mito"], multi_panel=True, jitter=0.4
81 | )
82 | 
83 | print(
84 |     "The AnnData object now contains:",
85 |     str(adata.shape[0]),
86 |     "cells and",
87 |     str(adata.shape[1]),
88 |     "genes",
89 | )
90 | print(adata)
91 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/preprocessing/plot_pca_neighbors_clustering.py:
--------------------------------------------------------------------------------
"""
cluster generation
==================

This example demonstrates how to perform highly variable gene selection, PCA, nearest neighbor calculation, and clustering.

"""

import besca as bc
import scanpy as sc
import pytest
# Raising pytest's skip at import time stops execution of this module here.
pytest.skip('Test is only for here as example and should not be executed')
# import example dataset that has previously been filtered
adata = bc.datasets.pbmc3k_filtered()
# We get the raw matrix containing all the initial genes, keeping the filtering on the cells
adata = bc.get_raw(adata)

###############################################################################
# highly variable gene selection
# ------------------------------
#
# select highly variable genes (considers correction for gene expression level)

# define thresholds for highly variable genes
variable_genes_min_mean = 0.01
variable_genes_max_mean = 5
variable_genes_min_disp = 0.4

# identify genes with variable expression
filter_result = sc.pp.filter_genes_dispersion(
    adata.X,
    min_mean=variable_genes_min_mean,
    max_mean=variable_genes_max_mean,
    min_disp=variable_genes_min_disp,
)
sc.pl.filter_genes_dispersion(filter_result)
nbr_variable_genes = sum(filter_result.gene_subset)
print("number of variable genes selected ", nbr_variable_genes)

# perform the actual filtering (keep only the columns flagged in gene_subset)
adata = adata[:, filter_result.gene_subset]

###############################################################################
# set random seed
# ---------------
# To get reproducible results you need to define a random seed for all of the stochastic
# processes, such as e.g. PCA, neighbors, etc.

# set random seed
random_seed = 0

###############################################################################
# PCA
# ---

# log transform our data (numbers are easier to work with like this)
sc.pp.log1p(adata)

# Scale data to unit variance and zero mean, and cut-off at max value 10
sc.pp.scale(adata, max_value=10)

# calculate 50 principal components of the dataset
sc.tl.pca(adata, random_state=random_seed, svd_solver="arpack")

# visualize the amount of variance explained by each PC
sc.pl.pca_variance_ratio(adata)

# visualize the loadings onto the first 3 PCs
sc.pl.pca_loadings(adata)

###############################################################################
# nearest neighbors
# -----------------

sc.pp.neighbors(adata, n_neighbors=15, random_state=random_seed, n_pcs=50)

###############################################################################
# leiden clustering
# -----------------

sc.tl.leiden(adata, random_state=random_seed)

###############################################################################
# UMAP and t-SNE generation
# -------------------------

# calculate UMAP
sc.tl.umap(adata, random_state=random_seed)

# calculate t-SNE
sc.tl.tsne(adata, random_state=random_seed)

###############################################################################
# visualize the results
# ---------------------

sc.pl.umap(adata, color=["leiden"])
sc.pl.tsne(adata, color=["leiden"])
99 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/tools/README.txt:
--------------------------------------------------------------------------------
1 | Tools
2 | -----
3 | 
4 | This section contains all examples related to besca tools.


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/tools/plot_reclustering_function.py:
--------------------------------------------------------------------------------
"""
reclustering on specific leiden clusters
========================================

This example demonstrates how to perform a reclustering on a selected subset of
leiden clusters. You will want to do this for example during the process of celltype
annotation, when the clusters do not have a sufficient resolution to separate
all clusters and mixed cell populations still exist.

"""

import besca as bc
import scanpy as sc
import pytest
# Raising pytest's skip at import time stops execution of this module here.
pytest.skip('Test is only for here as example and should not be executed')
# load and preprocess data (here we will start from a preprocessed dataset)
adata = bc.datasets.pbmc3k_processed()

# extract subset using the recluster function which is part of the reclustering (rc) toolkit
adata_subset = bc.tl.rc.recluster(
    adata,
    celltype=("2", "3", "4", "5", "6", "8", "9", "10", "11", "12"),
    celltype_label="leiden",
    resolution=1.2,
)


# visualize the new clusters
sc.pl.umap(
    adata_subset, color=["leiden", "CD3G", "CD8A", "CD4", "IL7R", "NKG7", "GNLY"]
)

# append new celltype labels to the subclusters.
# This is an approximate hand annotation that should be refined in more depth.
# The trailing number on each line is the index of the subcluster it labels.
labels = [
    "NK cell",  # 0
    "CD4 T-cell",  # 1
    "CD8 T-cell",  # 2
    "CD4 T-cell",  # 3
    "CD8 T-cell",  # 4
    "CD8 T-cell",  # 5
    "CD4 T-cell",  # 6
    "CD4 T-cell",  # 7
    "CD4 T-cell",  # 8
    "CD4 T-cell",  # 9
    "CD4 T-cell",  # 10
    "CD4 T-cell",  # 11
    "CD4 T-cell",  # 12
    "CD4 T-cell",  # 13
    "CD4 T-cell",  # 14
    "CD4 T-cell",  # 15
    "CD4 T-cell",  # 16
    "CD4 T-cell",  # 17
    "CD4 T-cell",  # 18
    "CD4 T-cell",  # 19
]

# Keep one label per leiden cluster present in the subset. Only 20 labels are
# defined above, so a subset with more clusters raises an IndexError here.
new_labels = [labels[i] for i in range(len(adata_subset.obs.get("leiden").value_counts().index.tolist()))]


# merge the labels back into the original adata object
# note this will overwrite whatever was saved in adata.obs.celltype;
# here it was not assigned yet.
bc.tl.rc.annotate_new_cellnames(
    adata, adata_subset, names=new_labels, new_label="celltype"
)
67 | 
68 | 


--------------------------------------------------------------------------------
/besca/examples/gallery_examples/workflows/README.txt:
--------------------------------------------------------------------------------
1 | Workflows
2 | ---------
3 | 
4 | Demonstration workflows showing you how to perform certain tasks.


--------------------------------------------------------------------------------
/besca/export/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.export._export import (
 2 |     X_to_mtx,
 3 |     analysis_metadata,
 4 |     clustering,
 5 |     generate_gep,
 6 |     write_labeling_to_files,
 7 |     labeling_info,
 8 |     pseudobulk,
 9 |     ranked_genes,
10 |     raw_to_mtx,
11 | )
12 | 
# Public API of besca.export, i.e. the names re-exported by `from besca.export import *`.
__all__ = [
    # matrix writers
    "X_to_mtx", "raw_to_mtx",
    # clustering and labeling exports
    "clustering", "write_labeling_to_files", "labeling_info",
    # metadata and expression summaries
    "analysis_metadata", "generate_gep", "ranked_genes", "pseudobulk",
]
24 | 


--------------------------------------------------------------------------------
/besca/pl/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.pl._filter_threshold_plots import (
 2 |     kp_genes,
 3 |     kp_counts,
 4 |     kp_cells,
 5 |     max_counts,
 6 |     max_genes,
 7 |     max_mito,
 8 | )
 9 | from besca.pl._split_gene_expression import gene_expr_split, gene_expr_split_stacked
10 | from besca.pl._celltype_quantification import (
11 |     celllabel_quant_boxplot,
12 |     celllabel_quant_stackedbar,
13 | )
14 | from besca.pl._qc_plots import (
15 |     dropouts,
16 |     librarysize_overview,
17 |     detected_genes,
18 |     library_size,
19 |     transcript_capture_efficiency,
20 |     top_genes_counts,
21 | )
22 | 
23 | from besca.pl._crispr_plots import (
24 |     infection_count,
25 |     cell_per_KO,
26 |     infection_level,
27 |     plot_expression_by_sample,
28 |     avg_KO_persample,
29 |     KO_dotplot,
30 |     compute_plot_de_crispr,
31 |     enrichement_per_cluster,
32 |     plot_comparison_of_cells
33 | )
34 | from besca.pl._general import stacked_split_violin, box_per_ind, flex_dotplot
35 | from besca.pl._dot_heatmap import dot_heatmap, dot_heatmap_split, dot_heatmap_split_greyscale
36 | from besca.pl._update_palette import update_qualitative_palette
37 | from besca.pl._nomenclature_network import nomenclature_network
38 | from besca.pl._riverplot import riverplot_2categories
39 | 
# Public API of besca.pl, i.e. the names re-exported by `from besca.pl import *`.
__all__ = [
    # filter threshold plots
    "kp_genes", "kp_counts", "kp_cells", "max_counts", "max_genes", "max_mito",
    # quality control plots
    "dropouts", "detected_genes", "library_size", "librarysize_overview",
    "transcript_capture_efficiency", "top_genes_counts",
    # CRISPR plots
    "infection_count", "cell_per_KO", "infection_level",
    "plot_expression_by_sample", "avg_KO_persample", "KO_dotplot",
    "compute_plot_de_crispr", "enrichement_per_cluster",
    "plot_comparison_of_cells",
    # gene expression plots
    "gene_expr_split", "gene_expr_split_stacked", "box_per_ind",
    "stacked_split_violin",
    # celltype quantification
    "celllabel_quant_boxplot", "celllabel_quant_stackedbar",
    # dot heatmaps
    "dot_heatmap", "dot_heatmap_split", "dot_heatmap_split_greyscale",
    # palettes, nomenclature, riverplots and dotplots
    "update_qualitative_palette", "nomenclature_network",
    "riverplot_2categories", "flex_dotplot",
]
76 | 


--------------------------------------------------------------------------------
/besca/pl/_nomenclature_network.py:
--------------------------------------------------------------------------------
 1 | import importlib
 2 | 
 3 | import networkx as nx
 4 | import pandas as pd
 5 | from matplotlib import pyplot as plt
 6 | 
 7 | def nomenclature_network(
 8 |     config_file: str,
 9 |     selected_roots=[],
10 |     root_term="None",
11 |     font_size=7,
12 |     node_size=200,
13 |     node_color="tan",
14 |     alpha=0.8,
15 |     figsize=(7,7)
16 | ):
17 |     """Plot a nomenclature network based on annotation config file.
18 | 
19 |     This function plots the relations between celltypes as described within an annotation config file, as the one provided with besca.
20 |     It displays parent - child term relation as a directed graph G ( V, E); Subsetting of such graph is possible using selected_roots argument.
21 | 
22 | 
23 |     Parameters
24 |     ----------
25 |     config_file: `str`
26 |         config file from besca, expects a path to a tab separated file containing Parent and Term columns
27 |     selected_roots: `list`
28 |         if list contained terms, will only display the hierarchy starting from those terms.
29 |     root_term : `str`
30 |         the string indicating in the config file that a term does not have a parent term.
31 |     figsize: (width, height) or None | default = (7,7)
32 |         optional parameter to define the figure size of the plot that is to be generated
33 | 
34 |     Returns
35 |     -------
36 |     Figure
37 |         A matplotlib plt object containing the generated plot.
38 | 
39 |     Example
40 |     -------
41 |     >>> import besca as bc
42 |     >>> import pkg_resources
43 |     >>> config_file = pkg_resources.resource_filename('besca', 'datasets/genesets/CellNames_scseqCMs6_config.tsv')
44 |     >>> plt = bc.pl.nomenclature_network(config_file)
45 |     >>> plt.show()
46 |     >>> plt = bc.pl.nomenclature_network(config_file, selected_roots = ['Epithelial', 'Tcell'])
47 |     >>> plt.show()
48 | 
49 |     """
50 |     pydot_import = importlib.util.find_spec("pydot")
51 | 
52 |     if pydot_import is None:
53 |         raise ImportError(
54 |             "_nomenclature_network.py requires pydot. Install with pip install pydot"
55 |         )
56 |     # read tsv file
57 |     df = pd.read_csv(config_file, sep="\t")
58 | 
59 |     # By default root parents have the entry "None". we need to replace this with its own name so a network per root is created
60 |     roots_to_set = df["Parent"] == root_term
61 |     for row, root in zip(df.iterrows(), roots_to_set):
62 |         if root:
63 |             df.at[row[0], "Parent"] = row[1]["Term"]
64 | 
65 |     # We create the network with networkx library
66 |     G = nx.from_pandas_edgelist(
67 |         df, target="Term", source="Parent", create_using=nx.DiGraph()
68 |     )
69 |     ## Subgraph extraction if specific roots were given
70 |     if selected_roots:
71 |         selected_nodes = set()
72 |         for ss in selected_roots:
73 |             try:
74 |                 selected_nodes.update(nx.descendants(G, ss))
75 |             except Exception as e:
76 |                 print(ss + " node not found in config file")
77 | 
78 |         G = G.subgraph(list(selected_nodes) + selected_roots)
79 | 
80 |     if figsize is not None:
81 |         plt.figure(3, figsize=(figsize[0], figsize[1]))
82 |     nx.draw_networkx(
83 |         G,
84 |         nx.nx_pydot.pydot_layout(G),
85 |         font_size=font_size,
86 |         node_size=node_size,
87 |         node_color=node_color,
88 |         alpha=alpha,
89 |     )
90 |     plt.axis("off")
91 |     plt.tight_layout()
92 | 
93 |     return plt
94 | 


--------------------------------------------------------------------------------
/besca/pl/_update_palette.py:
--------------------------------------------------------------------------------
 1 | import sys
 2 | import re
 3 | import pandas as pd
 4 | from anndata import AnnData
 5 | from typing import Dict
 6 | 
 7 | 
 8 | def check_colors(aColor):
 9 |     """
10 |     convert the color given in hex if needed. This avoid warning message a posteriori
11 |     parameters
12 |     ----------
13 |     aColor: ``
14 |       color to check; expected tupple. Hex would be returned as input
15 | 
16 |     returns
17 |     -------
18 |        the color in hex
19 |     """
20 |     if isinstance(aColor, tuple) and len(aColor) == 3:
21 |         if aColor < (1, 1, 1):
22 |             r = round(aColor[0] * 255)
23 |             g = round(aColor[1] * 255)
24 |             b = round(aColor[2] * 255)
25 |         else:  # assuming rgb
26 |             r = aColor[0]
27 |             g = aColor[1]
28 |             b = aColor[1]
29 |         return "#{:02x}{:02x}{:02x}".format(r, g, b)
30 |     else:
31 |         matchingHex = re.search(r"^#(?:[0-9a-fA-F]{3}){1,2}$", aColor)
32 |         if matchingHex:
33 |             return aColor
34 |         else:
35 |             sys.exit("Color " + str(aColor) + "could not be converted")
36 | 
37 | 
def update_qualitative_palette(
    adata: AnnData,
    palette: Dict[str, str],
    group: str = "leiden",
    checkColors: bool = True,
) -> None:
    """Store a palette in adata so that plots colored by `group` use it.

    parameters
    ----------
    adata: `AnnData`
      the AnnData object
    palette: `dict`
        maps every value of the group observation to a color. Hex color
        values are advised to avoid warnings from matplotlib.
    group: `str`
        name of the adata.obs column the colors are set for.
        Used internally like this: `pd.Categorical(adata.obs[<group>]).categories.tolist()`
    checkColors: `boolean`
        if True, every palette color is passed through `check_colors`, which
        converts tuples of RGB values into hex values where needed.

    returns
    -------
    None; adata.uns[<group> + "_colors"] is set to the list of colors, ordered
    like the categories of the group column.
    """

    # Derive the categories the same way scanpy does it in
    # scanpy/plotting/_tools/scatterplots.py: _get_palette
    categories = pd.Categorical(adata.obs[group]).categories.tolist()

    # Every category needs a color, otherwise abort.
    if any(category not in palette.keys() for category in categories):
        sys.exit(
            "Please provide a palette dict containing all element of the group " + group
        )

    if checkColors:
        palette = {key: check_colors(value) for key, value in palette.items()}

    # Colors are stored in category order.
    adata.uns[group + "_colors"] = [palette[category] for category in categories]
    return None
80 | 


--------------------------------------------------------------------------------
/besca/pp/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.pp._filtering import filter, filter_gene_list
 2 | from besca.pp._fraction_pos import (
 3 |     frac_pos,
 4 |     frac_reads,
 5 |     mean_expr,
 6 |     top_counts_genes,
 7 |     top_expressed_genes,
 8 | )
 9 | from besca.pp._fraction_counts import fraction_counts
10 | from besca.pp._normalization import normalize_geometric
11 | from besca.pp._wrapper_Rfuncs import valOutlier, scTransform
12 | from besca.pp._crispr_pp import filter_perturb, extract_target
13 | 
# Public API of besca.pp, i.e. the names re-exported by `from besca.pp import *`.
__all__ = [
    # filtering
    "filter", "filter_gene_list",
    # expression fractions and top genes
    "frac_pos", "frac_reads", "mean_expr", "top_expressed_genes",
    "fraction_counts", "top_counts_genes",
    # normalization and R wrappers
    "normalize_geometric", "valOutlier", "scTransform",
    # CRISPR preprocessing
    "filter_perturb", "extract_target",
]
29 | 


--------------------------------------------------------------------------------
/besca/pp/_fraction_counts.py:
--------------------------------------------------------------------------------
 1 | import sys
 2 | from pandas import read_csv
 3 | from numpy import sum, any
 4 | import warnings
 5 | from besca.datasets._mito import get_mito_genes
 6 | 
 7 | def fraction_counts(
 8 |     adata, species="human", name="percent_mito", use_genes="SYMBOL", specific_file=None
 9 | ):
10 |     """Function to calculate fraction of counts per cell from a gene list.
11 |     This function calculates the fraction of counts per cell for
12 |     a list of genes (for example mito genes) if no specific file is given.
13 |     Note that the input file consists of two columns
14 |     (ENSEMBL gene id and gene symbol) tab
15 |     separated
16 | 
17 |     Parameters
18 |     ----------
19 |     adata: `AnnData`
20 |         AnnData object
21 |     species: `str` | default = human
22 |         species for mitochondrial content evaluation
23 |     name: `str` | default = percent_mito
24 |         String identifying the column name to which the results
25 |         should be written to in the AnnData.obs object
26 |     use_genes: `SYMBOL` or `ENSEMBL` | default = SYMBOL
27 |         String defining whether ENSEMBL id's or gene symbols are used in the
28 |         adata.var_names (defines which column of input gene list is read)
29 |     specific_file: `str` | default None.
30 |         if indicated, the file will be used to extract the gene list
31 |     Returns
32 |     -------
33 |     None
34 |         Returns None but updates adata with new column named 'name'
35 |         containing calculated fraction of counts.
36 | 
37 |     Example
38 |     -------
39 |     >>> import besca as bc
40 |     >>> import os
41 |     >>> adata = bc.datasets.simulated_pbmc3k_raw()
42 |     >>> bc.pp.fraction_counts(adata,  'human', use_genes='SYMBOL', specific_file=f"{os.path.dirname(__file__)[:-3]}/datasets/mito_files/test.mito.tsv")
43 |     >>> counts = adata.obs.head(5)
44 |     """
45 |     if specific_file is None:
46 |         gene_list = get_mito_genes(species, use_genes)
47 |     else:
48 |         # ENS_GENE_ID  GENE_SYMBOL (2 cols)
49 |         if use_genes == "SYMBOL":
50 |             gene_list = list(read_csv(specific_file, header=None, sep="\t")[1])
51 |         elif use_genes == "ENSEMBL":
52 |             gene_list = list(read_csv(specific_file, header=None, sep="\t")[0])
53 |     genes = [i for i in adata.var_names if i in gene_list]
54 |     # for each cell compute fraction of counts in gene_list vs. all genes
55 |     # axis=1 --> sum over rows
56 |     if len(genes) > 0:
57 |         n_counts = sum(adata.X, axis=1).A1
58 |         if any(n_counts == 0):
59 |             warnings.warn(
60 |                 "Some of the cells contain no counts. \
61 |                            Do not forget to remove 'empty' cells from data."
62 |             )
63 |             n_counts[n_counts == 0] = float("inf")
64 |         adata.obs[name] = sum(adata[:, genes].X, axis=1).A1 / n_counts
65 |     else:
66 |         adata.obs[name] = 0.0
67 |         print(
68 |             "None of the genes from input list found in data set. \
69 |                Please ensure you have correctly specified use_genes to match \
70 |                the type of genes saved in adata.var_names."
71 |         )
72 |     return None
73 | 


--------------------------------------------------------------------------------
/besca/st/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.st._FAIR_export import (
 2 |     export_cp10k,
 3 |     export_regressedOut,
 4 |     export_norm_citeseq,
 5 |     export_clustering,
 6 |     export_metadata,
 7 |     export_rank,
 8 |     export_celltype,
 9 | )
10 | from besca.st._wrapper_funcs import (
11 |     setup,
12 |     setup_citeseq,
13 |     read_matrix,
14 |     filtering_cells_genes_min,
15 |     filtering_mito_genes_max,
16 |     per_cell_normalize,
17 |     clr_normalize,
18 |     highly_variable_genes,
19 |     regress_out,
20 |     batch_correction,
21 |     pca_neighbors_umap,
22 |     clustering,
23 |     additional_labeling,
24 |     celltype_labeling,
25 | )
26 | from besca.st._wrapper_Rfuncs import dsb_normalize, deviance, maxLikGlobalDimEst
27 | from besca.st._setup_funcs import create_button, create_popup
28 | from besca.st._qc_report import write_qc
29 | 
# Public API of besca.st. Every name imported above is listed so that
# `from besca.st import *` exposes the same functions as attribute access.
__all__ = [
    "read_matrix",
    "filtering_cells_genes_min",
    "filtering_mito_genes_max",
    "export_cp10k",
    "export_regressedOut",
    "export_clustering",
    "export_metadata",
    "export_rank",
    "export_celltype",
    "additional_labeling",
    "celltype_labeling",
    # names that were imported by this module but missing from __all__
    "export_norm_citeseq",
    "setup",
    "setup_citeseq",
    "per_cell_normalize",
    "clr_normalize",
    "highly_variable_genes",
    "regress_out",
    "batch_correction",
    "pca_neighbors_umap",
    "clustering",
    "dsb_normalize",
    "deviance",
    "maxLikGlobalDimEst",
    "create_button",
    "create_popup",
    "write_qc",
]
43 | 


--------------------------------------------------------------------------------
/besca/st/_setup_funcs.py:
--------------------------------------------------------------------------------
 1 | from IPython.display import HTML
 2 | from IPython.display import Javascript
 3 | 
 4 | 
 5 | def create_button():
 6 |     input_form = """
 7 |     <div style="background-color:gainsboro; width:600px; padding:20px;">
 8 |     Continue running notebook with the given filtering parameters. <br>
 9 |     <button onclick="execute()">Continue</button>
10 |     </div>
11 |     """
12 | 
13 |     javascript = """
14 |     <script type="text/Javascript">
15 |         function execute(){
16 |             var command = IPython.notebook.execute_cells_below();
17 |             var kernel = IPython.notebook.kernel;
18 |             kernel.execute(command);
19 |         }
20 |     """
21 | 
22 |     return HTML(input_form + javascript)
23 | 
24 | 
def create_popup():
    """Build a Javascript snippet that asks whether to continue the notebook.

    The script shows a `confirm` dialog; accepting calls its `execute()`
    function, declining calls its `interrupt()` function.

    Returns
    -------
    IPython.display.Javascript
        the script wrapped for display in a notebook.
    """
    # Assembled line by line so that the whitespace of the script is explicit.
    popup_script = (
        "\n"
        "    function execute(){\n"
        "            var command = IPython.notebook.execute_cells_below();\n"
        "            var kernel = IPython.notebook.kernel;\n"
        "            kernel.execute(command);\n"
        "        }\n"
        "    \n"
        "    function interrupt(){\n"
        "            var command = IPython.notebook.interrupt;\n"
        "            var kernel = IPython.notebook.kernel;\n"
        "            kernel.execute(command);\n"
        "        }\n"
        '    if(confirm("Continue running with the chosen standard parameters?")){execute()} else{interrupt()}\n'
        "    "
    )
    return Javascript(popup_script)
42 | 


--------------------------------------------------------------------------------
/besca/tl/README.md:
--------------------------------------------------------------------------------
1 | # Documentation of Abbreviations
2 | 
3 | bcor = batch correction  
4 | rc = reclustering  
5 | dge = differential gene expression  
6 | sig = signature scoring  
7 | 


--------------------------------------------------------------------------------
/besca/tl/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.tl import auto_annot, bcor, dge, rc, sig, crispr
 2 | from besca.tl._annotate_cellnames import annotate_cells_clustering
 3 | from besca.tl._count_occurrences import (
 4 |     count_occurrence,
 5 |     count_occurrence_subset,
 6 |     count_occurrence_subset_conditions,
 7 | )
 8 | from besca.tl._annot_compare import report, plot_confusion_matrix
 9 | 
# Public API of besca.tl; each name is listed exactly once.
__all__ = [
    "rc",
    "dge",
    "bcor",
    "crispr",
    "sig",
    "count_occurrence",
    "count_occurrence_subset",
    "count_occurrence_subset_conditions",
    "annotate_cells_clustering",
    "auto_annot",
    "report",
    "plot_confusion_matrix",
]
25 | 


--------------------------------------------------------------------------------
/besca/tl/_annotate_cellnames.py:
--------------------------------------------------------------------------------
 1 | import sys
 2 | 
 3 | 
 4 | def annotate_cells_clustering(
 5 |     adata,
 6 |     new_cluster_labels,
 7 |     new_annotation_label="celltype",
 8 |     clustering_label="leiden",
 9 | ):
10 |     """Function to add annotation to adata.obs based on clustering
11 |     This function replaces the original cluster labels located in the column clustering_label with
12 |     the new values specified in the list new_cluster_lables. The values in this list need to be in the
13 |     same lexicographic order as the cluster values.
14 |     The order of this can be checked by running
15 |     ` sorted(adata.obs.get(clustering_label).unique(), key=int)` or
16 |     ` sorted(adata.obs.get(clustering_label).unique(), key=str)`
17 | 
18 |     parameters
19 |     ----------
20 | 
21 |     adata: AnnData
22 |         the AnnData object that is supposed to recieve a new annotation
23 |     new_cluster_labels: `list`
24 |         a list in correct lexicographic order of the new cluster labels
25 |     new_annotation_label: `str` | default = 'celltype'
26 |         string identifying the name underwhich the new cluster labels should be added to adata.obs
27 |     clustering_label: `str` | default = 'louvain'
28 |         string identifying the name underwhich the old cluster labels can be found in adata.obs
29 | 
30 |     returns
31 |     -------
32 | 
33 |     AnnData
34 |         The adata.obs has been updated with a new column containing the new annotation
35 | 
36 |     """
37 |     # get the cluster ids
38 |     if clustering_label not in adata.obs.columns:
39 |         sys.exit(clustering_label + " label not found")
40 |     try:
41 |         clusters = sorted(adata.obs.get(clustering_label).unique(), key=int)
42 |     # If int conversion does not work
43 |     except:
44 |         clusters = sorted(adata.obs.get(clustering_label).unique(), key=str)
45 |     # extract old clustering labels to a new dataframe
46 |     cluster_annotation = (
47 |         adata.obs.get(clustering_label).to_frame(name=new_annotation_label).copy()
48 |     )
49 |     # check if the number of new labels matches the number of clusters
50 |     if len(clusters) != len(new_cluster_labels):
51 |         sys.exit(
52 |             "Specified "
53 |             + str(len(new_cluster_labels))
54 |             + " new labels for a total of "
55 |             + str(len(clusters))
56 |             + " clusters. Numbers should match! No changes were made.\n"
57 |         )
58 | 
59 |     # replace old labels with the new labels
60 |     for i in range(0, len(clusters)):
61 |         cluster_annotation.get(new_annotation_label).replace(
62 |             clusters[i], new_cluster_labels[i], inplace=True
63 |         )
64 | 
65 |     # write results back into adata
66 |     adata.obs = adata.obs.merge(
67 |         cluster_annotation, how="outer", left_index=True, right_index=True
68 |     )
69 |     return None
70 | 


--------------------------------------------------------------------------------
/besca/tl/auto_annot/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.tl.auto_annot._auto_annot import (
 2 |     read_data,
 3 |     read_raw,
 4 |     read_adata,
 5 |     merge_data,
 6 |     naive_merge,
 7 |     scanorama_merge,
 8 |     remove_genes,
 9 |     intersect_genes,
10 |     remove_nonshared,
11 |     fit,
12 |     linear_svm,
13 |     rbf_svm,
14 |     sgd_svm,
15 |     random_forest,
16 |     logistic_regression,
17 |     logistic_regression_ovr,
18 |     logistic_regression_elastic,
19 |     adata_predict,
20 |     predict,
21 |     adata_pred_prob,
22 |     predict_proba,
23 |     report,
24 |     scanvi_predict,
25 |     scvi_merge,
26 |     visualise_scvi_merge,
27 | )
28 | 
29 | __all__ = [
30 |     "read_data",
31 |     "read_raw",
32 |     "read_adata",
33 |     "merge_data",
34 |     "naive_merge",
35 |     "scanorama_merge",
36 |     "remove_genes",
37 |     "intersect_genes",
38 |     "remove_nonshared",
39 |     "fit",
40 |     "linear_svm",
41 |     "rbf_svm",
42 |     "sgd_svm",
43 |     "random_forest",
44 |     "logistic_regression",
45 |     "logistic_regression_ovr",
46 |     "logistic_regression_elastic",
47 |     "adata_predict",
48 |     "predict",
49 |     "adata_pred_prob",
50 |     "predict_proba",
51 |     "report",
52 |     "scanvi_predict",
53 |     "scvi_merge",
54 |     "visualise_scvi_merge",
55 | ]
56 | 


--------------------------------------------------------------------------------
/besca/tl/bcor/__init__.py:
--------------------------------------------------------------------------------
1 | from besca.tl.bcor._mnnpy_batchcorrection import postprocess_mnnpy, batch_correct
2 | 
3 | __all__ = ["batch_correct", "postprocess_mnnpy"]
4 | 


--------------------------------------------------------------------------------
/besca/tl/crispr/__init__.py:
--------------------------------------------------------------------------------
1 | from besca.tl.crispr._crispr_tools import execute_de_sgRNA, find_distances
2 | 
3 | __all__ = ["execute_de_sgRNA", "find_distances"]
4 | 


--------------------------------------------------------------------------------
/besca/tl/dge/__init__.py:
--------------------------------------------------------------------------------
1 | from besca.tl.dge._dge import perform_dge, plot_interactive_volcano, get_de
2 | 
3 | __all__ = ["perform_dge", "plot_interactive_volcano", "get_de"]
4 | 


--------------------------------------------------------------------------------
/besca/tl/rc/__init__.py:
--------------------------------------------------------------------------------
1 | from besca.tl.rc._reclustering import recluster, annotate_new_cellnames
2 | 
3 | __all__ = ["recluster", "annotate_new_cellnames"]
4 | 


--------------------------------------------------------------------------------
/besca/tl/sig/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca.tl.sig._annot import (
 2 |     add_anno,
 3 |     export_annotconfig,
 4 |     getset,
 5 |     make_anno,
 6 |     match_cluster,
 7 |     match_label,
 8 |     obtain_dblabel,
 9 |     obtain_new_label,
10 |     read_annotconfig,
11 |     score_mw,
12 | )
13 | from besca.tl.sig._gems_link import get_gems, get_similar_geneset, insert_gems
14 | from besca.tl.sig._io_sig import convert_to_directed, read_GMT_sign, write_gmtx_forgems
15 | from besca.tl.sig._sig import (
16 |     combined_signature_score,
17 |     compute_signed_score,
18 |     filter_by_set,
19 |     filter_siggenes,
20 |     convert_siggenes,
21 |     make_gmtx,
22 | )
23 | 
24 | from besca.tl.sig._silhouette import silhouette_computation
25 | 
26 | __all__ = [
27 |     "combined_signature_score",
28 |     "compute_signed_score",
29 |     "filter_by_set",
30 |     "filter_siggenes",
31 |     "convert_siggenes",
32 |     "read_GMT_sign",
33 |     "getset",
34 |     "score_mw",
35 |     "add_anno",
36 |     "make_anno",
37 |     "read_annotconfig",
38 |     "match_cluster",
39 |     "obtain_new_label",
40 |     "obtain_dblabel",
41 |     "get_gems",
42 |     "insert_gems",
43 |     "get_similar_geneset",
44 |     "export_annotconfig",
45 |     "convert_to_directed",
46 |     "make_gmtx",
47 |     "write_gmtx_forgems",
48 |     "silhouette_computation",
49 |     "match_label",
50 | ]
51 | 


--------------------------------------------------------------------------------
/besca/tl/sig/_helper.py:
--------------------------------------------------------------------------------
 1 | # this file contains the helper functions
 2 | # for signature scoring analysis in python using scanpy
 3 | 
 4 | 
 5 | def _to_geneid(conversionTable, symbol):
 6 |     """Convert the symbol into another using the conversionSymbol table,
 7 |     converting symbol from the first column of the table to the index of such.
 8 |     To use to convert from HGNC symobl to Ensembl and vice-versa e.g.
 9 | 
10 |     Parameters
11 |     ----------
12 |     conversionTable:class:`~Serie`
13 |         A serie containing
14 |     symbol:class`~str`: symbol to convert.
15 |         Should match in the first column of conversionTable
16 | 
17 |     Returns
18 |     -------
19 |     a str, the converted symbol.
20 | 
21 |     Example
22 |     -------
23 |     >>> import pandas as pd
24 |     >>> x = pd.Series(['aa', 'bb', 'cc', 'dd', 'ee'], index=['a', 'b', 'c', 'd', 'e'])
25 |     >>> _to_geneid( x, 'bb')
26 |     'b'
27 |     """
28 |     try:
29 |         res = conversionTable[conversionTable == symbol].index.format()[0]
30 |         return res
31 |     except IndexError:
32 |         return None
33 | 


--------------------------------------------------------------------------------
/besca/tl/sig/_metrics.py:
--------------------------------------------------------------------------------
 1 | # this file contains the metric functions for signature scoring analysis using scanpy
 2 | # those functions compute scores for each signature (genesets)
 3 | # import using the python version 1.3.2 at least is a prerequisit!
 4 | # needs to be checked in all functions
 5 | 
 6 | from scanpy import AnnData
 7 | from scanpy.tools import score_genes
 8 | 
 9 | 
def _handle_signature(
    signature: dict,
    method: str,
    adata: AnnData,
    signature_name: str,
    overwrite: bool,
    verbose: bool,
    use_raw: bool,
):
    """Compute the signed score (UP minus DN) of one signature.

    For every direction of the signature a score is computed and the
    per-direction scores are summed, scores of the "DN" direction being
    multiplied by -1 first (scanpy = UP - DN).
    The result is stored in adata.obs with the key:
    "score_" + signature_name + "_" + method.
    The only method implemented is 'scanpy', which uses scanpy's score_genes.
    For any other method no direction is scored and the stored column only
    contains zeros.
    Method in development. Not all options implemented yet.
    TODO : Score could be computed while reading the gmt (one loop less).
    However here we divided geneset provenance and computation (to discuss)

    Parameters
    ----------
    signature: `dict`
        dictionary of signatures; signature[signature_name] is itself a
        dictionary whose keys are the directions (UP/DN) and whose values are
        the genes.
    method: `str`
        a string indicating which method to use ('scanpy' available)
    adata:class:`~anndata.AnnData`
        An AnnData object (from scanpy).
        Following besca convention, var names (gene) are HGNC symbol. It should match the signatures values.
    signature_name: `str`
        key of the signature to score in `signature`
    overwrite: `boolean`
        if False and the score column already exists in adata.obs, nothing is
        computed
    verbose: `boolean`
        if True, progress messages are printed
    use_raw: `boolean`
        forwarded to score_genes

    Returns
    -------
    None
    The adata object is modified.
    """
    scoreName = "score_" + signature_name + "_" + method
    if verbose:
        print("Computing " + scoreName)
    if not overwrite:
        if scoreName in adata.obs:
            if verbose:
                print(
                    signature_name
                    + " skipped was already  precomputed with this method (",
                    scoreName,
                    ")",
                )
            return None
    score = [0] * adata.n_obs
    # Not copying columns but rather deleting them afterward is faster. For each direction the column is computed in adata.obs.
    # If the genes are not found, exception to manage as data.obs is not updated
    # The scores are combined and then deleted.
    for direction in signature[signature_name].keys():
        if method == "scanpy":
            currentName = scoreName + direction
            score_genes(
                adata,
                signature[signature_name][direction],
                score_name=currentName,
                use_raw=use_raw,
                copy=False,
            )
            try:
                scoreTMP = adata.obs[currentName]
                adata.obs = adata.obs.drop(columns=currentName)
                if direction == "DN":
                    scoreTMP = [x * -1 for x in scoreTMP]
            except Exception:
                # Best effort: a direction whose temporary column cannot be
                # read contributes 0. Unlike a bare except this lets
                # KeyboardInterrupt and SystemExit propagate.
                scoreTMP = [0] * adata.n_obs
                if verbose:
                    print("score " + currentName + " is 0. Exception")
            # SUMMING
            score = [total + current for total, current in zip(score, scoreTMP)]
    adata.obs[scoreName] = score
    return None
85 | 


--------------------------------------------------------------------------------
/besca/tl/sig/_silhouette.py:
--------------------------------------------------------------------------------
 1 | import logging
 2 | import sys
 3 | from dataclasses import dataclass
 4 | 
 5 | import anndata
 6 | import matplotlib
 7 | import pandas as pd
 8 | import seaborn as sns
 9 | import sklearn
10 | 
@dataclass
class silhouette_in:
    """Container for a silhouette analysis: a plot and the average score."""

    # Axes holding the per-sample silhouette plot; the figure is reachable
    # with obj.show_samples.get_figure(). The annotation is a string so that
    # defining the class does not depend on matplotlib.axes being loaded.
    show_samples: "matplotlib.axes.Axes"
    # average silhouette score
    averaged: float
15 | 
16 | 
def silhouette_computation(
    adata: anndata.AnnData,
    cluster: str = "dblabel",
    emb: str = "X_umap",
    verbose: bool = False,
) -> silhouette_in:
    """Compute the average and per cell (ie samples) silhouette score of a
    clustering on a given embedding.
    The per cell scores are summarised as one violin per cluster label.
    Return a silhouette_in object

    parameters
    ---------
    adata:  anndata.AnnData
    cluster: 'str'
      clustering to evaluate (should be a column in adata.obs)
    emb: str
        embedding on which the silhouette scores are computed.
        should be a key of  obsm
    verbose: bool
        if True, the average silhouette score is logged at INFO level

    returns
    -------
    silhouette_in dataclass object
        show_samples holds the axes of the violin plot and averaged the
        average silhouette score

    raises
    ------
    SystemExit
        if cluster is not in adata.obs or emb is not in adata.obsm

     Example
    -------
    >>> import besca as bc
    >>> adata = bc.datasets.simulated_pbmc3k_processed()
    >>> sils = bc.tl.sig.silhouette_computation (adata)
    >>> figure = sils.show_samples.get_figure()

    """
    # Import the submodules explicitly: a plain `import sklearn` or
    # `import matplotlib` does not guarantee that `sklearn.metrics` and
    # `matplotlib.pyplot` are available as attributes.
    from matplotlib import pyplot
    from sklearn.metrics import silhouette_samples, silhouette_score

    if cluster not in adata.obs.keys():
        sys.exit(cluster + " label not found in the dataset (should be in obs)")
    if emb not in adata.obsm.keys():
        sys.exit(emb + " not found in the dataset (should be in obsm)")

    labels = adata.obs.get(cluster)
    embedding = adata.obsm[emb]

    silhouette_avg = silhouette_score(embedding, labels)
    sample_silhouette_values = silhouette_samples(embedding, labels)
    if verbose:
        # logging formats lazily with %-style placeholders; without the
        # placeholder the extra argument makes the record fail to format
        logging.info("The average silhouette_score is : %s", silhouette_avg)

    # Group the per cell silhouette scores by cluster label, keeping the
    # labels in order of first appearance
    ith_value = {}
    for label in labels.unique():
        ith_value[label] = sample_silhouette_values[(labels == label).to_numpy()]

    long_df_silhouette = pd.concat(
        pd.DataFrame({"label": k, "silhouette": v}) for k, v in ith_value.items()
    )
    # TODO ADD PROPER TITLE/ AXIS/ MEAN OVERALL  and mean per label ?
    ax1 = sns.violinplot(
        y=long_df_silhouette["label"], x=long_df_silhouette["silhouette"], scale="count"
    )
    pyplot.close()  # Avoid plotting in function; bad practice
    silhouette_results = silhouette_in(ax1, silhouette_avg)

    return silhouette_results
87 | 


--------------------------------------------------------------------------------
/devtools/README.md:
--------------------------------------------------------------------------------
 1 | Scripts and tools used by BESCA developers
 2 | ===
 3 | Klas Hatj, Roland Schmucki, Jitao David Zhang
 4 | 
 5 | ## Test besca package in a virtual environment
 6 | 
 7 | The following commands can be used to test `besca` in a virtual environment.
 8 | 
 9 | ```
10 | ## load python 3.8
11 | ml purge
12 | ml load Python/3.8.2-GCCcore-9.3.0
13 | ## create and activate a virtual environment
14 | python -m venv test_besca
15 | source test_besca/bin/activate
16 | test_besca/bin/python -m pip install --upgrade pip
17 | ## clone besca and install it into the virtual environment
18 | git clone --branch scanpy1.8.2 git@github.com:Accio/besca.git
19 | cd test_besca/bin
20 | ./python -m pip install ../../besca
21 | ## run notebooks
22 | cd ../../besca
23 | bash devtools/run_workbooks.bash
24 | ## capture the version that we use
25 | ../../test_besca/bin/pip freeze | grep -v besca > devtools/requirements.txt
26 | ```
27 | 
28 | ## To fully recapitulate the environment where the development was done
29 | 
30 | Use `pip install -r devtools/requirements.txt` to recreate the environment in which the tests were run. besca itself is not listed in that file and is installed separately:
31 | 
32 | ```bash
33 | ../../test_besca/bin/pip install -r devtools/requirements.txt
34 | ../../test_besca/bin/python setup.py install
35 | ```
36 | 
37 | ## Install dependencies with conda
38 | 
39 | Most packages can be installed by conda, which also manages dependencies. To initialize a conda environment with all dependent packages for besca, go to the root directory and run:
40 | 
41 | ```
42 | mamba env create -f environment.yml ## double check the BESCA URL, sometimes it can be another branch than master
43 | conda activate besca_dev
44 | ```
45 | 


--------------------------------------------------------------------------------
/devtools/install_besca_editable.bash:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | kernel=besca_dev
 4 | 
 5 | ## pre-conditions:
 6 | ## 1. you are in the root path of besca, and 
 7 | ## 2. the conda/venv environment for besca development is activated
 8 | python setup.py develop
 9 | python -m ipykernel install --user --name "$kernel" --display-name "$kernel"
10 | 
11 | 


--------------------------------------------------------------------------------
/devtools/run_workbooks.bash:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | ## the script should run without any error before major release
 4 | 
 5 | ## pre-conditions:
 6 | ## 1. you are in the root path of besca, and 
 7 | ## 2. the conda/venv environment for besca development is activated
 8 | ## 3. besca_dev kernel has been installed (see install_besca_anew_local.bash)
 9 | 
10 | for notebook in "minimal_notebook.ipynb" "standard_workflow_besca2.ipynb" "celltype_annotation_besca.ipynb" "Signature_exports.ipynb" "Testing_Notebook.ipynb"; do
11 |     echo Running notebook "$notebook"
12 |     jupyter nbconvert --to notebook --execute workbooks/"$notebook"
13 |     jupyter nbconvert --clear-output workbooks/"$notebook"
14 | done
15 | 


--------------------------------------------------------------------------------
/docs/Makefile:
--------------------------------------------------------------------------------
 1 | # Minimal makefile for Sphinx documentation
 2 | 
 3 | # You can set these variables from the command line.
 4 | SPHINXOPTS    =
 5 | SPHINXBUILD   = sphinx-build
 6 | SOURCEDIR     = source
 7 | BUILDDIR      =../../besca-docs
 8 | PDFBUILDDIR = /tmp
 9 | PDF = ../besca-manual.pdf
10 | 
11 | # Put it first so that "make" without argument is like "make help".
12 | help:
13 | 	@$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
14 | 
15 | .PHONY: help Makefile
16 | 
17 | # Catch-all target: route all unknown targets to Sphinx using the new
18 | # "make mode" option.  $(O) is meant as a shortcut for $(SPHINXOPTS).
19 | %: Makefile
20 | 	@$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
21 | 
22 | latexpdf:
23 | 	$(SPHINXBUILD) -b latex $(ALLSPHINXOPTS) $(PDFBUILDDIR)/latex
24 | 	#                                          ^^^
25 | 	@echo "Running LaTeX files through pdflatex..."
26 | 	make -C $(PDFBUILDDIR)/latex all-pdf
27 | 	#         ^^^
28 | 	cp $(PDFBUILDDIR)/latex/*.pdf $(PDF)
29 | 	#^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
30 | 	@echo "pdflatex finished; see $(PDF)"
31 | 
32 | buildandcommithtml: html
33 | 
34 | 	cd $(BUILDDIR)/html; git add . ; git commit -m "rebuilt docs"; git push origin gh-pages
35 | 


--------------------------------------------------------------------------------
/docs/source/_images/Thumbs.db:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/_images/Thumbs.db


--------------------------------------------------------------------------------
/docs/source/_images/besca_outline.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/_images/besca_outline.jpg


--------------------------------------------------------------------------------
/docs/source/_static/css/custom.css:
--------------------------------------------------------------------------------
/* Images inside elements with the class "rst-content": never wider than
   their container (max-width) and displayed at half size (zoom).
   NOTE(review): `zoom` may not be supported by every browser - confirm. */
.rst-content img {
    max-width: 100%;
    zoom: 50%;
}


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_filtering_plots_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_filtering_plots_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_002.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_002.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_003.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_003.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_004.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_celltype_quantification_004.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_filtering_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_filtering_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_002.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_002.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_003.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_003.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_004.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_004.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_005.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_qc_005.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_002.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_002.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_003.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_003.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/thumb/sphx_glr_filtering_plots_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/thumb/sphx_glr_filtering_plots_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_celltype_quantification_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_celltype_quantification_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_filtering_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_filtering_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_qc_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_qc_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_split_gene_expression_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/plotting/images/thumb/sphx_glr_plot_split_gene_expression_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_celltype_quantification.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "code",
  5 |    "execution_count": null,
  6 |    "metadata": {
  7 |     "collapsed": false
  8 |    },
  9 |    "outputs": [],
 10 |    "source": [
 11 |     "%matplotlib inline"
 12 |    ]
 13 |   },
 14 |   {
 15 |    "cell_type": "markdown",
 16 |    "metadata": {},
 17 |    "source": [
 18 |     "\n",
 19 |     "# Visualize cell fractions\n",
 20 |     "\n",
 21 |     "This example demonstrates how to generate celltype quantification plots. These types of plots \n",
 22 |     "can be used to visually represent the number of cells that belong to a certain subset or condition.\n"
 23 |    ]
 24 |   },
 25 |   {
 26 |    "cell_type": "code",
 27 |    "execution_count": null,
 28 |    "metadata": {
 29 |     "collapsed": false
 30 |    },
 31 |    "outputs": [],
 32 |    "source": [
 33 |     "import besca as bc \n",
 34 |     "\n",
 35 |     "#import dataset to workwith\n",
 36 |     "adata = bc.datasets.Peng2019_processed()"
 37 |    ]
 38 |   },
 39 |   {
 40 |    "cell_type": "markdown",
 41 |    "metadata": {},
 42 |    "source": [
 43 |     "quantify specific celllabels as a stacked barplot\n",
 44 |     "\n"
 45 |    ]
 46 |   },
 47 |   {
 48 |    "cell_type": "code",
 49 |    "execution_count": null,
 50 |    "metadata": {
 51 |     "collapsed": false
 52 |    },
 53 |    "outputs": [],
 54 |    "source": [
 55 |     "bc.pl.celllabel_quant_stackedbar(adata, count_variable = 'Cell_type', subset_variable = 'Patient')"
 56 |    ]
 57 |   },
 58 |   {
 59 |    "cell_type": "markdown",
 60 |    "metadata": {},
 61 |    "source": [
 62 |     "quantify number of cells belong to each condition in a specific subset\n",
 63 |     "\n",
 64 |     "here each dot represents one Patient, the boxplots are grouped according to tissue type (Normal or Tumoral)\n",
 65 |     "\n"
 66 |    ]
 67 |   },
 68 |   {
 69 |    "cell_type": "code",
 70 |    "execution_count": null,
 71 |    "metadata": {
 72 |     "collapsed": false
 73 |    },
 74 |    "outputs": [],
 75 |    "source": [
 76 |     "bc.pl.celllabel_quant_boxplot(adata, count_variable = 'Cell_type', subset_variable = 'Patient', condition_identifier = 'Type',  plot_percentage = True)"
 77 |    ]
 78 |   },
 79 |   {
 80 |    "cell_type": "markdown",
 81 |    "metadata": {},
 82 |    "source": [
 83 |     "here you can also choose to plot total counts instead of percentages\n",
 84 |     "\n"
 85 |    ]
 86 |   },
 87 |   {
 88 |    "cell_type": "code",
 89 |    "execution_count": null,
 90 |    "metadata": {
 91 |     "collapsed": false
 92 |    },
 93 |    "outputs": [],
 94 |    "source": [
 95 |     "bc.pl.celllabel_quant_boxplot(adata, count_variable = 'Cell_type', subset_variable = 'Patient', condition_identifier = 'Type',  plot_percentage = False)"
 96 |    ]
 97 |   }
 98 |  ],
 99 |  "metadata": {
100 |   "kernelspec": {
101 |    "display_name": "Python 3",
102 |    "language": "python",
103 |    "name": "python3"
104 |   },
105 |   "language_info": {
106 |    "codemirror_mode": {
107 |     "name": "ipython",
108 |     "version": 3
109 |    },
110 |    "file_extension": ".py",
111 |    "mimetype": "text/x-python",
112 |    "name": "python",
113 |    "nbconvert_exporter": "python",
114 |    "pygments_lexer": "ipython3",
115 |    "version": "3.7.8"
116 |   }
117 |  },
118 |  "nbformat": 4,
119 |  "nbformat_minor": 0
120 | }
121 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_celltype_quantification.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Visualize cell fractions
 3 | ========================
 4 | 
 5 | This example demonstrates how to generate celltype quantification plots. These types of plots 
 6 | can be used to visually represent the number of cells that belong to a certain subset or condition.
 7 | 
 8 | """
 9 | 
10 | import besca as bc 
11 | 
12 | #import dataset to work with
13 | adata = bc.datasets.Peng2019_processed()
14 | 
15 | #####################
16 | #quantify specific celllabels as a stacked barplot
17 | 
18 | bc.pl.celllabel_quant_stackedbar(adata, count_variable = 'Cell_type', subset_variable = 'Patient')
19 | 
20 | 
21 | #####################
22 | # quantify the number of cells belonging to each condition in a specific subset
23 | #
24 | # here each dot represents one Patient, the boxplots are grouped according to tissue type (Normal or Tumoral)
25 | bc.pl.celllabel_quant_boxplot(adata, count_variable = 'Cell_type', subset_variable = 'Patient', condition_identifier = 'Type',  plot_percentage = True)
26 | 
27 | #####################
28 | # here you can also choose to plot total counts instead of percentages
29 | bc.pl.celllabel_quant_boxplot(adata, count_variable = 'Cell_type', subset_variable = 'Patient', condition_identifier = 'Type',  plot_percentage = False)


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_celltype_quantification.py.md5:
--------------------------------------------------------------------------------
1 | bf8788d314eaf4b64d62c64e6a0c2395


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_filtering.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "code",
 5 |    "execution_count": null,
 6 |    "metadata": {
 7 |     "collapsed": false
 8 |    },
 9 |    "outputs": [],
10 |    "source": [
11 |     "%matplotlib inline"
12 |    ]
13 |   },
14 |   {
15 |    "cell_type": "markdown",
16 |    "metadata": {},
17 |    "source": [
18 |     "\n",
19 |     "# filtering functions\n",
20 |     "\n",
21 |     "This example shows you how to generate plots to visualize the chosen filter threshold.\n",
22 |     "This way you can easily check (visually) if your chosen threshold is a good one.\n"
23 |    ]
24 |   },
25 |   {
26 |    "cell_type": "code",
27 |    "execution_count": null,
28 |    "metadata": {
29 |     "collapsed": false
30 |    },
31 |    "outputs": [],
32 |    "source": [
33 |     "import besca as bc \n",
34 |     "import matplotlib.pyplot as plt\n",
35 |     "\n",
36 |     "adata = bc.datasets.pbmc3k_raw()\n",
37 |     "\n",
38 |     "#define thresholds\n",
39 |     "min_genes = 600\n",
40 |     "min_cells = 2\n",
41 |     "min_UMI = 600\n",
42 |     "max_UMI = 6500\n",
43 |     "max_mito = 0.05\n",
44 |     "max_genes = 1900\n",
45 |     "\n",
46 |     "#Visualize filtering thresholds\n",
47 |     "fig, ((ax1, ax2, ax3), (ax4, ax5, ax6))= plt.subplots(ncols=3, nrows=2)\n",
48 |     "fig.set_figwidth(15)\n",
49 |     "fig.set_figheight(8)\n",
50 |     "fig.tight_layout(pad=4.5)\n",
51 |     "\n",
52 |     "bc.pl.kp_genes(adata, min_genes=min_genes, ax = ax1)\n",
53 |     "bc.pl.kp_cells(adata, min_cells=min_cells, ax = ax2)\n",
54 |     "bc.pl.kp_counts(adata, min_counts=min_UMI, ax = ax3)\n",
55 |     "bc.pl.max_counts(adata, max_counts=max_UMI, ax = ax4)\n",
56 |     "bc.pl.max_mito(adata, max_mito=max_mito, annotation_type='SYMBOL', species='human', ax = ax5)\n",
57 |     "bc.pl.max_genes(adata, max_genes=max_genes, ax = ax6)"
58 |    ]
59 |   }
60 |  ],
61 |  "metadata": {
62 |   "kernelspec": {
63 |    "display_name": "Python 3",
64 |    "language": "python",
65 |    "name": "python3"
66 |   },
67 |   "language_info": {
68 |    "codemirror_mode": {
69 |     "name": "ipython",
70 |     "version": 3
71 |    },
72 |    "file_extension": ".py",
73 |    "mimetype": "text/x-python",
74 |    "name": "python",
75 |    "nbconvert_exporter": "python",
76 |    "pygments_lexer": "ipython3",
77 |    "version": "3.7.8"
78 |   }
79 |  },
80 |  "nbformat": 4,
81 |  "nbformat_minor": 0
82 | }
83 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_filtering.py:
--------------------------------------------------------------------------------
 1 | """
 2 | filtering functions
 3 | ===================
 4 | 
 5 | This example shows you how to generate plots to visualize the chosen filter threshold.
 6 | This way you can easily check (visually) if your chosen threshold is a good one.
 7 | 
 8 | """
 9 | 
10 | import besca as bc 
11 | import matplotlib.pyplot as plt
12 | 
13 | adata = bc.datasets.pbmc3k_raw()
14 | 
15 | #define thresholds
16 | min_genes = 600
17 | min_cells = 2
18 | min_UMI = 600
19 | max_UMI = 6500
20 | max_mito = 0.05
21 | max_genes = 1900
22 | 
23 | #Visualize filtering thresholds
24 | fig, ((ax1, ax2, ax3), (ax4, ax5, ax6))= plt.subplots(ncols=3, nrows=2)
25 | fig.set_figwidth(15)
26 | fig.set_figheight(8)
27 | fig.tight_layout(pad=4.5)
28 | 
29 | bc.pl.kp_genes(adata, min_genes=min_genes, ax = ax1)
30 | bc.pl.kp_cells(adata, min_cells=min_cells, ax = ax2)
31 | bc.pl.kp_counts(adata, min_counts=min_UMI, ax = ax3)
32 | bc.pl.max_counts(adata, max_counts=max_UMI, ax = ax4)
33 | bc.pl.max_mito(adata, max_mito=max_mito, annotation_type='SYMBOL', species='human', ax = ax5)
34 | bc.pl.max_genes(adata, max_genes=max_genes)
35 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_filtering.py.md5:
--------------------------------------------------------------------------------
1 | 8d21e61fdaa7bb6b6aa4be744fc136ef


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_qc.py:
--------------------------------------------------------------------------------
 1 | """
 2 | quality control plots
 3 | =====================
 4 | 
 5 | This example shows you the inbuilt quality control plots from besca.
 6 | 
 7 | """
 8 | 
 9 | #import libraries
10 | import besca as bc
11 | import matplotlib.pyplot as plt
12 | 
13 | ###############################################################################
14 | #
15 | # Before beginning any analysis it is useful to take a detailed look at your dataset
16 | # to get an understanding for its characteristics.
17 | 
18 | #import data
19 | adata = bc.datasets.pbmc3k_raw()
20 | 
21 | ###############################################################################
22 | # transcript capture efficiency
23 | # -----------------------------
24 | #
25 | # Plotting the transcript capture efficiency will give you an overview of the expression
26 | # of genes within cells relative to the total UMI counts.
27 | 
28 | #transcript capture efficiency
29 | fig, ax = plt.subplots(1)
30 | fig.set_figwidth(8)
31 | fig.set_figheight(5)
32 | fig.tight_layout()
33 | 
34 | bc.pl.transcript_capture_efficiency(adata,ax=ax)
35 | 
36 | ###############################################################################
37 | # overview of library size unprocessed
38 | # ------------------------------------
39 | #
40 | # This gives you an overview of the read distribution per cell. High quality cells
41 | # will have a larger number of reads per cell and this is a parameter you can use to 
42 | # filter out low quality cells. The number of reads you would expect per cell is strongly
43 | # dependent on the single-cell sequencing method you used.
44 | 
45 | bc.pl.librarysize_overview(adata)
46 | 
47 | ###############################################################################
48 | # most strongly expressed transcripts
49 | # -----------------------------------
50 | #
51 | # This will let you identify the genes which dominate your experiment
52 | # (generally you would expect mitochondrial and ribosomal genes, 
53 | # in this dataset these genes have been removed beforehand).
54 | 
55 | bc.pl.top_genes_counts(adata=adata, top_n=25)
56 | 
57 | ###############################################################################
58 | # visualize the processed dataset
59 | # -------------------------------
60 | #
61 | # After performing your filtering it is generally a good idea to take another look
62 | # at your dataset to ensure that the filtering parameters used were reasonable.
63 | 
64 | adata = bc.datasets.pbmc3k_processed()
65 | 
66 | ###############################################################################
67 | #
68 | # Please note that the displayed counts have already been scaled. You would now expect
69 | # a more or less normal distribution of library size within your dataset.
70 | 
71 | bc.pl.librarysize_overview(adata)
72 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_qc.py.md5:
--------------------------------------------------------------------------------
1 | b59ebc73f10824c5f3943c68687a2961


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_riverplot.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "code",
 5 |    "execution_count": null,
 6 |    "metadata": {
 7 |     "collapsed": false
 8 |    },
 9 |    "outputs": [],
10 |    "source": [
11 |     "%matplotlib inline"
12 |    ]
13 |   },
14 |   {
15 |    "cell_type": "markdown",
16 |    "metadata": {},
17 |    "source": [
18 |     "\n",
19 |     "# Comparing categorical variable\n",
20 |     "\n",
21 |     "This example shows you how to generate riverplots to compare categorical columns, \n",
22 |     "for example to compare multiple annotations.\n",
23 |     "This way you can easily check (visually) for discrepancies.\n"
24 |    ]
25 |   },
26 |   {
27 |    "cell_type": "code",
28 |    "execution_count": null,
29 |    "metadata": {
30 |     "collapsed": false
31 |    },
32 |    "outputs": [],
33 |    "source": [
34 |     "import besca as bc \n",
35 |     "\n",
36 |     "#import data\n",
37 |     "adata = bc.datasets.Baron2016_processed()"
38 |    ]
39 |   },
40 |   {
41 |    "cell_type": "markdown",
42 |    "metadata": {},
43 |    "source": [
44 |     "## compare two categories: annotations made by different annotators\n",
45 |     "\n"
46 |    ]
47 |   },
48 |   {
49 |    "cell_type": "code",
50 |    "execution_count": null,
51 |    "metadata": {
52 |     "collapsed": false
53 |    },
54 |    "outputs": [],
55 |    "source": [
56 |     "bc.pl.riverplot_2categories(adata,  [ 'assigned_cluster', 'celltype2'])"
57 |    ]
58 |   }
59 |  ],
60 |  "metadata": {
61 |   "kernelspec": {
62 |    "display_name": "Python 3",
63 |    "language": "python",
64 |    "name": "python3"
65 |   },
66 |   "language_info": {
67 |    "codemirror_mode": {
68 |     "name": "ipython",
69 |     "version": 3
70 |    },
71 |    "file_extension": ".py",
72 |    "mimetype": "text/x-python",
73 |    "name": "python",
74 |    "nbconvert_exporter": "python",
75 |    "pygments_lexer": "ipython3",
76 |    "version": "3.7.8"
77 |   }
78 |  },
79 |  "nbformat": 4,
80 |  "nbformat_minor": 0
81 | }
82 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_riverplot.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Comparing categorical variable
 3 | ==============================
 4 | 
 5 | This example shows you how to generate riverplots to compare categorical columns, 
 6 | for example to compare multiple annotations.
 7 | This way you can easily check (visually) for discrepancies.
 8 | 
 9 | """
10 | 
11 | 
12 | import besca as bc 
13 | 
14 | #import data
15 | adata = bc.datasets.Baron2016_processed()
16 | 
17 | ###############################################################################
18 | # compare two categories: annotations made by different annotators
19 | # ----------------------------------------------------------------
20 | 
21 | 
22 | bc.pl.riverplot_2categories(adata,  [ 'assigned_cluster', 'celltype2'])
23 | 
24 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_riverplot.py.md5:
--------------------------------------------------------------------------------
1 | 12264720b98b8e19d525fc5488981ac7


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_split_gene_expression.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "code",
  5 |    "execution_count": null,
  6 |    "metadata": {
  7 |     "collapsed": false
  8 |    },
  9 |    "outputs": [],
 10 |    "source": [
 11 |     "%matplotlib inline"
 12 |    ]
 13 |   },
 14 |   {
 15 |    "cell_type": "markdown",
 16 |    "metadata": {},
 17 |    "source": [
 18 |     "\n",
 19 |     "# plotting gene expression\n",
 20 |     "\n",
 21 |     "This example shows you some of the different plots you can use to plot gene expression.\n"
 22 |    ]
 23 |   },
 24 |   {
 25 |    "cell_type": "code",
 26 |    "execution_count": null,
 27 |    "metadata": {
 28 |     "collapsed": false
 29 |    },
 30 |    "outputs": [],
 31 |    "source": [
 32 |     "import besca as bc\n",
 33 |     "\n",
 34 |     "#import data\n",
 35 |     "adata = bc.datasets.Haber2017_processed()"
 36 |    ]
 37 |   },
 38 |   {
 39 |    "cell_type": "markdown",
 40 |    "metadata": {},
 41 |    "source": [
 42 |     "## compare two conditions\n",
 43 |     "\n",
 44 |     "You can use the split violin plot to compare gene expression for two different conditions.\n",
 45 |     "\n"
 46 |    ]
 47 |   },
 48 |   {
 49 |    "cell_type": "code",
 50 |    "execution_count": null,
 51 |    "metadata": {
 52 |     "collapsed": false
 53 |    },
 54 |    "outputs": [],
 55 |    "source": [
 56 |     "bc.pl.gene_expr_split(adata, genes = ['Defa24', 'Gm15284'], split_variable='donor')"
 57 |    ]
 58 |   },
 59 |   {
 60 |    "cell_type": "markdown",
 61 |    "metadata": {},
 62 |    "source": [
 63 |     "use a stacked split violin plot to compare this for several genes at the same time\n",
 64 |     "\n"
 65 |    ]
 66 |   },
 67 |   {
 68 |    "cell_type": "code",
 69 |    "execution_count": null,
 70 |    "metadata": {
 71 |     "collapsed": false
 72 |    },
 73 |    "outputs": [],
 74 |    "source": [
 75 |     "bc.pl.gene_expr_split_stacked(adata=adata, genes=['Defa24', 'Gm15284'], split_variable='donor', subset_variable = 'region')"
 76 |    ]
 77 |   }
 78 |  ],
 79 |  "metadata": {
 80 |   "kernelspec": {
 81 |    "display_name": "Python 3",
 82 |    "language": "python",
 83 |    "name": "python3"
 84 |   },
 85 |   "language_info": {
 86 |    "codemirror_mode": {
 87 |     "name": "ipython",
 88 |     "version": 3
 89 |    },
 90 |    "file_extension": ".py",
 91 |    "mimetype": "text/x-python",
 92 |    "name": "python",
 93 |    "nbconvert_exporter": "python",
 94 |    "pygments_lexer": "ipython3",
 95 |    "version": "3.7.8"
 96 |   }
 97 |  },
 98 |  "nbformat": 4,
 99 |  "nbformat_minor": 0
100 | }
101 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_split_gene_expression.py:
--------------------------------------------------------------------------------
 1 | """
 2 | plotting gene expression
 3 | ========================
 4 | 
 5 | This example shows you some of the different plots you can use to plot gene expression.
 6 | 
 7 | """
 8 | import besca as bc
 9 | 
10 | #import data
11 | adata = bc.datasets.Haber2017_processed()
12 | 
13 | ###############################################################################
14 | # compare two conditions
15 | # ----------------------
16 | #
17 | # You can use the split violin plot to compare gene expression for two different conditions.
18 | 
19 | bc.pl.gene_expr_split(adata, genes = ['Defa24', 'Gm15284'], split_variable='donor')
20 | 
21 | ###############################################################################
22 | #
23 | # use a stacked split violin plot to compare this for several genes at the same time
24 | 
25 | bc.pl.gene_expr_split_stacked(adata=adata, genes=['Defa24', 'Gm15284'], split_variable='donor', subset_variable = 'region')


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_split_gene_expression.py.md5:
--------------------------------------------------------------------------------
1 | b903c3b8d5c94c0edcf0126c05080776


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/plot_split_gene_expression.rst:
--------------------------------------------------------------------------------
  1 | .. only:: html
  2 | 
  3 |     .. note::
  4 |         :class: sphx-glr-download-link-note
  5 | 
  6 |         Click :ref:`here <sphx_glr_download_auto_examples_plotting_plot_split_gene_expression.py>`     to download the full example code
  7 |     .. rst-class:: sphx-glr-example-title
  8 | 
  9 |     .. _sphx_glr_auto_examples_plotting_plot_split_gene_expression.py:
 10 | 
 11 | 
 12 | plotting gene expression
 13 | ========================
 14 | 
 15 | This example shows you some of the different plots you can use to plot gene expression.
 16 | 
 17 | 
 18 | .. code-block:: default
 19 | 
 20 |     import besca as bc
 21 | 
 22 |     #import data
 23 |     adata = bc.datasets.Haber2017_processed()
 24 | 
 25 | 
 26 | 
 27 | 
 28 | 
 29 | 
 30 | 
 31 | 
 32 | compare two conditions
 33 | ----------------------
 34 | 
 35 | You can use the split violin plot to compare gene expression for two different conditions.
 36 | 
 37 | 
 38 | .. code-block:: default
 39 | 
 40 | 
 41 |     bc.pl.gene_expr_split(adata, genes = ['Defa24', 'Gm15284'], split_variable='donor')
 42 | 
 43 | 
 44 | 
 45 | 
 46 | .. image:: /auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_001.png
 47 |     :alt: plot split gene expression
 48 |     :class: sphx-glr-single-img
 49 | 
 50 | 
 51 | .. rst-class:: sphx-glr-script-out
 52 | 
 53 |  Out:
 54 | 
 55 |  .. code-block:: none
 56 | 
 57 |     /pstore/home/julienla/.local/lib/python3.7/site-packages/anndata/_core/anndata.py:1094: FutureWarning:
 58 | 
 59 |     is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead
 60 | 
 61 | 
 62 | 
 63 | 
 64 | 
 65 | use a stacked split violin plot to compare this for several genes at the same time
 66 | 
 67 | 
 68 | .. code-block:: default
 69 | 
 70 | 
 71 |     bc.pl.gene_expr_split_stacked(adata=adata, genes=['Defa24', 'Gm15284'], split_variable='donor', subset_variable = 'region')
 72 | 
 73 | 
 74 | .. image:: /auto_examples/plotting/images/sphx_glr_plot_split_gene_expression_002.png
 75 |     :alt: plot split gene expression
 76 |     :class: sphx-glr-single-img
 77 | 
 78 | 
 79 | .. rst-class:: sphx-glr-script-out
 80 | 
 81 |  Out:
 82 | 
 83 |  .. code-block:: none
 84 | 
 85 |     /pstore/home/julienla/.local/lib/python3.7/site-packages/anndata/_core/anndata.py:1094: FutureWarning:
 86 | 
 87 |     is_categorical is deprecated and will be removed in a future version.  Use is_categorical_dtype instead
 88 | 
 89 |     merging a total of  3  datasubset
 90 | 
 91 |     <Figure size 640x480 with 2 Axes>
 92 | 
 93 | 
 94 | 
 95 | 
 96 | .. rst-class:: sphx-glr-timing
 97 | 
 98 |    **Total running time of the script:** ( 0 minutes  27.807 seconds)
 99 | 
100 | 
101 | .. _sphx_glr_download_auto_examples_plotting_plot_split_gene_expression.py:
102 | 
103 | 
104 | .. only :: html
105 | 
106 |  .. container:: sphx-glr-footer
107 |     :class: sphx-glr-footer-example
108 | 
109 | 
110 | 
111 |   .. container:: sphx-glr-download sphx-glr-download-python
112 | 
113 |      :download:`Download Python source code: plot_split_gene_expression.py <plot_split_gene_expression.py>`
114 | 
115 | 
116 | 
117 |   .. container:: sphx-glr-download sphx-glr-download-jupyter
118 | 
119 |      :download:`Download Jupyter notebook: plot_split_gene_expression.ipynb <plot_split_gene_expression.ipynb>`
120 | 
121 | 
122 | .. only:: html
123 | 
124 |  .. rst-class:: sphx-glr-signature
125 | 
126 |     `Gallery generated by Sphinx-Gallery <https://sphinx-gallery.github.io>`_
127 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/plotting/sg_execution_times.rst:
--------------------------------------------------------------------------------
 1 | 
 2 | :orphan:
 3 | 
 4 | .. _sphx_glr_auto_examples_plotting_sg_execution_times:
 5 | 
 6 | Computation times
 7 | =================
 8 | **00:52.692** total execution time for **auto_examples_plotting** files:
 9 | 
10 | +--------------------------------------------------------------------------------------------------------------+-----------+--------+
11 | | :ref:`sphx_glr_auto_examples_plotting_plot_split_gene_expression.py` (``plot_split_gene_expression.py``)     | 00:27.807 | 0.0 MB |
12 | +--------------------------------------------------------------------------------------------------------------+-----------+--------+
13 | | :ref:`sphx_glr_auto_examples_plotting_plot_celltype_quantification.py` (``plot_celltype_quantification.py``) | 00:14.820 | 0.0 MB |
14 | +--------------------------------------------------------------------------------------------------------------+-----------+--------+
15 | | :ref:`sphx_glr_auto_examples_plotting_plot_qc.py` (``plot_qc.py``)                                           | 00:07.755 | 0.0 MB |
16 | +--------------------------------------------------------------------------------------------------------------+-----------+--------+
17 | | :ref:`sphx_glr_auto_examples_plotting_plot_filtering.py` (``plot_filtering.py``)                             | 00:01.581 | 0.0 MB |
18 | +--------------------------------------------------------------------------------------------------------------+-----------+--------+
19 | | :ref:`sphx_glr_auto_examples_plotting_plot_riverplot.py` (``plot_riverplot.py``)                             | 00:00.729 | 0.0 MB |
20 | +--------------------------------------------------------------------------------------------------------------+-----------+--------+
21 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_example_filtering_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_example_filtering_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_example_filtering_002.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_example_filtering_002.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_example_filtering_003.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_example_filtering_003.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_002.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_002.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_003.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_003.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_004.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_004.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_005.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/sphx_glr_plot_pca_neighbors_clustering_005.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/thumb/sphx_glr_filtering_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/thumb/sphx_glr_filtering_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/thumb/sphx_glr_plot_example_filtering_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/thumb/sphx_glr_plot_example_filtering_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/images/thumb/sphx_glr_plot_pca_neighbors_clustering_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/preprocessing/images/thumb/sphx_glr_plot_pca_neighbors_clustering_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/plot_example_filtering.py:
--------------------------------------------------------------------------------
 1 | """
 2 | performing filtering using besca
 3 | ================================
 4 | 
 5 | This example demonstrates the entire process of filtering out cells/genes of subpar quality
 6 | before proceeding with analysis. 
 7 | 
 8 | """
 9 | 
10 | import besca as bc
11 | import scanpy as sc
12 | import matplotlib.pyplot as plt
13 | 
14 | #load example dataset
15 | adata = bc.datasets.pbmc3k_raw()
16 | 
17 | #set standard filtering parameters
18 | min_genes = 600
19 | min_cells = 2
20 | min_UMI = 600
21 | max_UMI = 6500
22 | max_mito = 0.05
23 | max_genes = 1900
24 | 
25 | ###############################################################################
26 | # visualization of thresholds
27 | # ---------------------------
28 | #
29 | # First the chosen thresholds are visualized to ensure that a suitable cutoff has been chosen.
30 | 
31 | #Visualize filtering thresholds
32 | fig, ((ax1, ax2, ax3), (ax4, ax5, ax6))= plt.subplots(ncols=3, nrows=2)
33 | fig.set_figwidth(15)
34 | fig.set_figheight(8)
35 | fig.tight_layout(pad=4.5)
36 | 
37 | bc.pl.kp_genes(adata, min_genes=min_genes, ax = ax1)
38 | bc.pl.kp_cells(adata, min_cells=min_cells, ax = ax2)
39 | bc.pl.kp_counts(adata, min_counts=min_UMI, ax = ax3)
40 | bc.pl.max_counts(adata, max_counts=max_UMI, ax = ax4)
41 | bc.pl.max_mito(adata, max_mito=max_mito, annotation_type='SYMBOL', species='human', ax = ax5)
42 | bc.pl.max_genes(adata, max_genes=max_genes)
43 | 
44 | ###############################################################################
45 | # application of filtering thresholds
46 | # -----------------------------------
47 | #
48 | # Using the chosen thresholds the data is filtered. Before and after filtering results are depicted to compare.
49 | 
50 | #visualize data before filtering
51 | sc.pl.violin(adata, ['n_counts', 'n_genes', 'percent_mito'], multi_panel=True, jitter = 0.4)
52 | 
53 | print('The AnnData object currently contains:', str(adata.shape[0]), 'cells and', str(adata.shape[1]), 'genes')
54 | print(adata)
55 | 
56 | #perform filtering
57 | adata = bc.pp.filter(adata, max_counts=max_UMI, max_genes=max_genes, max_mito=max_mito,min_genes=min_genes, min_counts=min_UMI, min_cells=min_cells)
58 | 
59 | #visualize data after filtering
60 | sc.pl.violin(adata, ['n_counts', 'n_genes', 'percent_mito'], multi_panel=True, jitter = 0.4)
61 | 
62 | print('The AnnData object now contains:', str(adata.shape[0]), 'cells and', str(adata.shape[1]), 'genes')
63 | print(adata)


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/plot_example_filtering.py.md5:
--------------------------------------------------------------------------------
1 | 53705858c847ac9c0428c4af8dfde771


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/plot_pca_neighbors_clustering.py:
--------------------------------------------------------------------------------
 1 | """
 2 | cluster generation
 3 | ==================
 4 | 
 5 | This example demonstrates how to perform highly variable gene selection, PCA, nearest neighbor calculation, and clustering.
 6 | 
 7 | """
 8 | 
 9 | import besca as bc
10 | import scanpy as sc
11 | 
12 | #import example dataset that has previously been filtered
13 | adata = bc.datasets.pbmc3k_filtered()
14 | ## We get the raw matrix containing all the initial genes, keeping the filtering on the cells
15 | adata = bc.get_raw(adata)
16 | 
17 | ###############################################################################
18 | # highly variable gene selection
19 | # ------------------------------
20 | #
21 | # select highly variable genes (considers correction for gene expression level)
22 | 
23 | #define thresholds for highly variable genes
24 | variable_genes_min_mean = 0.01
25 | variable_genes_max_mean = 5
26 | variable_genes_min_disp = 0.4
27 | 
28 | #identify genes with variable expression
29 | filter_result = sc.pp.filter_genes_dispersion(adata.X, min_mean=variable_genes_min_mean, max_mean=variable_genes_max_mean, min_disp=variable_genes_min_disp) 
30 | sc.pl.filter_genes_dispersion(filter_result)
31 | nbr_variable_genes = sum(filter_result.gene_subset)
32 | print('number of variable genes selected ', nbr_variable_genes )
33 | 
34 | #perform the actual filtering
35 | adata = adata[:, filter_result.gene_subset]
36 | 
37 | ###############################################################################
38 | # set random seed
39 | # ---------------
40 | # To get reproducible results you need to define a random seed for all of the stochastic
41 | # processes, e.g. PCA, neighbors, clustering, UMAP and t-SNE.
42 | 
43 | #set random seed
44 | random_seed = 0
45 | 
46 | ###############################################################################
47 | # PCA
48 | # ---
49 | 
50 | #log transform our data (is easier to work with numbers like this)
51 | sc.pp.log1p(adata)
52 | 
53 | # Scale data to unit variance and zero mean, and cut-off at max value 10
54 | sc.pp.scale(adata, max_value=10) 
55 | 
56 | #calculate 50 principal components of the dataset
57 | sc.tl.pca(adata, random_state=random_seed, svd_solver='arpack')
58 | 
59 | #visualize the amount of variance explained by each PC
60 | sc.pl.pca_variance_ratio(adata)
61 | 
62 | #visualize the loadings onto the first 3 PCs
63 | sc.pl.pca_loadings(adata)
64 | 
65 | ###############################################################################
66 | # nearest neighbors
67 | # -----------------
68 | 
69 | sc.pp.neighbors(adata, n_neighbors=15, random_state = random_seed, n_pcs=50)
70 | 
71 | ###############################################################################
72 | # leiden clustering
73 | # -----------------
74 | 
75 | sc.tl.leiden(adata, random_state=random_seed)
76 | 
77 | ###############################################################################
78 | # UMAP and t-SNE generation
79 | # -------------------------
80 | 
81 | #calculate UMAP
82 | sc.tl.umap(adata, random_state = random_seed)
83 | 
84 | #calculate t-SNE
85 | sc.tl.tsne(adata, random_state = random_seed)
86 | 
87 | ###############################################################################
88 | # visualize the results
89 | # ---------------------
90 | 
91 | sc.pl.umap(adata, color = ['leiden'])
92 | sc.pl.tsne(adata, color = ['leiden'])
93 | 
94 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/plot_pca_neighbors_clustering.py.md5:
--------------------------------------------------------------------------------
1 | 50b70d169ccc94f0721ac725d7102338


--------------------------------------------------------------------------------
/docs/source/auto_examples/preprocessing/sg_execution_times.rst:
--------------------------------------------------------------------------------
 1 | 
 2 | :orphan:
 3 | 
 4 | .. _sphx_glr_auto_examples_preprocessing_sg_execution_times:
 5 | 
 6 | Computation times
 7 | =================
 8 | **41:07.887** total execution time for **auto_examples_preprocessing** files:
 9 | 
10 | +---------------------------------------------------------------------------------------------------------------------+-----------+--------+
11 | | :ref:`sphx_glr_auto_examples_preprocessing_plot_pca_neighbors_clustering.py` (``plot_pca_neighbors_clustering.py``) | 41:07.887 | 0.0 MB |
12 | +---------------------------------------------------------------------------------------------------------------------+-----------+--------+
13 | | :ref:`sphx_glr_auto_examples_preprocessing_plot_example_filtering.py` (``plot_example_filtering.py``)               | 00:00.000 | 0.0 MB |
14 | +---------------------------------------------------------------------------------------------------------------------+-----------+--------+
15 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/images/sphx_glr_plot_reclustering_function_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/tools/images/sphx_glr_plot_reclustering_function_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/images/thumb/sphx_glr_plot_reclustering_function_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/tools/images/thumb/sphx_glr_plot_reclustering_function_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/images/thumb/sphx_glr_plot_simple_example_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/tools/images/thumb/sphx_glr_plot_simple_example_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/images/thumb/sphx_glr_simple_example_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/tools/images/thumb/sphx_glr_simple_example_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/plot_reclustering_function.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "code",
 5 |    "execution_count": null,
 6 |    "metadata": {
 7 |     "collapsed": false
 8 |    },
 9 |    "outputs": [],
10 |    "source": [
11 |     "%matplotlib inline"
12 |    ]
13 |   },
14 |   {
15 |    "cell_type": "markdown",
16 |    "metadata": {},
17 |    "source": [
18 |     "\n",
19 |     "# reclustering on specific leiden clusters\n",
20 |     "\n",
21 |     "This example demonstrates how to perform a reclustering on a selected subset of\n",
22 |     "leiden clusters. You will want to do this for example during the process of celltype\n",
23 |     "annotation, when the clusters do not have a sufficient resolution to separate\n",
24 |     "all cell types and mixed cell populations still exist.\n"
25 |    ]
26 |   },
27 |   {
28 |    "cell_type": "code",
29 |    "execution_count": null,
30 |    "metadata": {
31 |     "collapsed": false
32 |    },
33 |    "outputs": [],
34 |    "source": [
35 |     "import besca as bc\n",
36 |     "import scanpy as sc\n",
37 |     "\n",
38 |     "#load and preprocess data (here we will start from a preprocessed dataset)\n",
39 |     "adata = bc.datasets.pbmc3k_processed()\n",
40 |     "\n",
41 |     "#extract subset using the recluster function which is part of the reclustering (rc) toolkit\n",
42 |     "adata_subset = bc.tl.rc.recluster(adata, celltype=('2', '3', '4', '5', '6','8', '9', '10', '11', '12'), celltype_label = 'leiden', resolution = 1.2)\n",
43 |     "\n",
44 |     "\n",
45 |     "\n",
46 |     "\n",
47 |     "#visualize the new clusters\n",
48 |     "sc.pl.umap(adata_subset, color = ['leiden', 'CD3G', 'CD8A', 'CD4', 'IL7R', 'NKG7', 'GNLY'])\n",
49 |     "\n",
50 |     "#append new celltype labels to the subclusters.\n",
51 |     "# This is an approximate manual annotation that should be examined in more depth.\n",
52 |     "new_labels = [\"NK cell\", #0\n",
53 |     "              \"CD4 T-cell\", #1\n",
54 |     "              \"CD8 T-cell\", #2\n",
55 |     "              \"CD4 T-cell\", #3\n",
56 |     "              \"CD8 T-cell\", #4\n",
57 |     "              \"CD8 T-cell\", #5\n",
58 |     "              \"CD4 T-cell\", #6\n",
59 |     "              \"CD4 T-cell\",  #7\n",
60 |     "              \"CD4 T-cell\",  #8\n",
61 |     "              \"CD4 T-cell\",  #9\n",
62 |     "              \"CD4 T-cell\", #10\n",
63 |     "              \"CD4 T-cell\", #11\n",
64 |     "              \"CD4 T-cell\" #12\n",
65 |     "              ] #13 labels, for clusters 0-12\n",
66 |     "\n",
67 |     "#merge the labels back into the original adata object\n",
68 |     "#note this will overwrite whatever was saved in adata.obs.celltype;\n",
69 |     "#here it was not assigned yet.\n",
70 |     "bc.tl.rc.annotate_new_cellnames(adata, adata_subset, names=new_labels, new_label = 'celltype')\n",
71 |     "\n",
72 |     "print(adata.obs.celltype.value_counts())"
73 |    ]
74 |   }
75 |  ],
76 |  "metadata": {
77 |   "kernelspec": {
78 |    "display_name": "Python 3",
79 |    "language": "python",
80 |    "name": "python3"
81 |   },
82 |   "language_info": {
83 |    "codemirror_mode": {
84 |     "name": "ipython",
85 |     "version": 3
86 |    },
87 |    "file_extension": ".py",
88 |    "mimetype": "text/x-python",
89 |    "name": "python",
90 |    "nbconvert_exporter": "python",
91 |    "pygments_lexer": "ipython3",
92 |    "version": "3.7.8"
93 |   }
94 |  },
95 |  "nbformat": 4,
96 |  "nbformat_minor": 0
97 | }
98 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/plot_reclustering_function.py:
--------------------------------------------------------------------------------
 1 | """
 2 | reclustering on specific leiden clusters
 3 | ========================================
 4 | 
 5 | This example demonstrates how to perform a reclustering on a selected subset of
 6 | leiden clusters. You will want to do this for example during the process of celltype
 7 | annotation, when the clusters do not have a sufficient resolution to separate
 8 | all cell types and mixed cell populations still exist.
 9 | 
10 | """
11 | 
12 | import besca as bc
13 | import scanpy as sc
14 | 
15 | #load and preprocess data (here we will start from a preprocessed dataset)
16 | adata = bc.datasets.pbmc3k_processed()
17 | 
18 | #extract subset using the recluster function which is part of the reclustering (rc) toolkit
19 | adata_subset = bc.tl.rc.recluster(adata, celltype=('2', '3', '4', '5', '6','8', '9', '10', '11', '12'), celltype_label = 'leiden', resolution = 1.2)
20 | 
21 | 
22 | 
23 | 
24 | #visualize the new clusters
25 | sc.pl.umap(adata_subset, color = ['leiden', 'CD3G', 'CD8A', 'CD4', 'IL7R', 'NKG7', 'GNLY'])
26 | 
27 | #append new celltype labels to the subclusters.
28 | # This is an approximate manual annotation that should be examined in more depth.
29 | new_labels = ["NK cell", #0
30 |               "CD4 T-cell", #1
31 |               "CD8 T-cell", #2
32 |               "CD4 T-cell", #3
33 |               "CD8 T-cell", #4
34 |               "CD8 T-cell", #5
35 |               "CD4 T-cell", #6
36 |               "CD4 T-cell",  #7
37 |               "CD4 T-cell",  #8
38 |               "CD4 T-cell",  #9
39 |               "CD4 T-cell", #10
40 |               "CD4 T-cell", #11
41 |               "CD4 T-cell" #12
42 |               ] #13 labels, for clusters 0-12
43 | 
44 | #merge the labels back into the original adata object
45 | #note this will overwrite whatever was saved in adata.obs.celltype;
46 | #here it was not assigned yet.
47 | bc.tl.rc.annotate_new_cellnames(adata, adata_subset, names=new_labels, new_label = 'celltype')
48 | 
49 | print(adata.obs.celltype.value_counts())
50 | 
51 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/plot_reclustering_function.py.md5:
--------------------------------------------------------------------------------
1 | 1f8fcaca11e7c195060e7a50e03d12e3


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/sg_execution_times.rst:
--------------------------------------------------------------------------------
 1 | 
 2 | :orphan:
 3 | 
 4 | .. _sphx_glr_auto_examples_tools_sg_execution_times:
 5 | 
 6 | Computation times
 7 | =================
 8 | **00:13.716** total execution time for **auto_examples_tools** files:
 9 | 
10 | +-------------------------------------------------------------------------------------------------------+-----------+--------+
11 | | :ref:`sphx_glr_auto_examples_tools_plot_reclustering_function.py` (``plot_reclustering_function.py``) | 00:13.716 | 0.0 MB |
12 | +-------------------------------------------------------------------------------------------------------+-----------+--------+
13 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/tools/tt_plot_reclustering_function.py:
--------------------------------------------------------------------------------
 1 | """
 2 | reclustering on specific leiden clusters
 3 | =========================================
 4 | 
 5 | This example demonstrates how to perform a reclustering on a selected subset of
 6 | leiden clusters. You will want to do this for example during the process of celltype
 7 | annotation, when the leiden clusters do not have a sufficient resolution to separate
 8 | all cell types and mixed cell populations still exist.
 9 | 
10 | """
11 | 
12 | import besca as bc
13 | import scanpy as sc
14 | 
15 | #load and preprocess data (here we will start from a preprocessed dataset)
16 | adata = bc.datasets.pbmc3k_processed()
17 | 
18 | #extract subset using the recluster function which is part of the reclustering (rc) toolkit
19 | adata_subset = bc.tl.rc.recluster(adata, celltype=('CD4-positive, alpha-beta T cell', 'CD8-positive, alpha-beta T cell'), celltype_label = 'celltype2', resolution = 1)
20 | 
21 | #visualize the new clusters
22 | sc.pl.umap(adata_subset, color = ['leiden',  'CD3G', 'CD8A', 'CD8B','CD4', 'IL7R', 'NKG7', 'GNLY'], color_map = 'viridis')
23 | 
24 | 
25 | 
26 | # We advise to go back to the annotation procedures using auto-annot/sig-annot. 
27 | # As an example here, we performed an a-priori hand annotation.
28 | 
29 | #append new celltype labels to the subclusters
30 | new_labels = ["CD4 T-cell", #0
31 |               "CD4 T-cell", #1
32 |               "CD8 T-cell", #2
33 |               "NK cell", #3
34 |               "CD8 T-cell", #4
35 |               "CD8 T-cell", #5
36 |               "CD4 T-cell",#6
37 |               "T cell" #7
38 |               ] #8 labels, for clusters 0-7
39 | 
40 | #merge the labels back into the original adata object
41 | #note this will overwrite whatever was saved in adata.obs.celltype_rc
42 | bc.tl.rc.annotate_new_cellnames(adata, adata_subset, names=new_labels, new_label = 'celltype_rc')
43 | 
44 | 
45 | print(adata.obs.celltype_rc.value_counts())
46 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_001.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_001.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_002.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_002.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_003.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_003.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_004.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_004.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_005.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_005.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_006.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_006.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_007.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_007.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_008.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_008.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_009.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_009.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_010.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/sphx_glr_plot_celltype_annotation_010.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/thumb/sphx_glr_annotate_celltypes_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/thumb/sphx_glr_annotate_celltypes_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/thumb/sphx_glr_plot_celltype_annotation_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/thumb/sphx_glr_plot_celltype_annotation_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/images/thumb/sphx_glr_plot_celltype_quantification_thumb.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/auto_examples/workflows/images/thumb/sphx_glr_plot_celltype_quantification_thumb.png


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/plot_celltype_annotation.py.md5:
--------------------------------------------------------------------------------
1 | b536781773b6d198dcaf76e506ca70cc


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/plot_celltype_quantification.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "code",
 5 |    "execution_count": 1,
 6 |    "metadata": {},
 7 |    "outputs": [],
 8 |    "source": [
 9 |     "%matplotlib inline"
10 |    ]
11 |   },
12 |   {
13 |    "cell_type": "markdown",
14 |    "metadata": {},
15 |    "source": [
16 |     "\n",
17 |     "Visualize Cell Fractions\n",
18 |     "========================\n",
19 |     "\n",
20 |     "This example demonstrates how to generate celltype quantification plots.\n",
21 |     "\n",
22 |     "\n"
23 |    ]
24 |   },
25 |   {
26 |    "cell_type": "code",
27 |    "execution_count": 2,
28 |    "metadata": {},
29 |    "outputs": [],
30 |    "source": [
31 |     "import besca as bc \n",
32 |     "\n",
33 |     "#import dataset to work with\n",
34 |     "\n",
35 |     "adata = bc.datasets.pbmc3k_processed()\n",
36 |     "\n",
37 |     "#continue with rest"
38 |    ]
39 |   }
40 |  ],
41 |  "metadata": {
42 |   "kernelspec": {
43 |    "display_name": "Python3.7 (besca_test_auto_annot)",
44 |    "language": "python",
45 |    "name": "besca_test_auto_annot"
46 |   },
47 |   "language_info": {
48 |    "codemirror_mode": {
49 |     "name": "ipython",
50 |     "version": 3
51 |    },
52 |    "file_extension": ".py",
53 |    "mimetype": "text/x-python",
54 |    "name": "python",
55 |    "nbconvert_exporter": "python",
56 |    "pygments_lexer": "ipython3",
57 |    "version": "3.6.7"
58 |   }
59 |  },
60 |  "nbformat": 4,
61 |  "nbformat_minor": 1
62 | }
63 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/plot_celltype_quantification.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Visualize Cell Fractions
 3 | ========================
 4 | 
 5 | This example demonstrates how to generate celltype quantification plots.
 6 | 
 7 | """
 8 | 
 9 | import besca as bc 
10 | 
11 | #import dataset to work with
12 | 
13 | adata = bc.datasets.pbmc3k_processed()
14 | 
15 | #continue with rest
16 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/plot_celltype_quantification.py.md5:
--------------------------------------------------------------------------------
1 | 29fc08b0a3c51da7c3aa97964217e2de


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/plot_celltype_quantification.rst:
--------------------------------------------------------------------------------
 1 | .. note::
 2 |     :class: sphx-glr-download-link-note
 3 | 
 4 |     Click :ref:`here <sphx_glr_download_auto_examples_workflows_plot_celltype_quantification.py>` to download the full example code
 5 | .. rst-class:: sphx-glr-example-title
 6 | 
 7 | .. _sphx_glr_auto_examples_workflows_plot_celltype_quantification.py:
 8 | 
 9 | 
10 | Visualize Cell Fractions
11 | ========================
12 | 
13 | This example demonstrates how to generate celltype quantification plots.
14 | 
15 | 
16 | 
17 | 
18 | 
19 | 
20 | 
21 | 
22 | 
23 | .. code-block:: python
24 | 
25 | 
26 |     import besca as bc 
27 | 
28 |     #import dataset to work with
29 | 
30 |     adata = bc.datasets.pbmc3k_processed()
31 | 
32 |     #continue with rest
33 | 
34 | **Total running time of the script:** ( 0 minutes  1.792 seconds)
35 | 
36 | 
37 | .. _sphx_glr_download_auto_examples_workflows_plot_celltype_quantification.py:
38 | 
39 | 
40 | .. only :: html
41 | 
42 |  .. container:: sphx-glr-footer
43 |     :class: sphx-glr-footer-example
44 | 
45 | 
46 | 
47 |   .. container:: sphx-glr-download
48 | 
49 |      :download:`Download Python source code: plot_celltype_quantification.py <plot_celltype_quantification.py>`
50 | 
51 | 
52 | 
53 |   .. container:: sphx-glr-download
54 | 
55 |      :download:`Download Jupyter notebook: plot_celltype_quantification.ipynb <plot_celltype_quantification.ipynb>`
56 | 
57 | 
58 | .. only:: html
59 | 
60 |  .. rst-class:: sphx-glr-signature
61 | 
62 |     `Gallery generated by Sphinx-Gallery <https://sphinx-gallery.readthedocs.io>`_
63 | 


--------------------------------------------------------------------------------
/docs/source/auto_examples/workflows/sg_execution_times.rst:
--------------------------------------------------------------------------------
 1 | 
 2 | :orphan:
 3 | 
 4 | .. _sphx_glr_auto_examples_workflows_sg_execution_times:
 5 | 
 6 | Computation times
 7 | =================
 8 | **00:22.833** total execution time for **auto_examples_workflows** files:
 9 | 
10 | +-------------------------------------------------------------------------------------------------------+-----------+--------+
11 | | :ref:`sphx_glr_auto_examples_workflows_plot_celltype_annotation.py` (``plot_celltype_annotation.py``) | 00:22.833 | 0.0 MB |
12 | +-------------------------------------------------------------------------------------------------------+-----------+--------+
13 | 


--------------------------------------------------------------------------------
/docs/source/bc.rst:
--------------------------------------------------------------------------------
1 | .. automodapi:: besca.pp
2 | .. automodapi:: besca.pl
3 | .. automodapi:: besca.tl
4 | .. automodapi:: besca.tl.bcor
5 | .. automodapi:: besca.tl.dge
6 | .. automodapi:: besca.tl.rc
7 | .. automodapi:: besca.Import
8 | .. automodapi:: besca.export
9 | .. automodapi:: besca.st


--------------------------------------------------------------------------------
/docs/source/bcor/besca.tl.bcor.batch_correct.rst:
--------------------------------------------------------------------------------
1 | batch_correct
2 | =============
3 | 
4 | .. currentmodule:: besca.tl.bcor
5 | 
6 | .. autofunction:: batch_correct
7 | 


--------------------------------------------------------------------------------
/docs/source/bcor/besca.tl.bcor.postprocess_mnnpy.rst:
--------------------------------------------------------------------------------
1 | postprocess_mnnpy
2 | =================
3 | 
4 | .. currentmodule:: besca.tl.bcor
5 | 
6 | .. autofunction:: postprocess_mnnpy
7 | 


--------------------------------------------------------------------------------
/docs/source/besca.rst:
--------------------------------------------------------------------------------
  1 | besca
  2 | =====
  3 | 
  4 | .. _helper-functions:
  5 | 
  6 | helper functions
  7 | ----------------
  8 | 
  9 | .. autosummary::
 10 | 	:toctree: helper_functions
 11 | 
 12 | 	besca.get_raw
 13 | 	besca.subset_adata
 14 | 	besca.convert_ensembl_to_symbol
 15 | 	besca.convert_symbol_to_ensembl
 16 | 	besca.get_raw
 17 | 	besca.get_means
 18 | 	besca.get_ameans
 19 | 	besca.concate_adata
 20 | 
 21 | .. _preprocessing-functions:
 22 | 
 23 | preprocessing
 24 | -------------
 25 | .. automodsumm:: besca.pp
 26 | 	:toctree: preprocessing
 27 | 
 28 | .. _plotting-functions:
 29 | 
 30 | plotting
 31 | --------
 32 | .. automodsumm:: besca.pl
 33 | 	:toctree: plotting
 34 | 
 35 | .. _tools-functions:
 36 | 
 37 | tools
 38 | -----
 39 | .. automodsumm:: besca.tl
 40 | 	:toctree: tools
 41 | 
 42 | .. _toolkits-functions:
 43 | 
 44 | toolkits
 45 | ^^^^^^^^
 46 | 
 47 | batch correction
 48 | ++++++++++++++++
 49 | Collection of functions to perform batch correction.
 50 | 
 51 | .. automodsumm:: besca.tl.bcor
 52 | 	:toctree: bcor
 53 | 
 54 | differential gene expression
 55 | ++++++++++++++++++++++++++++
 56 | Collection of functions to aid in differential gene expression analysis.
 57 | 
 58 | .. automodsumm:: besca.tl.dge
 59 | 	:toctree:  dge
 60 | 
 61 | signature scoring
 62 | +++++++++++++++++
 63 | Collection of functions to aid in signature scoring.
 64 | 
 65 | .. automodsumm:: besca.tl.sig
 66 |         :toctree:  sig
 67 | 
 68 | reclustering
 69 | ++++++++++++
 70 | Collection of functions to perform reclustering on selected subclusters.
 71 | 
 72 | .. automodsumm:: besca.tl.rc
 73 | 	:toctree: reclustering
 74 | 
 75 | auto-annot
 76 | ++++++++++
 77 | Collection of functions to perform auto-annot: annotating a single-cell dataset based on a reference dataset.
 78 | 
 79 | .. automodsumm:: besca.tl.auto_annot
 80 | 	:toctree: auto_annot
 81 | 
 82 | 
 83 | .. _import-functions:
 84 | 
 85 | Import
 86 | ------
 87 | .. automodsumm:: besca.Import
 88 | 	:toctree: import
 89 | 
 90 | .. _export-functions:
 91 | 
 92 | export
 93 | ------
 94 | .. automodsumm:: besca.export
 95 | 	:toctree: export
 96 | 
 97 | .. _standardworkflow-functions:
 98 | 
 99 | standardworkflow
100 | ----------------
101 | .. automodsumm:: besca.st
102 | 	:toctree: standardworkflow
103 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.Import.add_cell_labeling.rst:
--------------------------------------------------------------------------------
1 | add_cell_labeling
2 | =================
3 | 
4 | .. currentmodule:: besca.Import
5 | 
6 | .. autofunction:: add_cell_labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.Import.assert_adata.rst:
--------------------------------------------------------------------------------
1 | assert_adata
2 | ============
3 | 
4 | .. currentmodule:: besca.Import
5 | 
6 | .. autofunction:: assert_adata
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.Import.read_mtx.rst:
--------------------------------------------------------------------------------
1 | read_mtx
2 | ========
3 | 
4 | .. currentmodule:: besca.Import
5 | 
6 | .. autofunction:: read_mtx
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.X_to_mtx.rst:
--------------------------------------------------------------------------------
1 | X_to_mtx
2 | ========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: X_to_mtx
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.analysis_metadata.rst:
--------------------------------------------------------------------------------
1 | analysis_metadata
2 | =================
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: analysis_metadata
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.clustering.rst:
--------------------------------------------------------------------------------
1 | clustering
2 | ==========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: clustering
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.generate_gep.rst:
--------------------------------------------------------------------------------
1 | generate_gep
2 | ============
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: generate_gep
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.labeling.rst:
--------------------------------------------------------------------------------
1 | labeling
2 | ========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.labeling_info.rst:
--------------------------------------------------------------------------------
1 | labeling_info
2 | =============
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: labeling_info
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.pseudobulk.rst:
--------------------------------------------------------------------------------
1 | pseudobulk
2 | ==========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: pseudobulk
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.ranked_genes.rst:
--------------------------------------------------------------------------------
1 | ranked_genes
2 | ============
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: ranked_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.export.raw_to_mtx.rst:
--------------------------------------------------------------------------------
1 | raw_to_mtx
2 | ==========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: raw_to_mtx
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.box_per_ind.rst:
--------------------------------------------------------------------------------
1 | box_per_ind
2 | ===========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: box_per_ind
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.celllabel_quant_boxplot.rst:
--------------------------------------------------------------------------------
1 | celllabel_quant_boxplot
2 | =======================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: celllabel_quant_boxplot
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.celllabel_quant_stackedbar.rst:
--------------------------------------------------------------------------------
1 | celllabel_quant_stackedbar
2 | ==========================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: celllabel_quant_stackedbar
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.detected_genes.rst:
--------------------------------------------------------------------------------
1 | detected_genes
2 | ==============
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: detected_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.dot_heatmap.rst:
--------------------------------------------------------------------------------
1 | dot_heatmap
2 | ===========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dot_heatmap
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.dot_heatmap_split.rst:
--------------------------------------------------------------------------------
1 | dot_heatmap_split
2 | =================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dot_heatmap_split
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.dot_heatmap_split_greyscale.rst:
--------------------------------------------------------------------------------
1 | dot_heatmap_split_greyscale
2 | ===========================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dot_heatmap_split_greyscale
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.dropouts.rst:
--------------------------------------------------------------------------------
1 | dropouts
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dropouts
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.gene_expr_split.rst:
--------------------------------------------------------------------------------
1 | gene_expr_split
2 | ===============
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: gene_expr_split
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.gene_expr_split_stacked.rst:
--------------------------------------------------------------------------------
1 | gene_expr_split_stacked
2 | =======================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: gene_expr_split_stacked
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.kp_cells.rst:
--------------------------------------------------------------------------------
1 | kp_cells
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: kp_cells
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.kp_counts.rst:
--------------------------------------------------------------------------------
1 | kp_counts
2 | =========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: kp_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.kp_genes.rst:
--------------------------------------------------------------------------------
1 | kp_genes
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: kp_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.library_size.rst:
--------------------------------------------------------------------------------
1 | library_size
2 | ============
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: library_size
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.librarysize_overview.rst:
--------------------------------------------------------------------------------
1 | librarysize_overview
2 | ====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: librarysize_overview
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.max_counts.rst:
--------------------------------------------------------------------------------
1 | max_counts
2 | ==========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: max_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.max_genes.rst:
--------------------------------------------------------------------------------
1 | max_genes
2 | =========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: max_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.max_mito.rst:
--------------------------------------------------------------------------------
1 | max_mito
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: max_mito
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.nomenclature_network.rst:
--------------------------------------------------------------------------------
1 | nomenclature_network
2 | ====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: nomenclature_network
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.riverplot_2categories.rst:
--------------------------------------------------------------------------------
1 | riverplot_2categories
2 | =====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: riverplot_2categories
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.stacked_split_violin.rst:
--------------------------------------------------------------------------------
1 | stacked_split_violin
2 | ====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: stacked_split_violin
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.top_genes_counts.rst:
--------------------------------------------------------------------------------
1 | top_genes_counts
2 | ================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: top_genes_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.transcript_capture_efficiency.rst:
--------------------------------------------------------------------------------
1 | transcript_capture_efficiency
2 | =============================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: transcript_capture_efficiency
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pl.update_qualitative_palette.rst:
--------------------------------------------------------------------------------
1 | update_qualitative_palette
2 | ==========================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: update_qualitative_palette
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.filter.rst:
--------------------------------------------------------------------------------
1 | filter
2 | ======
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: filter
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.filter_gene_list.rst:
--------------------------------------------------------------------------------
1 | filter_gene_list
2 | ================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: filter_gene_list
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.frac_pos.rst:
--------------------------------------------------------------------------------
1 | frac_pos
2 | ========
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: frac_pos
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.frac_reads.rst:
--------------------------------------------------------------------------------
1 | frac_reads
2 | ==========
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: frac_reads
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.fraction_counts.rst:
--------------------------------------------------------------------------------
1 | fraction_counts
2 | ===============
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: fraction_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.mean_expr.rst:
--------------------------------------------------------------------------------
1 | mean_expr
2 | =========
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: mean_expr
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.normalize_geometric.rst:
--------------------------------------------------------------------------------
1 | normalize_geometric
2 | ===================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: normalize_geometric
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.top_counts_genes.rst:
--------------------------------------------------------------------------------
1 | top_counts_genes
2 | ================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: top_counts_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.pp.top_expressed_genes.rst:
--------------------------------------------------------------------------------
1 | top_expressed_genes
2 | ===================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: top_expressed_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.additional_labeling.rst:
--------------------------------------------------------------------------------
1 | additional_labeling
2 | ===================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: additional_labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.celltype_labeling.rst:
--------------------------------------------------------------------------------
1 | celltype_labeling
2 | =================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: celltype_labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.export_celltype.rst:
--------------------------------------------------------------------------------
1 | export_celltype
2 | ===============
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_celltype
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.export_clustering.rst:
--------------------------------------------------------------------------------
1 | export_clustering
2 | =================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_clustering
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.export_cp10k.rst:
--------------------------------------------------------------------------------
1 | export_cp10k
2 | ============
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_cp10k
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.export_metadata.rst:
--------------------------------------------------------------------------------
1 | export_metadata
2 | ===============
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_metadata
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.export_rank.rst:
--------------------------------------------------------------------------------
1 | export_rank
2 | ===========
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_rank
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.export_regressedOut.rst:
--------------------------------------------------------------------------------
1 | export_regressedOut
2 | ===================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_regressedOut
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.filtering_cells_genes_min.rst:
--------------------------------------------------------------------------------
1 | filtering_cells_genes_min
2 | =========================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: filtering_cells_genes_min
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.filtering_mito_genes_max.rst:
--------------------------------------------------------------------------------
1 | filtering_mito_genes_max
2 | ========================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: filtering_mito_genes_max
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.st.read_matrix.rst:
--------------------------------------------------------------------------------
1 | read_matrix
2 | ===========
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: read_matrix
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.annotate_cells_clustering.rst:
--------------------------------------------------------------------------------
1 | annotate_cells_clustering
2 | =========================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: annotate_cells_clustering
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.bcor.batch_correct.rst:
--------------------------------------------------------------------------------
1 | batch_correct
2 | =============
3 | 
4 | .. currentmodule:: besca.tl.bcor
5 | 
6 | .. autofunction:: batch_correct
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.bcor.postprocess_mnnpy.rst:
--------------------------------------------------------------------------------
1 | postprocess_mnnpy
2 | =================
3 | 
4 | .. currentmodule:: besca.tl.bcor
5 | 
6 | .. autofunction:: postprocess_mnnpy
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.count_occurrence.rst:
--------------------------------------------------------------------------------
1 | count_occurrence
2 | ================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: count_occurrence
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.count_occurrence_subset.rst:
--------------------------------------------------------------------------------
1 | count_occurrence_subset
2 | =======================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: count_occurrence_subset
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.count_occurrence_subset_conditions.rst:
--------------------------------------------------------------------------------
1 | count_occurrence_subset_conditions
2 | ==================================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: count_occurrence_subset_conditions
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.dge.get_de.rst:
--------------------------------------------------------------------------------
1 | get_de
2 | ======
3 | 
4 | .. currentmodule:: besca.tl.dge
5 | 
6 | .. autofunction:: get_de
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.dge.perform_dge.rst:
--------------------------------------------------------------------------------
1 | perform_dge
2 | ===========
3 | 
4 | .. currentmodule:: besca.tl.dge
5 | 
6 | .. autofunction:: perform_dge
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.dge.plot_interactive_volcano.rst:
--------------------------------------------------------------------------------
1 | plot_interactive_volcano
2 | ========================
3 | 
4 | .. currentmodule:: besca.tl.dge
5 | 
6 | .. autofunction:: plot_interactive_volcano
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.rc.annotate_new_cellnames.rst:
--------------------------------------------------------------------------------
1 | annotate_new_cellnames
2 | ======================
3 | 
4 | .. currentmodule:: besca.tl.rc
5 | 
6 | .. autofunction:: annotate_new_cellnames
7 | 


--------------------------------------------------------------------------------
/docs/source/besca/besca.tl.rc.recluster.rst:
--------------------------------------------------------------------------------
1 | recluster
2 | =========
3 | 
4 | .. currentmodule:: besca.tl.rc
5 | 
6 | .. autofunction:: recluster
7 | 


--------------------------------------------------------------------------------
/docs/source/besca_standard_pipeline.rst:
--------------------------------------------------------------------------------
 1 | .. _besca-standard-pipeline:
 2 | 
 3 | =======================
 4 | besca standard pipeline
 5 | =======================
 6 | 
 7 | 
 8 | 
 9 | The besca standard workflow offers a standardized series of steps that take raw data to filtered data, ready for the annotation process.
10 | 
11 | 
12 | 
13 | 
14 | Besca is distributed with this workflow available as a notebook:
15 | https://github.com/bedapub/besca/blob/master/workbooks/standard_workflow_besca2.ipynb
16 | 
17 | 
18 | The different individual steps are described in the tutorial:
19 | :doc:`data processing <tutorials/notebook1_data_processing_pbmc3k>` 
20 | 
21 | 
22 | 
23 | And different examples are available in the publication results repository:
24 | 
25 | `PBMC3K standard workflow <https://github.com/bedapub/besca_publication_results/blob/master/hematopoietic/pbmc3k/standard_workflow_besca2-Raw.ipynb>`_
26 | 
27 | `Lee 2020 Intestine standard workflow <https://github.com/bedapub/besca_publication_results/blob/master/intestine/Lee2020/standard_workflow_besca2.1_sc145_bescapub.ipynb>`_
28 | 
29 | `Granja 2019 hematopoietic standard workflow <https://github.com/bedapub/besca_publication_results/blob/master/hematopoietic/Granja2019/standard_workflow_besca2.0_updated.ipynb>`_
30 | 
31 | 
32 | 
33 | 
34 | 
35 | 


--------------------------------------------------------------------------------
/docs/source/dge/besca.tl.dge.get_de.rst:
--------------------------------------------------------------------------------
1 | get_de
2 | ======
3 | 
4 | .. currentmodule:: besca.tl.dge
5 | 
6 | .. autofunction:: get_de
7 | 


--------------------------------------------------------------------------------
/docs/source/dge/besca.tl.dge.perform_dge.rst:
--------------------------------------------------------------------------------
1 | perform_dge
2 | ===========
3 | 
4 | .. currentmodule:: besca.tl.dge
5 | 
6 | .. autofunction:: perform_dge
7 | 


--------------------------------------------------------------------------------
/docs/source/dge/besca.tl.dge.plot_interactive_volcano.rst:
--------------------------------------------------------------------------------
1 | plot_interactive_volcano
2 | ========================
3 | 
4 | .. currentmodule:: besca.tl.dge
5 | 
6 | .. autofunction:: plot_interactive_volcano
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.X_to_mtx.rst:
--------------------------------------------------------------------------------
1 | X_to_mtx
2 | ========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: X_to_mtx
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.analysis_metadata.rst:
--------------------------------------------------------------------------------
1 | analysis_metadata
2 | =================
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: analysis_metadata
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.clustering.rst:
--------------------------------------------------------------------------------
1 | clustering
2 | ==========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: clustering
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.generate_gep.rst:
--------------------------------------------------------------------------------
1 | generate_gep
2 | ============
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: generate_gep
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.labeling.rst:
--------------------------------------------------------------------------------
1 | labeling
2 | ========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.labeling_info.rst:
--------------------------------------------------------------------------------
1 | labeling_info
2 | =============
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: labeling_info
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.pseudobulk.rst:
--------------------------------------------------------------------------------
1 | pseudobulk
2 | ==========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: pseudobulk
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.ranked_genes.rst:
--------------------------------------------------------------------------------
1 | ranked_genes
2 | ============
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: ranked_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/export/besca.export.raw_to_mtx.rst:
--------------------------------------------------------------------------------
1 | raw_to_mtx
2 | ==========
3 | 
4 | .. currentmodule:: besca.export
5 | 
6 | .. autofunction:: raw_to_mtx
7 | 


--------------------------------------------------------------------------------
/docs/source/helper_functions/besca.concate_adata.rst:
--------------------------------------------------------------------------------
1 | ﻿besca.concate\_adata
2 | ====================
3 | 
4 | .. currentmodule:: besca
5 | 
6 | .. autofunction:: concate_adata


--------------------------------------------------------------------------------
/docs/source/helper_functions/besca.convert_ensembl_to_symbol.rst:
--------------------------------------------------------------------------------
1 | ﻿besca.convert\_ensembl\_to\_symbol
2 | ==================================
3 | 
4 | .. currentmodule:: besca
5 | 
6 | .. autofunction:: convert_ensembl_to_symbol


--------------------------------------------------------------------------------
/docs/source/helper_functions/besca.convert_symbol_to_ensembl.rst:
--------------------------------------------------------------------------------
1 | ﻿besca.convert\_symbol\_to\_ensembl
2 | ==================================
3 | 
4 | .. currentmodule:: besca
5 | 
6 | .. autofunction:: convert_symbol_to_ensembl


--------------------------------------------------------------------------------
/docs/source/helper_functions/besca.get_ameans.rst:
--------------------------------------------------------------------------------
1 | ﻿besca.get\_ameans
2 | =================
3 | 
4 | .. currentmodule:: besca
5 | 
6 | .. autofunction:: get_ameans


--------------------------------------------------------------------------------
/docs/source/helper_functions/besca.get_means.rst:
--------------------------------------------------------------------------------
1 | ﻿besca.get\_means
2 | ================
3 | 
4 | .. currentmodule:: besca
5 | 
6 | .. autofunction:: get_means


--------------------------------------------------------------------------------
/docs/source/helper_functions/besca.get_raw.rst:
--------------------------------------------------------------------------------
1 | ﻿besca.get\_raw
2 | ==============
3 | 
4 | .. currentmodule:: besca
5 | 
6 | .. autofunction:: get_raw


--------------------------------------------------------------------------------
/docs/source/helper_functions/besca.subset_adata.rst:
--------------------------------------------------------------------------------
1 | ﻿besca.subset\_adata
2 | ===================
3 | 
4 | .. currentmodule:: besca
5 | 
6 | .. autofunction:: subset_adata


--------------------------------------------------------------------------------
/docs/source/import/besca.Import.add_cell_labeling.rst:
--------------------------------------------------------------------------------
1 | add_cell_labeling
2 | =================
3 | 
4 | .. currentmodule:: besca.Import
5 | 
6 | .. autofunction:: add_cell_labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/import/besca.Import.assert_adata.rst:
--------------------------------------------------------------------------------
1 | assert_adata
2 | ============
3 | 
4 | .. currentmodule:: besca.Import
5 | 
6 | .. autofunction:: assert_adata
7 | 


--------------------------------------------------------------------------------
/docs/source/import/besca.Import.read_mtx.rst:
--------------------------------------------------------------------------------
1 | read_mtx
2 | ========
3 | 
4 | .. currentmodule:: besca.Import
5 | 
6 | .. autofunction:: read_mtx
7 | 


--------------------------------------------------------------------------------
/docs/source/index.rst:
--------------------------------------------------------------------------------
 1 | .. _index:
 2 | 
 3 | .. toctree::
 4 |    :maxdepth: 2
 5 |    :caption: contents:
 6 |    :hidden:
 7 | 
 8 |    besca <besca>
 9 |    code examples <auto_examples/index>
10 |    tutorials <tutorials>
11 |    standard pipeline <besca_standard_pipeline>
12 |    adding new functions to besca <adding_new_functions>
13 | 
14 | Welcome to besca's documentation!
15 | =================================
16 | 
17 | The besca (BEDA's single-cell sequencing analysis) package builds upon the scanpy library and offers additional data structures and functions for single-cell analysis.
18 | 
19 | .. image:: _images/besca_outline.jpg
20 |    :align: center
21 | 
22 | The package is grouped into 6 modules:
23 | 
24 | - :ref:`preprocessing functions<preprocessing-functions>`: the `pp` module contains functions relevant for data preprocessing.
25 | - :ref:`plotting functions <plotting-functions>`: the `pl` module offers additional plot types not available in the scanpy package  
26 | - :ref:`tools <tools-functions>`: the `tl` module contains additional tools, for instance tools to perform differential gene analysis
27 | - :ref:`standardworkflow <standardworkflow-functions>`: the `st` module contains functions optimized for the besca standard single-cell sequencing analysis pipeline
28 | - :ref:`import<import-functions>`/:ref:`export <export-functions>`: the `Import` and `export` modules are collections of functions to load data from and export data to the FAIR data format
29 | 
30 | In addition you will find example code and output (including some short tutorials) :doc:`here <auto_examples/index>`, as well as extensive documentation on :ref:`adding functions to besca <adding-new-functions>`.
31 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.box_per_ind.rst:
--------------------------------------------------------------------------------
1 | box_per_ind
2 | ===========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: box_per_ind
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.celllabel_quant_boxplot.rst:
--------------------------------------------------------------------------------
1 | celllabel_quant_boxplot
2 | =======================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: celllabel_quant_boxplot
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.celllabel_quant_stackedbar.rst:
--------------------------------------------------------------------------------
1 | celllabel_quant_stackedbar
2 | ==========================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: celllabel_quant_stackedbar
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.detected_genes.rst:
--------------------------------------------------------------------------------
1 | detected_genes
2 | ==============
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: detected_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.dot_heatmap.rst:
--------------------------------------------------------------------------------
1 | dot_heatmap
2 | ===========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dot_heatmap
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.dot_heatmap_split.rst:
--------------------------------------------------------------------------------
1 | dot_heatmap_split
2 | =================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dot_heatmap_split
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.dot_heatmap_split_greyscale.rst:
--------------------------------------------------------------------------------
1 | dot_heatmap_split_greyscale
2 | ===========================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dot_heatmap_split_greyscale
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.dropouts.rst:
--------------------------------------------------------------------------------
1 | dropouts
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: dropouts
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.gene_expr_split.rst:
--------------------------------------------------------------------------------
1 | gene_expr_split
2 | ===============
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: gene_expr_split
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.gene_expr_split_stacked.rst:
--------------------------------------------------------------------------------
1 | gene_expr_split_stacked
2 | =======================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: gene_expr_split_stacked
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.kp_cells.rst:
--------------------------------------------------------------------------------
1 | kp_cells
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: kp_cells
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.kp_counts.rst:
--------------------------------------------------------------------------------
1 | kp_counts
2 | =========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: kp_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.kp_genes.rst:
--------------------------------------------------------------------------------
1 | kp_genes
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: kp_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.library_size.rst:
--------------------------------------------------------------------------------
1 | library_size
2 | ============
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: library_size
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.librarysize_overview.rst:
--------------------------------------------------------------------------------
1 | librarysize_overview
2 | ====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: librarysize_overview
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.max_counts.rst:
--------------------------------------------------------------------------------
1 | max_counts
2 | ==========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: max_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.max_genes.rst:
--------------------------------------------------------------------------------
1 | max_genes
2 | =========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: max_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.max_mito.rst:
--------------------------------------------------------------------------------
1 | max_mito
2 | ========
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: max_mito
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.nomenclature_network.rst:
--------------------------------------------------------------------------------
1 | nomenclature_network
2 | ====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: nomenclature_network
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.riverplot_2categories.rst:
--------------------------------------------------------------------------------
1 | riverplot_2categories
2 | =====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: riverplot_2categories
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.stacked_split_violin.rst:
--------------------------------------------------------------------------------
1 | stacked_split_violin
2 | ====================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: stacked_split_violin
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.top_genes_counts.rst:
--------------------------------------------------------------------------------
1 | top_genes_counts
2 | ================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: top_genes_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.transcript_capture_efficiency.rst:
--------------------------------------------------------------------------------
1 | transcript_capture_efficiency
2 | =============================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: transcript_capture_efficiency
7 | 


--------------------------------------------------------------------------------
/docs/source/plotting/besca.pl.update_qualitative_palette.rst:
--------------------------------------------------------------------------------
1 | update_qualitative_palette
2 | ==========================
3 | 
4 | .. currentmodule:: besca.pl
5 | 
6 | .. autofunction:: update_qualitative_palette
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.filter.rst:
--------------------------------------------------------------------------------
1 | filter
2 | ======
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: filter
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.filter_gene_list.rst:
--------------------------------------------------------------------------------
1 | filter_gene_list
2 | ================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: filter_gene_list
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.frac_pos.rst:
--------------------------------------------------------------------------------
1 | frac_pos
2 | ========
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: frac_pos
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.frac_reads.rst:
--------------------------------------------------------------------------------
1 | frac_reads
2 | ==========
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: frac_reads
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.fraction_counts.rst:
--------------------------------------------------------------------------------
1 | fraction_counts
2 | ===============
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: fraction_counts
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.mean_expr.rst:
--------------------------------------------------------------------------------
1 | mean_expr
2 | =========
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: mean_expr
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.normalize_geometric.rst:
--------------------------------------------------------------------------------
1 | normalize_geometric
2 | ===================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: normalize_geometric
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.top_counts_genes.rst:
--------------------------------------------------------------------------------
1 | top_counts_genes
2 | ================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: top_counts_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/preprocessing/besca.pp.top_expressed_genes.rst:
--------------------------------------------------------------------------------
1 | top_expressed_genes
2 | ===================
3 | 
4 | .. currentmodule:: besca.pp
5 | 
6 | .. autofunction:: top_expressed_genes
7 | 


--------------------------------------------------------------------------------
/docs/source/reclustering/besca.tl.rc.annotate_new_cellnames.rst:
--------------------------------------------------------------------------------
1 | annotate_new_cellnames
2 | ======================
3 | 
4 | .. currentmodule:: besca.tl.rc
5 | 
6 | .. autofunction:: annotate_new_cellnames
7 | 


--------------------------------------------------------------------------------
/docs/source/reclustering/besca.tl.rc.recluster.rst:
--------------------------------------------------------------------------------
1 | recluster
2 | =========
3 | 
4 | .. currentmodule:: besca.tl.rc
5 | 
6 | .. autofunction:: recluster
7 | 


--------------------------------------------------------------------------------
/docs/source/scripts/example_structure_environment.yml:
--------------------------------------------------------------------------------
1 | name: myenv
2 | channels:
3 | - conda-forge
4 | - defaults
5 | dependencies:
6 | - ca-certificates=2018.11.29=ha4d7672_0
7 | - cairo=1.14.12=ha4e643d_1006
8 | - ... list of all conda packages in the above format


--------------------------------------------------------------------------------
/docs/source/scripts/example_structure_environment_combined.yml:
--------------------------------------------------------------------------------
 1 | name: myenv
 2 | channels:
 3 | - conda-forge
 4 | - defaults
 5 | dependencies:
 6 | - ca-certificates=2018.11.29=ha4d7672_0
 7 | - cairo=1.14.12=ha4e643d_1006
 8 | - ... list of all conda packages in the above format
 9 | - pip:
10 |   - alabaster==0.7.12
11 |   - anndata==0.6.18
12 |   - ... list of all pip packages in the above format


--------------------------------------------------------------------------------
/docs/source/scripts/example_structure_environment_pip.yml:
--------------------------------------------------------------------------------
1 | alabaster==0.7.12
2 | anndata==0.6.18
3 | ... list of all pip packages in the above format


--------------------------------------------------------------------------------
/docs/source/scripts/gallery_package_structure.txt:
--------------------------------------------------------------------------------
 1 |  examples
 2 |   ├── gallery_examples
 3 |   │   ├── README.txt
 4 |   │   ├── plotting
 5 |   │   │   ├── README.txt
 6 |   │   │   └── ... (examples as .py files)
 7 |   │   ├── preprocessing
 8 |   │   │   ├── README.txt
 9 |   │   │   └── ... (examples as .py files)
10 |   │   ├── tools
11 |   │   │   ├── README.txt
12 |   │   │   └── ... (examples as .py files)
13 |   │   ├── workflows
14 |   │   │   ├── README.txt
15 |   │   │   └── ... (examples as .py files)
16 |   │   └── figures_testing
17 |   │       └── ... (figures generated by the examples within the gallery)
18 |   └── ... other example scripts not intended for gallery


--------------------------------------------------------------------------------
/docs/source/scripts/python_minimal_package_structure.txt:
--------------------------------------------------------------------------------
 1 |  besca
 2 |   ├── datasets
 3 |   │   └── __init__.py
 4 |   ├── export
 5 |   │   ├── __init__.py
 6 |   │   └── ... (export functions)
 7 |   ├── Import
 8 |   │   ├── __init__.py
 9 |   │   └── ... (Import functions)
10 |   ├── __init__.py
11 |   ├── pl
12 |   │   ├── __init__.py
13 |   │   └── ... (plotting functions)
14 |   ├── pp
15 |   │   ├── __init__.py
16 |   │   └── ... (preprocessing functions)
17 |   ├── st
18 |   │   ├── __init__.py
19 |   │   └── ... (standard pipeline functions)
20 |   └── tl
21 |       ├── ... (tl functions)
22 |       └── submodule
23 |           ├── __init__.py
24 |           └── ... (functions of submodule)


--------------------------------------------------------------------------------
/docs/source/scripts/python_package_structure.txt:
--------------------------------------------------------------------------------
 1 | .
 2 | ├── besca
 3 | │   ├── datasets
 4 | │   │   ├── data
 5 | │   │   │   └── ... (contains .h5ad files of all datasets included in besca)
 6 | │   │   ├── _datasets.py
 7 | │   │   └── __init__.py
 8 | │   ├── examples
 9 | │   │   ├── ... (example functions for documentation)
10 | │   │   ├── gallery_examples
11 | │   │   │   ├── figures_testing
12 | │   │   │   │   └── ... (figures generated by gallery scripts)
13 | │   │   │   ├── plotting
14 | │   │   │   │   ├── ... (gallery examples for plotting)
15 | │   │   │   │   └── README.txt
16 | │   │   │   ├── preprocessing
17 | │   │   │   │   ├── ... (gallery examples for preprocessing)
18 | │   │   │   │   └── README.txt
19 | │   │   │   ├── README.txt
20 | │   │   │   ├── tools
21 | │   │   │   │   ├── ... (gallery examples for tools)
22 | │   │   │   │   └── README.txt
23 | │   │   │   └── workflows
24 | │   │   │       ├── ... (gallery examples for workflows)
25 | │   │   │       └── README.txt
26 | │   ├── export
27 | │   │   ├── __init__.py
28 | │   │   └── ... (export functions)
29 | │   ├── _helper.py
30 | │   ├── Import
31 | │   │   ├── __init__.py
32 | │   │   └── ... (Import functions)
33 | │   ├── __init__.py
34 | │   ├── _logging.py
35 | │   ├── pl
36 | │   │   ├── __init__.py
37 | │   │   └── ... (plotting functions)
38 | │   ├── pp
39 | │   │   ├── __init__.py
40 | │   │   └── ... (preprocessing functions)
41 | │   ├── st
42 | │   │   ├── __init__.py
43 | │   │   └── ... (standard pipeline functions)
44 | │   └── tl
45 | │       ├── ... (tl functions)
46 | │       └── submodule
47 | │           ├── __init__.py
48 | │           └── ... (functions of submodule)
49 | ├── docs
50 | │   ├── Makefile
51 | │   └── source
52 | │       ├── adding_new_functions.rst
53 | │       ├── auto_examples
54 | │       │   └── ... (lots of automatically generated files (DONT MODIFY))
55 | │       ├── bcor
56 | │       │   ├── besca.tl.bcor.batch_correct.rst
57 | │       │   └── besca.tl.bcor.postprocess_mnnpy.rst
58 | │       ├── bc.rst
59 | │       ├── besca
60 | │       │   └── ... (automatically generated)
61 | │       ├── besca_maintenance.rst
62 | │       ├── besca.rst
63 | │       ├── conf.py
64 | │       ├── export
65 | │       │   └── ... (automatically generated)
66 | │       ├── images
67 | │       │   └── besca_outline.PNG
68 | │       ├── import
69 | │       │   └── ... (automatically generated)
70 | │       ├── index.rst
71 | │       ├── plotting
72 | │       │   └── ... (automatically generated)
73 | │       ├── preprocessing
74 | │       │   └── ... (automatically generated)
75 | │       ├── reclustering
76 | │       │   └── ... (automatically generated)
77 | │       ├── scripts
78 | │       │   └── ... (collection of scripts/text files for documentation)
79 | │       ├── standardworkflow
80 | │       │   └── ... (automatically generated)
81 | │       ├── tools
82 | │       │   └── ... (automatically generated)
83 | │       └── tutorials.rst
84 | ├── MANIFEST.in
85 | ├── README.md
86 | ├── requirements.txt
87 | ├── setup.py
88 | └── workbooks
89 |     ├── standard_workflow_v2.6_besca.ipynb
90 |     ├── Testing_Notebook.ipynb
91 |     └── ... (tutorial notebooks)


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.add_anno.rst:
--------------------------------------------------------------------------------
1 | add_anno
2 | ========
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: add_anno
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.combined_signature_score.rst:
--------------------------------------------------------------------------------
1 | combined_signature_score
2 | ========================
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: combined_signature_score
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.compute_signed_score.rst:
--------------------------------------------------------------------------------
1 | compute_signed_score
2 | ====================
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: compute_signed_score
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.export_annotconfig.rst:
--------------------------------------------------------------------------------
1 | export_annotconfig
2 | ==================
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: export_annotconfig
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.filter_siggenes.rst:
--------------------------------------------------------------------------------
1 | filter_siggenes
2 | ===============
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: filter_siggenes
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.get_gems.rst:
--------------------------------------------------------------------------------
1 | get_gems
2 | ========
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: get_gems
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.get_similar_geneset.rst:
--------------------------------------------------------------------------------
1 | get_similar_geneset
2 | ===================
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: get_similar_geneset
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.getset.rst:
--------------------------------------------------------------------------------
1 | getset
2 | ======
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: getset
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.insert_gems.rst:
--------------------------------------------------------------------------------
1 | insert_gems
2 | ===========
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: insert_gems
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.make_anno.rst:
--------------------------------------------------------------------------------
1 | make_anno
2 | =========
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: make_anno
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.match_cluster.rst:
--------------------------------------------------------------------------------
1 | match_cluster
2 | =============
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: match_cluster
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.obtain_dblabel.rst:
--------------------------------------------------------------------------------
1 | obtain_dblabel
2 | ==============
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: obtain_dblabel
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.read_GMT_sign.rst:
--------------------------------------------------------------------------------
1 | read_GMT_sign
2 | =============
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: read_GMT_sign
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.read_annotconfig.rst:
--------------------------------------------------------------------------------
1 | read_annotconfig
2 | ================
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: read_annotconfig
7 | 


--------------------------------------------------------------------------------
/docs/source/sig/besca.tl.sig.score_mw.rst:
--------------------------------------------------------------------------------
1 | score_mw
2 | ========
3 | 
4 | .. currentmodule:: besca.tl.sig
5 | 
6 | .. autofunction:: score_mw
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.additional_labeling.rst:
--------------------------------------------------------------------------------
1 | additional_labeling
2 | ===================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: additional_labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.celltype_labeling.rst:
--------------------------------------------------------------------------------
1 | celltype_labeling
2 | =================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: celltype_labeling
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.export_celltype.rst:
--------------------------------------------------------------------------------
1 | export_celltype
2 | ===============
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_celltype
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.export_clustering.rst:
--------------------------------------------------------------------------------
1 | export_clustering
2 | =================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_clustering
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.export_cp10k.rst:
--------------------------------------------------------------------------------
1 | export_cp10k
2 | ============
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_cp10k
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.export_metadata.rst:
--------------------------------------------------------------------------------
1 | export_metadata
2 | ===============
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_metadata
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.export_rank.rst:
--------------------------------------------------------------------------------
1 | export_rank
2 | ===========
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_rank
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.export_regressedOut.rst:
--------------------------------------------------------------------------------
1 | export_regressedOut
2 | ===================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: export_regressedOut
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.filtering_cells_genes_min.rst:
--------------------------------------------------------------------------------
1 | filtering_cells_genes_min
2 | =========================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: filtering_cells_genes_min
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.filtering_mito_genes_max.rst:
--------------------------------------------------------------------------------
1 | filtering_mito_genes_max
2 | ========================
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: filtering_mito_genes_max
7 | 


--------------------------------------------------------------------------------
/docs/source/standardworkflow/besca.st.read_matrix.rst:
--------------------------------------------------------------------------------
1 | read_matrix
2 | ===========
3 | 
4 | .. currentmodule:: besca.st
5 | 
6 | .. autofunction:: read_matrix
7 | 


--------------------------------------------------------------------------------
/docs/source/tools/besca.tl.annotate_cells_clustering.rst:
--------------------------------------------------------------------------------
1 | annotate_cells_clustering
2 | =========================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: annotate_cells_clustering
7 | 


--------------------------------------------------------------------------------
/docs/source/tools/besca.tl.count_occurrence.rst:
--------------------------------------------------------------------------------
1 | count_occurrence
2 | ================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: count_occurrence
7 | 


--------------------------------------------------------------------------------
/docs/source/tools/besca.tl.count_occurrence_subset.rst:
--------------------------------------------------------------------------------
1 | count_occurrence_subset
2 | =======================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: count_occurrence_subset
7 | 


--------------------------------------------------------------------------------
/docs/source/tools/besca.tl.count_occurrence_subset_conditions.rst:
--------------------------------------------------------------------------------
1 | count_occurrence_subset_conditions
2 | ==================================
3 | 
4 | .. currentmodule:: besca.tl
5 | 
6 | .. autofunction:: count_occurrence_subset_conditions
7 | 


--------------------------------------------------------------------------------
/docs/source/tutorials.rst:
--------------------------------------------------------------------------------
 1 | .. _tutorials:
 2 | 
 3 | tutorials
 4 | =========
 5 | 
 6 | 
 7 | .. toctree::
 8 |    :hidden:
 9 |    :maxdepth: 2
10 | 
11 |    tutorials/notebook1_data_processing_pbmc3k.ipynb
12 |    tutorials/notebook2_celltype_annotation_pbmc3k.ipynb
13 |    tutorials/notebook3_batch_correction.ipynb
14 |    tutorials/auto_annot_tutorial.ipynb
15 |    tutorials_html/bescape_tutorial.html
16 |    tutorials_html/adata_to_eset.html
17 | 
18 | 
19 | single cell sequencing general tutorials
20 | ---------------------------------------------------------------
21 | 
22 | This tutorial will give you a general introduction to single-cell sequencing analysis using scanpy and besca. It is divided into three separate notebooks that should be looked at in consecutive order (they build up on results from the previous notebooks).
23 | 
24 | **Part 1**: :doc:`data processing <tutorials/notebook1_data_processing_pbmc3k>` 
25 | 
26 | **Part 2**: :doc:`celltype annotation <tutorials/notebook2_celltype_annotation_pbmc3k>`
27 | 
28 | **Part 3**: :doc:`batch correction <tutorials/notebook3_batch_correction>`
29 | 
30 | After looking at the introductory tutorial you can download the hands-on tutorial yourself from `here <https://github.com/bedapub/besca/blob/master/docs/source/tutorials/scRNAseq_tutorial.ipynb>`_  (please save the link as a :code:`.ipynb` file) and compare with the results published :doc:`here <tutorials/scRNAseq_tutorial>`.
31 | 
32 | 
33 | single cell auto_annot tutorial for cell type annotation
34 | ---------------------------------------------------------------
35 | 
36 | We also provide a tutorial for the auto_annot package, which allows you to automatically annotate cell types using supervised machine learning.
37 | You can download it from `here <https://github.com/bedapub/besca/blob/master/docs/source/tutorials/auto_annot_tutorial.ipynb>`_
38 | (please save the link as a :code:`.ipynb` file) and compare with the results published
39 | :doc:`here <tutorials/auto_annot_tutorial>`.
40 | 
41 | 
42 | Bescape: cell deconvolution tutorial
43 | ---------------------------------------------------------------
44 | 
45 | 
46 | Bescape (BESCA proportion estimator) is a deconvolution module. It utilises single-cell annotations coming from the BESCA workflow to build a Gene Expression Profile (GEP). This GEP is used as a basis vector to deconvolute bulk RNA samples i.e. predict cell type proportions within a sample.
47 | 
48 | **Deconvolution tutorial**:   :download:`Bescape <tutorials_html/bescape_tutorial.html>`
49 | 
50 | 
51 | Some deconvolution methods provided by Bescape are written in R. 
52 | Thus, we need to convert the AnnData objects to R ExpressionSet objects. This has been semi-automated:
53 | 
54 | **adata_to_eset tutorial:**   :download:`here <tutorials_html/adata_to_eset.html>`
55 | 
56 | 


--------------------------------------------------------------------------------
/docs/source/tutorials/scRNAseq_tutorial.umap_comparison_figure.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bedapub/besca/27c36b5e7d22790f429056cb8b1c2539469bc50a/docs/source/tutorials/scRNAseq_tutorial.umap_comparison_figure.png


--------------------------------------------------------------------------------
/docs/source/tutorials_html/generate_tutorialHtml.sh:
--------------------------------------------------------------------------------
1 | # GET static file:
2 | for file in adata_to_eset.ipynb bescape_tutorial.ipynb
3 | do
4 |     jupyter nbconvert --to html ../tutorials/$file 
5 | done
6 | mv ../tutorials/*.html .
7 | 


--------------------------------------------------------------------------------
/environment.yml:
--------------------------------------------------------------------------------
 1 | name: besca_dev
 2 | channels:
 3 |   - conda-forge
 4 |   - bioconda
 5 |   - defaults
 6 | dependencies:
 7 |   - python=3.9
 8 |   - scipy
 9 |   - flask-restful
10 |   - dominate
11 |   - requests
12 |   - numpy<1.24
13 |   - scanpy
14 |   - plotly
15 |   - anndata
16 |   - seaborn
17 |   - mygene
18 |   - pandas
19 |   - matplotlib
20 |   - python-igraph
21 |   - leidenalg
22 |   - scanorama
23 |   - scvelo
24 |   - umap-learn
25 |   - session-info
26 |   - pydot
27 |   - scvi-tools
28 |   - ipython
29 |   - pytest
30 |   - deprecation
31 |   - gseapy
32 |   - pip
33 |   - pip:
34 |       - scikit_learn>=1.0.0
35 |       - git+https://github.com/matchy233/bbknn.git@fix
36 |       - nbclean>=0.3.2
37 |       - jax==0.4.7
38 |       - jaxlib==0.4.7
39 |       - git+https://github.com/bedapub/besca.git
40 | 


--------------------------------------------------------------------------------
/pytest.ini:
--------------------------------------------------------------------------------
1 | [pytest]
2 | addopts = -p no:warnings --junit-xml=tests/output_junit.xml


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
 1 | scipy>=1.5.4
 2 | flask-restful
 3 | dominate
 4 | requests
 5 | numpy>=1.18.0
 6 | scanpy>=1.7.2
 7 | plotly
 8 | anndata>=0.7.4
 9 | seaborn
10 | mygene
11 | pandas>=1.1.0
12 | matplotlib>=3.5.0
13 | bbknn
14 | ipython
15 | nbclean
16 | scikit_learn>=1.0.2
17 | python-igraph
18 | leidenalg>=0.8.3
19 | scanorama
20 | scvelo
21 | umap-learn
22 | session-info
23 | pydot
24 | scvi-tools
25 | pytest
26 | deprecation
27 | gseapy
28 | 


--------------------------------------------------------------------------------
/setup.cfg:
--------------------------------------------------------------------------------
1 | [versioneer]
2 | VCS = git
3 | style = pep440
4 | versionfile_source = besca/_version.py
5 | versionfile_build = besca/_version.py
6 | tag_prefix =
7 | parentdir_prefix = besca-
8 | 


--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
 1 | """ setup procedure """
 2 | 
 3 | if __name__ == "__main__":
 4 | 
 5 |     from setuptools import setup, find_packages
 6 |     import versioneer
 7 | 
 8 |     reqs = open("requirements.txt", encoding="utf-8").readlines()
 9 |     requires = [req.strip() for req in reqs]
10 | 
11 |     with open("README.md", "r") as fh:
12 |         long_description = fh.read()
13 | 
14 |     setup(
15 |         name="besca",
16 |         version=versioneer.get_version(),
17 |         cmdclass=versioneer.get_cmdclass(),
18 |         description="Collection of BEDA internal python functions for analysing single cell RNAseq data.",
19 |         long_description=long_description,
20 |         long_description_content_type="text/markdown",
21 |         classifiers=[
22 |             "Development Status :: 5 - Production/Stable",
23 |             "Intended Audience :: Developers",
24 |             "Topic :: Software Development :: Build Tools",
25 |             "License :: OSI Approved :: GNU General Public License v3 (GPLv3)",
26 |             "Programming Language :: Python :: 3",
27 |             "Programming Language :: Python :: 3.8",
28 |         ],
29 |         url="https://github.com/bedapub/besca",
30 |         license="GPLv3",
31 |         author="BEDA community",
32 |         author_email="manuel.kohler@roche.com",
33 |         packages=find_packages(exclude=["devtools", "tests"]),
34 |         zip_safe=False,
35 |         package_data={
36 |             "besca.datasets.data": ["*.h5ad"],
37 |             "besca.st": ["*.css"],
38 |             "besca.datasets.nomenclature": ["*.tsv"],
39 |             "besca.datasets.mito_files": ["*.tsv"],
40 |             "besca.datasets.genesets": ["*.gmt", "*.tsv"],
41 |             "besca.datasets.homologs": ["*.tsv"],
42 |         },
43 |         install_requires=requires,
44 |     )
45 | 


--------------------------------------------------------------------------------
/tests/__init__.py:
--------------------------------------------------------------------------------
 1 | from besca import pl
 2 | from besca import tl
 3 | from besca import pp
 4 | from besca import st
 5 | from besca import datasets
 6 | from besca import export
 7 | from besca import Import
 8 | 
 9 | 
10 | from besca._helper import (
11 |     subset_adata,
12 |     convert_ensembl_to_symbol,
13 |     convert_symbol_to_ensembl,
14 |     get_raw,
15 |     get_ameans,
16 |     get_means,
17 |     concate_adata,
18 |     get_singlegenedf,
19 |     print_software_versions,
20 | )
21 | 
22 | from besca._notebook import (
23 |     save_notebook,
24 |     save_notebook_return_path,
25 |     convert_notebook_to_HTML,
26 | )
27 | 
28 | __all__ = [
29 |     "pl",
30 |     "tl",
31 |     "pp",
32 |     "st",
33 |     "datasets",
34 |     "export",
35 |     "Import",
36 |     "subset_adata",
37 |     "import",
38 |     "convert_ensembl_to_symbol",
39 |     "convert_symbol_to_ensembl",
40 |     "get_raw",
41 |     "get_ameans",
42 |     "get_means",
43 |     "concate_adata",
44 |     "get_singlegenedf",
45 |     "print_software_versions",
46 |     "save_notebook",
47 |     "save_notebook_return_path",
48 |     "convert_notebook_to_HTML",
49 | ]
50 | 
51 | from besca._version import get_versions
52 | 
53 | __version__ = get_versions()["version"]
54 | del get_versions
55 | 


--------------------------------------------------------------------------------
/tests/data/st/wrapper_funcs/labeling_test_CTL_OLD/labelings/celltype/celltype_labelinfo.tsv:
--------------------------------------------------------------------------------
1 | description	isPublic	isDefault	isExpert	isReference	method	annotated_version_of
2 | manual celltype annotation	FALSE	FALSE	TRUE	FALSE	MK	louvain
3 | 


--------------------------------------------------------------------------------
/tests/data/st/wrapper_funcs/labeling_test_CTL_OLD/labelings/celltype/labelinfo.tsv:
--------------------------------------------------------------------------------
1 | description	isPublic	isDefault	isExpert	isReference	method	annotated_version_of
2 | ctl_new	TRUE	FALSE	FALSE	TRUE	MK	-
3 | 


--------------------------------------------------------------------------------
/workbooks/README.md:
--------------------------------------------------------------------------------
 1 | # BESCA notebooks (and tutorials)
 2 | 
 3 | This directory includes the major notebooks to run 
 4 | - the standard workflow [standard_workflow_besca2.ipynb](https://github.com/bedapub/besca/blob/master/workbooks/standard_workflow_besca2.ipynb) 
 5 | - the Sig-Annot cell type annotation workflow [celltype_annotation_besca.ipynb](https://github.com/bedapub/besca/blob/master/workbooks/celltype_annotation_besca.ipynb)
 6 | 
 7 | Additional tutorials are described in the documentation: https://bedapub.github.io/besca/tutorials.html
 8 | 
 9 | The associated notebooks are available from here: https://github.com/bedapub/besca/tree/master/docs/source/tutorials
10 | 
11 | Basic tutorial notebooks:
12 | - [notebook1_data_processing_pbmc3k.ipynb](https://github.com/bedapub/besca/blob/master/docs/source/tutorials/notebook1_data_processing_pbmc3k.ipynb)
13 | - [notebook2_celltype_annotation_pbmc3k.ipynb](https://github.com/bedapub/besca/blob/master/docs/source/tutorials/notebook2_celltype_annotation_pbmc3k.ipynb)
14 | - [notebook3_batch_correction.ipynb](https://github.com/bedapub/besca/blob/master/docs/source/tutorials/notebook3_batch_correction.ipynb)
15 | - [scRNAseq_tutorial.ipynb](https://github.com/bedapub/besca/blob/master/docs/source/tutorials/scRNAseq_tutorial.ipynb)
16 | 
17 | Auto-annot tutorial notebook:
18 | - [auto_annot_tutorial.ipynb](https://github.com/bedapub/besca/blob/master/docs/source/tutorials/auto_annot_tutorial.ipynb)
19 | 
20 | Bescape notebooks:
21 | - [bescape_tutorial.ipynb](https://github.com/bedapub/besca/blob/master/docs/source/tutorials/bescape_tutorial.ipynb)
22 | - [adata_to_eset.ipynb](https://github.com/bedapub/besca/blob/master/docs/source/tutorials/adata_to_eset.ipynb)
23 | 
24 | Additional examples and notebooks are available from the Besca manuscript repository:
25 | https://github.com/bedapub/besca_publication_results
26 | 


--------------------------------------------------------------------------------
/workbooks/minimal_notebook.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "markdown",
 5 |    "metadata": {},
 6 |    "source": [
 7 |     "# Minimal notebook to test convert_notebook_to_HTML()"
 8 |    ]
 9 |   },
10 |   {
11 |    "cell_type": "code",
12 |    "execution_count": null,
13 |    "metadata": {},
14 |    "outputs": [],
15 |    "source": [
16 |     "import besca as bc"
17 |    ]
18 |   },
19 |   {
20 |    "cell_type": "code",
21 |    "execution_count": null,
22 |    "metadata": {},
23 |    "outputs": [],
24 |    "source": [
25 |     "bc.print_software_versions()"
26 |    ]
27 |   },
28 |   {
29 |    "cell_type": "code",
30 |    "execution_count": null,
31 |    "metadata": {},
32 |    "outputs": [],
33 |    "source": [
34 |     "bc.convert_notebook_to_HTML()"
35 |    ]
36 |   }
37 |  ],
38 |  "metadata": {
39 |   "kernelspec": {
40 |    "display_name": "Python 3",
41 |    "language": "python",
42 |    "name": "python3"
43 |   },
44 |   "language_info": {
45 |    "codemirror_mode": {
46 |     "name": "ipython",
47 |     "version": 3
48 |    },
49 |    "file_extension": ".py",
50 |    "mimetype": "text/x-python",
51 |    "name": "python",
52 |    "nbconvert_exporter": "python",
53 |    "pygments_lexer": "ipython3",
54 |    "version": "3.9.12"
55 |   }
56 |  },
57 |  "nbformat": 4,
58 |  "nbformat_minor": 4
59 | }
60 | 


--------------------------------------------------------------------------------