├── .cursor └── rules │ ├── sae_evaluation.mdc │ ├── sae_training.mdc │ └── sparse_autoencoder_overview.mdc ├── .cursorrules ├── .github └── workflows │ ├── checks.yml │ └── publish.yml ├── .gitignore ├── .gitmodules ├── .pre-commit-config.yaml ├── README.md ├── docs ├── assets │ └── images │ │ └── lm-saes-overview.svg ├── concepts.md ├── index.md ├── javascripts │ └── katex.js └── style-guide.md ├── examples ├── generate_pythia_activation_1d.py ├── generate_pythia_activation_2d.py ├── reproduce_evolution_of_concepts │ ├── README.md │ ├── analyze_pythia_crosscoder.py │ ├── generate_pythia_activations_1d.py │ ├── generate_pythia_activations_2d.py │ └── train_pythia_crosscoder.py ├── train_pythia_sae.py └── train_pythia_sae_with_pre_generated_activations.py ├── mkdocs.yml ├── pyproject.toml ├── scripts └── gen_ref_pages.py ├── server ├── .env.example ├── __init__.py └── app.py ├── src └── lm_saes │ ├── __init__.py │ ├── abstract_sae.py │ ├── activation │ ├── __init__.py │ ├── factory.py │ ├── processors │ │ ├── __init__.py │ │ ├── activation.py │ │ ├── cached_activation.py │ │ ├── core.py │ │ ├── huggingface.py │ │ └── token.py │ └── writer.py │ ├── activation_functions.py │ ├── analysis │ ├── __init__.py │ ├── direct_logit_attributor.py │ ├── feature_analyzer.py │ ├── feature_interpreter.py │ └── post_analysis │ │ ├── __init__.py │ │ ├── base.py │ │ ├── clt.py │ │ ├── crosscoder.py │ │ ├── generic.py │ │ └── lorsa.py │ ├── backend │ ├── __init__.py │ └── language_model.py │ ├── circuit │ ├── __init__.py │ ├── attribution.py │ ├── autointerp4graph.py │ ├── graph.py │ ├── replacement_model.py │ └── utils │ │ ├── argument_graph_file.py │ │ ├── create_graph_files.py │ │ ├── disk_offload.py │ │ └── load_transcoder_set.py │ ├── clt.py │ ├── config.py │ ├── crosscoder.py │ ├── database.py │ ├── entrypoint.py │ ├── evaluator.py │ ├── initializer.py │ ├── kernels │ ├── __init__.py │ ├── entrypoints.py │ └── kernels.py │ ├── lorsa.py │ ├── molt.py │ ├── optim.py │ ├── resource_loaders.py │ ├── runners │ ├── __init__.py │ ├── analyze.py │ ├── autointerp.py │ ├── eval.py │ ├── generate.py │ ├── topk_to_jumprelu_conversion.py │ ├── train.py │ └── utils.py │ ├── sae.py │ ├── trainer.py │ └── utils │ ├── __init__.py │ ├── bytes.py │ ├── discrete.py │ ├── distributed │ ├── __init__.py │ ├── dimmap.py │ ├── ops.py │ └── utils.py │ ├── huggingface.py │ ├── logging.py │ ├── math.py │ ├── misc.py │ ├── tensor_dict.py │ ├── timer.py │ └── topk_to_jumprelu_conversion.py ├── tests ├── __init__.py ├── integration │ ├── test_activation_factory.py │ ├── test_attribution.py │ └── test_train_sae.py └── unit │ ├── test_activation_processors.py │ ├── test_activation_processors_distributed.py │ ├── test_activation_writer.py │ ├── test_attribution.py │ ├── test_clt.py │ ├── test_clt_distributed.py │ ├── test_crosscoder.py │ ├── test_database.py │ ├── test_discrete_mapper.py │ ├── test_dla.py │ ├── test_evaluator.py │ ├── test_example.py │ ├── test_feature_analyzer.py │ ├── test_feature_interpreter.py │ ├── test_hf_backend.py │ ├── test_initializer.py │ ├── test_misc.py │ ├── test_sae.py │ └── test_util_distributed.py └── ui ├── .env.example ├── .eslintrc.cjs ├── .gitignore ├── .prettierrc.cjs ├── README.md ├── bun.lockb ├── components.json ├── index.html ├── package.json ├── postcss.config.js ├── public ├── circuits │ ├── addition │ │ ├── index.html │ │ ├── init-add-big-feature.js │ │ ├── init-add-connections.js │ │ ├── init.js │ │ ├── style.css │ │ └── util-add.js │ ├── attribution_graph │ │ ├── cg.css │ │ ├── gridsnap │ │ │ ├── gridsnap.css │ │ │ └── init-gridsnap.js │ │ ├── init-cg-button-container.js │ │ ├── init-cg-clerp-list.js │ │ ├── init-cg-feature-detail.js │ │ ├── init-cg-feature-scatter.js │ │ ├── init-cg-link-graph.js │ │ ├── init-cg-node-connections.js │ │ ├── init-cg-subgraph.js │ │ ├── init-cg.js │ │ └── util-cg.js │ ├── example_data │ │ └── capital-state-dallas.json │ ├── feature_examples │ │ ├── feature-examples.css │ │ ├── init-feature-examples-list.js │ │ ├── init-feature-examples-logits.js │ │ └── init-feature-examples.js │ ├── style.css │ └── util.js ├── openmoss.ico └── vite.svg ├── src ├── components │ ├── app │ │ ├── feature-preview.tsx │ │ ├── navbar.tsx │ │ ├── sample.tsx │ │ ├── section-navigator.tsx │ │ └── token.tsx │ ├── attn-head │ │ └── attn-head-card.tsx │ ├── circuits │ │ ├── circuit-styles.css │ │ ├── circuit-visualization.tsx │ │ ├── link-graph-container.tsx │ │ ├── link-graph │ │ │ ├── atomic-components.tsx │ │ │ ├── grid-lines.tsx │ │ │ ├── index.ts │ │ │ ├── link-graph.css │ │ │ ├── link-graph.tsx │ │ │ ├── links.tsx │ │ │ ├── nodes.tsx │ │ │ ├── row-backgrounds.tsx │ │ │ ├── token-labels.tsx │ │ │ ├── tooltips.tsx │ │ │ ├── types.ts │ │ │ ├── utils.ts │ │ │ └── y-axis.tsx │ │ ├── node-connections.tsx │ │ ├── static_js │ │ │ ├── d3.js │ │ │ ├── jetpack_2024-07-20.js │ │ │ └── npy_v0.js │ │ ├── style.css │ │ └── util.js │ ├── dictionary │ │ ├── dictionary-card.tsx │ │ └── sample.tsx │ ├── feature │ │ ├── feature-card.tsx │ │ ├── interpret.tsx │ │ └── sample.tsx │ ├── model │ │ └── model-card.tsx │ └── ui │ │ ├── accordion.tsx │ │ ├── badge.tsx │ │ ├── button.tsx │ │ ├── card.tsx │ │ ├── combobox.tsx │ │ ├── command.tsx │ │ ├── context-menu.tsx │ │ ├── data-table.tsx │ │ ├── dialog.tsx │ │ ├── dropdown-menu.tsx │ │ ├── hover-card.tsx │ │ ├── input.tsx │ │ ├── label.tsx │ │ ├── multiple-selector.tsx │ │ ├── pagination.tsx │ │ ├── popover.tsx │ │ ├── select.tsx │ │ ├── separator.tsx │ │ ├── switch.tsx │ │ ├── table.tsx │ │ ├── tabs.tsx │ │ ├── textarea.tsx │ │ ├── toggle.tsx │ │ └── tooltip.tsx ├── contexts │ └── AppStateContext.tsx ├── globals.css ├── lib │ └── utils.ts ├── main.tsx ├── routes │ ├── attn-heads │ │ └── page.tsx │ ├── bookmarks │ │ └── page.tsx │ ├── circuits │ │ └── page.tsx │ ├── dictionaries │ │ └── page.tsx │ ├── features │ │ └── page.tsx │ ├── models │ │ └── page.tsx │ └── page.tsx ├── tanstack.d.ts ├── types │ ├── attn-head.ts │ ├── dictionary.ts │ ├── feature.ts │ └── model.ts ├── utils │ ├── api.ts │ ├── array.ts │ ├── statePersistence.ts │ ├── style.ts │ └── token.ts └── vite-env.d.ts ├── tailwind.config.js ├── test-integration.html ├── tsconfig.json ├── tsconfig.node.json └── vite.config.ts /.cursor/rules/sae_evaluation.mdc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.cursor/rules/sae_evaluation.mdc -------------------------------------------------------------------------------- /.cursor/rules/sae_training.mdc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.cursor/rules/sae_training.mdc -------------------------------------------------------------------------------- /.cursor/rules/sparse_autoencoder_overview.mdc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.cursor/rules/sparse_autoencoder_overview.mdc -------------------------------------------------------------------------------- /.cursorrules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.cursorrules -------------------------------------------------------------------------------- /.github/workflows/checks.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.github/workflows/checks.yml -------------------------------------------------------------------------------- /.github/workflows/publish.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.github/workflows/publish.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.gitmodules -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/README.md -------------------------------------------------------------------------------- /docs/assets/images/lm-saes-overview.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/docs/assets/images/lm-saes-overview.svg -------------------------------------------------------------------------------- /docs/concepts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/docs/concepts.md -------------------------------------------------------------------------------- /docs/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/docs/index.md -------------------------------------------------------------------------------- /docs/javascripts/katex.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/docs/javascripts/katex.js -------------------------------------------------------------------------------- /docs/style-guide.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/docs/style-guide.md -------------------------------------------------------------------------------- /examples/generate_pythia_activation_1d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/generate_pythia_activation_1d.py -------------------------------------------------------------------------------- /examples/generate_pythia_activation_2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/generate_pythia_activation_2d.py -------------------------------------------------------------------------------- /examples/reproduce_evolution_of_concepts/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/reproduce_evolution_of_concepts/README.md -------------------------------------------------------------------------------- /examples/reproduce_evolution_of_concepts/analyze_pythia_crosscoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/reproduce_evolution_of_concepts/analyze_pythia_crosscoder.py -------------------------------------------------------------------------------- /examples/reproduce_evolution_of_concepts/generate_pythia_activations_1d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/reproduce_evolution_of_concepts/generate_pythia_activations_1d.py -------------------------------------------------------------------------------- /examples/reproduce_evolution_of_concepts/generate_pythia_activations_2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/reproduce_evolution_of_concepts/generate_pythia_activations_2d.py -------------------------------------------------------------------------------- /examples/reproduce_evolution_of_concepts/train_pythia_crosscoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/reproduce_evolution_of_concepts/train_pythia_crosscoder.py -------------------------------------------------------------------------------- /examples/train_pythia_sae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/train_pythia_sae.py -------------------------------------------------------------------------------- /examples/train_pythia_sae_with_pre_generated_activations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/examples/train_pythia_sae_with_pre_generated_activations.py -------------------------------------------------------------------------------- /mkdocs.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/mkdocs.yml -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/pyproject.toml -------------------------------------------------------------------------------- /scripts/gen_ref_pages.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/scripts/gen_ref_pages.py -------------------------------------------------------------------------------- /server/.env.example: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/server/.env.example -------------------------------------------------------------------------------- /server/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /server/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/server/app.py -------------------------------------------------------------------------------- /src/lm_saes/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/abstract_sae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/abstract_sae.py -------------------------------------------------------------------------------- /src/lm_saes/activation/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/activation/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/factory.py -------------------------------------------------------------------------------- /src/lm_saes/activation/processors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/processors/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/activation/processors/activation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/processors/activation.py -------------------------------------------------------------------------------- /src/lm_saes/activation/processors/cached_activation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/processors/cached_activation.py -------------------------------------------------------------------------------- /src/lm_saes/activation/processors/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/processors/core.py -------------------------------------------------------------------------------- /src/lm_saes/activation/processors/huggingface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/processors/huggingface.py -------------------------------------------------------------------------------- /src/lm_saes/activation/processors/token.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/processors/token.py -------------------------------------------------------------------------------- /src/lm_saes/activation/writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation/writer.py -------------------------------------------------------------------------------- /src/lm_saes/activation_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/activation_functions.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/direct_logit_attributor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/direct_logit_attributor.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/feature_analyzer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/feature_analyzer.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/feature_interpreter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/feature_interpreter.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/post_analysis/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/post_analysis/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/post_analysis/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/post_analysis/base.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/post_analysis/clt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/post_analysis/clt.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/post_analysis/crosscoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/post_analysis/crosscoder.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/post_analysis/generic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/post_analysis/generic.py -------------------------------------------------------------------------------- /src/lm_saes/analysis/post_analysis/lorsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/analysis/post_analysis/lorsa.py -------------------------------------------------------------------------------- /src/lm_saes/backend/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/backend/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/backend/language_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/backend/language_model.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/attribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/attribution.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/autointerp4graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/autointerp4graph.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/graph.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/replacement_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/replacement_model.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/utils/argument_graph_file.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/utils/argument_graph_file.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/utils/create_graph_files.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/utils/create_graph_files.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/utils/disk_offload.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/utils/disk_offload.py -------------------------------------------------------------------------------- /src/lm_saes/circuit/utils/load_transcoder_set.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/circuit/utils/load_transcoder_set.py -------------------------------------------------------------------------------- /src/lm_saes/clt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/clt.py -------------------------------------------------------------------------------- /src/lm_saes/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/config.py -------------------------------------------------------------------------------- /src/lm_saes/crosscoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/crosscoder.py -------------------------------------------------------------------------------- /src/lm_saes/database.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/database.py -------------------------------------------------------------------------------- /src/lm_saes/entrypoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/entrypoint.py -------------------------------------------------------------------------------- /src/lm_saes/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/evaluator.py -------------------------------------------------------------------------------- /src/lm_saes/initializer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/initializer.py -------------------------------------------------------------------------------- /src/lm_saes/kernels/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/kernels/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/kernels/entrypoints.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/kernels/entrypoints.py -------------------------------------------------------------------------------- /src/lm_saes/kernels/kernels.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/kernels/kernels.py -------------------------------------------------------------------------------- /src/lm_saes/lorsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/lorsa.py -------------------------------------------------------------------------------- /src/lm_saes/molt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/molt.py -------------------------------------------------------------------------------- /src/lm_saes/optim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/optim.py -------------------------------------------------------------------------------- /src/lm_saes/resource_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/resource_loaders.py -------------------------------------------------------------------------------- /src/lm_saes/runners/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/runners/analyze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/analyze.py -------------------------------------------------------------------------------- /src/lm_saes/runners/autointerp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/autointerp.py -------------------------------------------------------------------------------- /src/lm_saes/runners/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/eval.py -------------------------------------------------------------------------------- /src/lm_saes/runners/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/generate.py -------------------------------------------------------------------------------- /src/lm_saes/runners/topk_to_jumprelu_conversion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/topk_to_jumprelu_conversion.py -------------------------------------------------------------------------------- /src/lm_saes/runners/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/train.py -------------------------------------------------------------------------------- /src/lm_saes/runners/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/runners/utils.py -------------------------------------------------------------------------------- /src/lm_saes/sae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/sae.py -------------------------------------------------------------------------------- /src/lm_saes/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/trainer.py -------------------------------------------------------------------------------- /src/lm_saes/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/lm_saes/utils/bytes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/bytes.py -------------------------------------------------------------------------------- /src/lm_saes/utils/discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/discrete.py -------------------------------------------------------------------------------- /src/lm_saes/utils/distributed/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/distributed/__init__.py -------------------------------------------------------------------------------- /src/lm_saes/utils/distributed/dimmap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/distributed/dimmap.py -------------------------------------------------------------------------------- /src/lm_saes/utils/distributed/ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/distributed/ops.py -------------------------------------------------------------------------------- /src/lm_saes/utils/distributed/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/distributed/utils.py -------------------------------------------------------------------------------- /src/lm_saes/utils/huggingface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/huggingface.py -------------------------------------------------------------------------------- /src/lm_saes/utils/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/logging.py -------------------------------------------------------------------------------- /src/lm_saes/utils/math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/math.py -------------------------------------------------------------------------------- /src/lm_saes/utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/misc.py -------------------------------------------------------------------------------- /src/lm_saes/utils/tensor_dict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/tensor_dict.py -------------------------------------------------------------------------------- /src/lm_saes/utils/timer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/timer.py -------------------------------------------------------------------------------- /src/lm_saes/utils/topk_to_jumprelu_conversion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/src/lm_saes/utils/topk_to_jumprelu_conversion.py -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /tests/integration/test_activation_factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/integration/test_activation_factory.py -------------------------------------------------------------------------------- /tests/integration/test_attribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/integration/test_attribution.py -------------------------------------------------------------------------------- /tests/integration/test_train_sae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/integration/test_train_sae.py -------------------------------------------------------------------------------- /tests/unit/test_activation_processors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_activation_processors.py -------------------------------------------------------------------------------- /tests/unit/test_activation_processors_distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_activation_processors_distributed.py -------------------------------------------------------------------------------- /tests/unit/test_activation_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_activation_writer.py -------------------------------------------------------------------------------- /tests/unit/test_attribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_attribution.py -------------------------------------------------------------------------------- /tests/unit/test_clt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_clt.py -------------------------------------------------------------------------------- /tests/unit/test_clt_distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_clt_distributed.py -------------------------------------------------------------------------------- /tests/unit/test_crosscoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_crosscoder.py -------------------------------------------------------------------------------- /tests/unit/test_database.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_database.py -------------------------------------------------------------------------------- /tests/unit/test_discrete_mapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_discrete_mapper.py -------------------------------------------------------------------------------- /tests/unit/test_dla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_dla.py -------------------------------------------------------------------------------- /tests/unit/test_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_evaluator.py -------------------------------------------------------------------------------- /tests/unit/test_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_example.py -------------------------------------------------------------------------------- /tests/unit/test_feature_analyzer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_feature_analyzer.py -------------------------------------------------------------------------------- /tests/unit/test_feature_interpreter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_feature_interpreter.py -------------------------------------------------------------------------------- /tests/unit/test_hf_backend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_hf_backend.py -------------------------------------------------------------------------------- /tests/unit/test_initializer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_initializer.py -------------------------------------------------------------------------------- /tests/unit/test_misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_misc.py -------------------------------------------------------------------------------- /tests/unit/test_sae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_sae.py -------------------------------------------------------------------------------- /tests/unit/test_util_distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/tests/unit/test_util_distributed.py -------------------------------------------------------------------------------- /ui/.env.example: -------------------------------------------------------------------------------- 1 | VITE_BACKEND_URL=http://localhost:24577 -------------------------------------------------------------------------------- /ui/.eslintrc.cjs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/.eslintrc.cjs -------------------------------------------------------------------------------- /ui/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/.gitignore -------------------------------------------------------------------------------- /ui/.prettierrc.cjs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/.prettierrc.cjs -------------------------------------------------------------------------------- /ui/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/README.md -------------------------------------------------------------------------------- /ui/bun.lockb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/bun.lockb -------------------------------------------------------------------------------- /ui/components.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/components.json -------------------------------------------------------------------------------- /ui/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/index.html -------------------------------------------------------------------------------- /ui/package.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/package.json -------------------------------------------------------------------------------- /ui/postcss.config.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/postcss.config.js -------------------------------------------------------------------------------- /ui/public/circuits/addition/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/addition/index.html -------------------------------------------------------------------------------- /ui/public/circuits/addition/init-add-big-feature.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/addition/init-add-big-feature.js -------------------------------------------------------------------------------- /ui/public/circuits/addition/init-add-connections.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/addition/init-add-connections.js -------------------------------------------------------------------------------- /ui/public/circuits/addition/init.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/addition/init.js -------------------------------------------------------------------------------- /ui/public/circuits/addition/style.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/addition/style.css -------------------------------------------------------------------------------- /ui/public/circuits/addition/util-add.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/addition/util-add.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/cg.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/cg.css -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/gridsnap/gridsnap.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/gridsnap/gridsnap.css -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/gridsnap/init-gridsnap.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/gridsnap/init-gridsnap.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg-button-container.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg-button-container.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg-clerp-list.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg-clerp-list.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg-feature-detail.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg-feature-detail.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg-feature-scatter.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg-feature-scatter.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg-link-graph.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg-link-graph.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg-node-connections.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg-node-connections.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg-subgraph.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg-subgraph.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/init-cg.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/init-cg.js -------------------------------------------------------------------------------- /ui/public/circuits/attribution_graph/util-cg.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/attribution_graph/util-cg.js -------------------------------------------------------------------------------- /ui/public/circuits/example_data/capital-state-dallas.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/example_data/capital-state-dallas.json -------------------------------------------------------------------------------- /ui/public/circuits/feature_examples/feature-examples.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/feature_examples/feature-examples.css -------------------------------------------------------------------------------- /ui/public/circuits/feature_examples/init-feature-examples-list.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/feature_examples/init-feature-examples-list.js -------------------------------------------------------------------------------- /ui/public/circuits/feature_examples/init-feature-examples-logits.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/feature_examples/init-feature-examples-logits.js -------------------------------------------------------------------------------- /ui/public/circuits/feature_examples/init-feature-examples.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/feature_examples/init-feature-examples.js -------------------------------------------------------------------------------- /ui/public/circuits/style.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/style.css -------------------------------------------------------------------------------- /ui/public/circuits/util.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/circuits/util.js -------------------------------------------------------------------------------- /ui/public/openmoss.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/openmoss.ico -------------------------------------------------------------------------------- /ui/public/vite.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/public/vite.svg -------------------------------------------------------------------------------- /ui/src/components/app/feature-preview.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/app/feature-preview.tsx -------------------------------------------------------------------------------- /ui/src/components/app/navbar.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/app/navbar.tsx -------------------------------------------------------------------------------- /ui/src/components/app/sample.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/app/sample.tsx -------------------------------------------------------------------------------- /ui/src/components/app/section-navigator.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/app/section-navigator.tsx -------------------------------------------------------------------------------- /ui/src/components/app/token.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/app/token.tsx -------------------------------------------------------------------------------- /ui/src/components/attn-head/attn-head-card.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/attn-head/attn-head-card.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/circuit-styles.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/circuit-styles.css -------------------------------------------------------------------------------- /ui/src/components/circuits/circuit-visualization.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/circuit-visualization.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph-container.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph-container.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/atomic-components.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/atomic-components.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/grid-lines.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/grid-lines.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/index.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/index.ts -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/link-graph.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/link-graph.css -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/link-graph.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/link-graph.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/links.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/links.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/nodes.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/nodes.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/row-backgrounds.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/row-backgrounds.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/token-labels.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/token-labels.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/tooltips.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/tooltips.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/types.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/types.ts -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/utils.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/utils.ts -------------------------------------------------------------------------------- /ui/src/components/circuits/link-graph/y-axis.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/link-graph/y-axis.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/node-connections.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/node-connections.tsx -------------------------------------------------------------------------------- /ui/src/components/circuits/static_js/d3.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/static_js/d3.js -------------------------------------------------------------------------------- /ui/src/components/circuits/static_js/jetpack_2024-07-20.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/static_js/jetpack_2024-07-20.js -------------------------------------------------------------------------------- /ui/src/components/circuits/static_js/npy_v0.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/static_js/npy_v0.js -------------------------------------------------------------------------------- /ui/src/components/circuits/style.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/style.css -------------------------------------------------------------------------------- /ui/src/components/circuits/util.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/circuits/util.js -------------------------------------------------------------------------------- /ui/src/components/dictionary/dictionary-card.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/dictionary/dictionary-card.tsx -------------------------------------------------------------------------------- /ui/src/components/dictionary/sample.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/dictionary/sample.tsx -------------------------------------------------------------------------------- /ui/src/components/feature/feature-card.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/feature/feature-card.tsx -------------------------------------------------------------------------------- /ui/src/components/feature/interpret.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/feature/interpret.tsx -------------------------------------------------------------------------------- /ui/src/components/feature/sample.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/feature/sample.tsx -------------------------------------------------------------------------------- /ui/src/components/model/model-card.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/model/model-card.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/accordion.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/accordion.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/badge.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/badge.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/button.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/button.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/card.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/card.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/combobox.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/combobox.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/command.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/command.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/context-menu.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/context-menu.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/data-table.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/data-table.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/dialog.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/dialog.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/dropdown-menu.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/dropdown-menu.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/hover-card.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/hover-card.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/input.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/input.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/label.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/label.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/multiple-selector.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/multiple-selector.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/pagination.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/pagination.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/popover.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/popover.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/select.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/select.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/separator.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/separator.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/switch.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/switch.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/table.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/table.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/tabs.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/tabs.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/textarea.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/textarea.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/toggle.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/toggle.tsx -------------------------------------------------------------------------------- /ui/src/components/ui/tooltip.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/components/ui/tooltip.tsx -------------------------------------------------------------------------------- /ui/src/contexts/AppStateContext.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/contexts/AppStateContext.tsx -------------------------------------------------------------------------------- /ui/src/globals.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/globals.css -------------------------------------------------------------------------------- /ui/src/lib/utils.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/lib/utils.ts -------------------------------------------------------------------------------- /ui/src/main.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/main.tsx -------------------------------------------------------------------------------- /ui/src/routes/attn-heads/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/routes/attn-heads/page.tsx -------------------------------------------------------------------------------- /ui/src/routes/bookmarks/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/routes/bookmarks/page.tsx -------------------------------------------------------------------------------- /ui/src/routes/circuits/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/routes/circuits/page.tsx -------------------------------------------------------------------------------- /ui/src/routes/dictionaries/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/routes/dictionaries/page.tsx -------------------------------------------------------------------------------- /ui/src/routes/features/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/routes/features/page.tsx -------------------------------------------------------------------------------- /ui/src/routes/models/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/routes/models/page.tsx -------------------------------------------------------------------------------- /ui/src/routes/page.tsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/routes/page.tsx -------------------------------------------------------------------------------- /ui/src/tanstack.d.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/tanstack.d.ts -------------------------------------------------------------------------------- /ui/src/types/attn-head.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/types/attn-head.ts -------------------------------------------------------------------------------- /ui/src/types/dictionary.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/types/dictionary.ts -------------------------------------------------------------------------------- /ui/src/types/feature.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/types/feature.ts -------------------------------------------------------------------------------- /ui/src/types/model.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/types/model.ts -------------------------------------------------------------------------------- /ui/src/utils/api.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/utils/api.ts -------------------------------------------------------------------------------- /ui/src/utils/array.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/utils/array.ts -------------------------------------------------------------------------------- /ui/src/utils/statePersistence.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/utils/statePersistence.ts -------------------------------------------------------------------------------- /ui/src/utils/style.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/utils/style.ts -------------------------------------------------------------------------------- /ui/src/utils/token.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/src/utils/token.ts -------------------------------------------------------------------------------- /ui/src/vite-env.d.ts: -------------------------------------------------------------------------------- 1 | /// 2 | -------------------------------------------------------------------------------- /ui/tailwind.config.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/tailwind.config.js -------------------------------------------------------------------------------- /ui/test-integration.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/test-integration.html -------------------------------------------------------------------------------- /ui/tsconfig.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/tsconfig.json -------------------------------------------------------------------------------- /ui/tsconfig.node.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/tsconfig.node.json -------------------------------------------------------------------------------- /ui/vite.config.ts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMOSS/Language-Model-SAEs/HEAD/ui/vite.config.ts --------------------------------------------------------------------------------