├── .gitignore ├── .vscode ├── launch.json └── settings.json ├── README.md ├── dataset ├── __init__.py ├── image │ ├── __init__.py │ ├── cifar.py │ ├── classification_dataset.py │ ├── fashion_mnist.py │ └── permuted_mnist.py └── text │ ├── enwik8.py │ ├── lm_dataset.py │ └── wikitext_word_level.py ├── framework ├── .gitignore ├── __init__.py ├── data_structures │ ├── __init__.py │ ├── dotdict.py │ └── vocabulary.py ├── helpers │ ├── __init__.py │ ├── argument_parser.py │ ├── distributed.py │ ├── saver.py │ ├── stopping_parallel_loop.py │ └── training_helper.py ├── loader │ ├── __init__.py │ ├── collate.py │ ├── dataset_merger.py │ ├── dataset_splitter.py │ └── sampler.py ├── utils │ ├── __init__.py │ ├── average.py │ ├── download.py │ ├── gpu_allocator.py │ ├── lockfile.py │ ├── lstm_init.py │ ├── parallel_map.py │ ├── port.py │ ├── process.py │ ├── seed.py │ ├── set_lr.py │ ├── time_meter.py │ └── universal.py └── visualize │ ├── __init__.py │ ├── plot.py │ └── tensorboard.py ├── interfaces ├── __init__.py ├── common.py ├── conv_classifier_interface.py ├── feedforward_image_classifier_interface.py ├── language_model_interface.py ├── model_interface.py └── result.py ├── main.py ├── models ├── __init__.py ├── feedforward.py └── rnn_language_model.py ├── paper ├── .gitignore ├── ff_as_attention │ ├── .gitignore │ ├── config.json │ ├── lib │ ├── plot_attention.py │ ├── plot_inputs.py │ └── print_predictive_power.py └── lib │ ├── __init__.py │ ├── common.py │ ├── config.py │ ├── cross_validate_stats.py │ ├── matplotlib_config.py │ ├── source.py │ └── stat_tracker.py ├── requirements.txt ├── run.py ├── sweeps └── ff_as_attention │ ├── ff_as_attention_aeshop.yaml │ ├── ff_as_attention_aeshop_always_reset.yaml │ ├── ff_as_attention_cifar10_10samples.yaml │ ├── ff_as_attention_mixed_ds_10samples.yaml │ ├── ff_as_attention_mnist_10samples.yaml │ ├── ff_as_attention_sequential_10samples.yaml │ ├── ff_as_attention_sequential_long.yaml │ └── ff_as_attention_wikitext2.yaml └── tasks ├── __init__.py ├── simple ├── __init__.py ├── ff_as_attention │ ├── __init__.py │ ├── cifar10_ff_attention.py │ ├── language_lstm_ff_attention.py │ ├── language_lstm_ff_attention_overfit.py │ ├── mnist_ff_attention.py │ ├── mnist_fmnist_ff_attention.py │ └── mnist_fmnist_sequential.py ├── language_model │ ├── __init__.py │ ├── aeshops_fables_lstm.py │ ├── enwik8_lstm.py │ └── wikitext2_lstm.py └── simple_task.py ├── task.py └── task_db.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/.gitignore -------------------------------------------------------------------------------- /.vscode/launch.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/.vscode/launch.json -------------------------------------------------------------------------------- /.vscode/settings.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/.vscode/settings.json -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/README.md -------------------------------------------------------------------------------- /dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/__init__.py -------------------------------------------------------------------------------- /dataset/image/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/image/__init__.py -------------------------------------------------------------------------------- /dataset/image/cifar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/image/cifar.py -------------------------------------------------------------------------------- /dataset/image/classification_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/image/classification_dataset.py -------------------------------------------------------------------------------- /dataset/image/fashion_mnist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/image/fashion_mnist.py -------------------------------------------------------------------------------- /dataset/image/permuted_mnist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/image/permuted_mnist.py -------------------------------------------------------------------------------- /dataset/text/enwik8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/text/enwik8.py -------------------------------------------------------------------------------- /dataset/text/lm_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/text/lm_dataset.py -------------------------------------------------------------------------------- /dataset/text/wikitext_word_level.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/dataset/text/wikitext_word_level.py -------------------------------------------------------------------------------- /framework/.gitignore: -------------------------------------------------------------------------------- 1 | .idea 2 | __pycache__ 3 | -------------------------------------------------------------------------------- /framework/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/__init__.py -------------------------------------------------------------------------------- /framework/data_structures/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/data_structures/__init__.py -------------------------------------------------------------------------------- /framework/data_structures/dotdict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/data_structures/dotdict.py -------------------------------------------------------------------------------- /framework/data_structures/vocabulary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/data_structures/vocabulary.py -------------------------------------------------------------------------------- /framework/helpers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/helpers/__init__.py -------------------------------------------------------------------------------- /framework/helpers/argument_parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/helpers/argument_parser.py -------------------------------------------------------------------------------- /framework/helpers/distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/helpers/distributed.py -------------------------------------------------------------------------------- /framework/helpers/saver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/helpers/saver.py -------------------------------------------------------------------------------- /framework/helpers/stopping_parallel_loop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/helpers/stopping_parallel_loop.py -------------------------------------------------------------------------------- /framework/helpers/training_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/helpers/training_helper.py -------------------------------------------------------------------------------- /framework/loader/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/loader/__init__.py -------------------------------------------------------------------------------- /framework/loader/collate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/loader/collate.py -------------------------------------------------------------------------------- /framework/loader/dataset_merger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/loader/dataset_merger.py -------------------------------------------------------------------------------- /framework/loader/dataset_splitter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/loader/dataset_splitter.py -------------------------------------------------------------------------------- /framework/loader/sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/loader/sampler.py -------------------------------------------------------------------------------- /framework/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/__init__.py -------------------------------------------------------------------------------- /framework/utils/average.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/average.py -------------------------------------------------------------------------------- /framework/utils/download.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/download.py -------------------------------------------------------------------------------- /framework/utils/gpu_allocator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/gpu_allocator.py -------------------------------------------------------------------------------- /framework/utils/lockfile.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/lockfile.py -------------------------------------------------------------------------------- /framework/utils/lstm_init.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/lstm_init.py -------------------------------------------------------------------------------- /framework/utils/parallel_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/parallel_map.py -------------------------------------------------------------------------------- /framework/utils/port.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/port.py -------------------------------------------------------------------------------- /framework/utils/process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/process.py -------------------------------------------------------------------------------- /framework/utils/seed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/seed.py -------------------------------------------------------------------------------- /framework/utils/set_lr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/set_lr.py -------------------------------------------------------------------------------- /framework/utils/time_meter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/time_meter.py -------------------------------------------------------------------------------- /framework/utils/universal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/utils/universal.py -------------------------------------------------------------------------------- /framework/visualize/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/visualize/__init__.py -------------------------------------------------------------------------------- /framework/visualize/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/visualize/plot.py -------------------------------------------------------------------------------- /framework/visualize/tensorboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/framework/visualize/tensorboard.py -------------------------------------------------------------------------------- /interfaces/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/interfaces/__init__.py -------------------------------------------------------------------------------- /interfaces/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/interfaces/common.py -------------------------------------------------------------------------------- /interfaces/conv_classifier_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/interfaces/conv_classifier_interface.py -------------------------------------------------------------------------------- /interfaces/feedforward_image_classifier_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/interfaces/feedforward_image_classifier_interface.py -------------------------------------------------------------------------------- /interfaces/language_model_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/interfaces/language_model_interface.py -------------------------------------------------------------------------------- /interfaces/model_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/interfaces/model_interface.py -------------------------------------------------------------------------------- /interfaces/result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/interfaces/result.py -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/main.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/models/__init__.py -------------------------------------------------------------------------------- /models/feedforward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/models/feedforward.py -------------------------------------------------------------------------------- /models/rnn_language_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/models/rnn_language_model.py -------------------------------------------------------------------------------- /paper/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/.gitignore -------------------------------------------------------------------------------- /paper/ff_as_attention/.gitignore: -------------------------------------------------------------------------------- 1 | out 2 | media 3 | cache -------------------------------------------------------------------------------- /paper/ff_as_attention/config.json: -------------------------------------------------------------------------------- 1 | { 2 | "wandb_project": "username/ff_as_attention" 3 | } 4 | -------------------------------------------------------------------------------- /paper/ff_as_attention/lib: -------------------------------------------------------------------------------- 1 | ../lib -------------------------------------------------------------------------------- /paper/ff_as_attention/plot_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/ff_as_attention/plot_attention.py -------------------------------------------------------------------------------- /paper/ff_as_attention/plot_inputs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/ff_as_attention/plot_inputs.py -------------------------------------------------------------------------------- /paper/ff_as_attention/print_predictive_power.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/ff_as_attention/print_predictive_power.py -------------------------------------------------------------------------------- /paper/lib/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/lib/__init__.py -------------------------------------------------------------------------------- /paper/lib/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/lib/common.py -------------------------------------------------------------------------------- /paper/lib/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/lib/config.py -------------------------------------------------------------------------------- /paper/lib/cross_validate_stats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/lib/cross_validate_stats.py -------------------------------------------------------------------------------- /paper/lib/matplotlib_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/lib/matplotlib_config.py -------------------------------------------------------------------------------- /paper/lib/source.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/lib/source.py -------------------------------------------------------------------------------- /paper/lib/stat_tracker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/paper/lib/stat_tracker.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/requirements.txt -------------------------------------------------------------------------------- /run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/run.py -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_aeshop.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_aeshop.yaml -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_aeshop_always_reset.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_aeshop_always_reset.yaml -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_cifar10_10samples.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_cifar10_10samples.yaml -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_mixed_ds_10samples.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_mixed_ds_10samples.yaml -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_mnist_10samples.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_mnist_10samples.yaml -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_sequential_10samples.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_sequential_10samples.yaml -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_sequential_long.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_sequential_long.yaml -------------------------------------------------------------------------------- /sweeps/ff_as_attention/ff_as_attention_wikitext2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/sweeps/ff_as_attention/ff_as_attention_wikitext2.yaml -------------------------------------------------------------------------------- /tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/__init__.py -------------------------------------------------------------------------------- /tasks/simple/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/__init__.py -------------------------------------------------------------------------------- /tasks/simple/ff_as_attention/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/ff_as_attention/__init__.py -------------------------------------------------------------------------------- /tasks/simple/ff_as_attention/cifar10_ff_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/ff_as_attention/cifar10_ff_attention.py -------------------------------------------------------------------------------- /tasks/simple/ff_as_attention/language_lstm_ff_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/ff_as_attention/language_lstm_ff_attention.py -------------------------------------------------------------------------------- /tasks/simple/ff_as_attention/language_lstm_ff_attention_overfit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/ff_as_attention/language_lstm_ff_attention_overfit.py -------------------------------------------------------------------------------- /tasks/simple/ff_as_attention/mnist_ff_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/ff_as_attention/mnist_ff_attention.py -------------------------------------------------------------------------------- /tasks/simple/ff_as_attention/mnist_fmnist_ff_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/ff_as_attention/mnist_fmnist_ff_attention.py -------------------------------------------------------------------------------- /tasks/simple/ff_as_attention/mnist_fmnist_sequential.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/ff_as_attention/mnist_fmnist_sequential.py -------------------------------------------------------------------------------- /tasks/simple/language_model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/language_model/__init__.py -------------------------------------------------------------------------------- /tasks/simple/language_model/aeshops_fables_lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/language_model/aeshops_fables_lstm.py -------------------------------------------------------------------------------- /tasks/simple/language_model/enwik8_lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/language_model/enwik8_lstm.py -------------------------------------------------------------------------------- /tasks/simple/language_model/wikitext2_lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/language_model/wikitext2_lstm.py -------------------------------------------------------------------------------- /tasks/simple/simple_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/simple/simple_task.py -------------------------------------------------------------------------------- /tasks/task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/task.py -------------------------------------------------------------------------------- /tasks/task_db.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/linear_layer_as_attention/HEAD/tasks/task_db.py --------------------------------------------------------------------------------