├── .gitignore ├── LICENSE ├── README.md ├── data_parallel.py ├── dataset ├── __init__.py ├── dm_math.py ├── double_op.py ├── helpers │ ├── __init__.py │ └── split_digits.py ├── image │ ├── __init__.py │ ├── cifar.py │ ├── classification_dataset.py │ ├── convert.py │ └── permuted_mnist.py ├── scan.py ├── sequence.py └── tuple_arithmetic.py ├── draw.py ├── framework ├── .gitignore ├── __init__.py ├── data_structures │ ├── __init__.py │ ├── dotdict.py │ └── vocabulary.py ├── helpers │ ├── __init__.py │ ├── argument_parser.py │ ├── saver.py │ └── training_helper.py ├── layers │ ├── __init__.py │ ├── gumbel_sigmoid.py │ └── positional_encoding.py ├── loader │ ├── __init__.py │ ├── collate.py │ └── sampler.py ├── utils │ ├── __init__.py │ ├── average.py │ ├── download.py │ ├── gpu_allocator.py │ ├── lockfile.py │ ├── lstm_init.py │ ├── parallel_map.py │ ├── port.py │ ├── process.py │ ├── seed.py │ ├── set_lr.py │ ├── time_meter.py │ └── universal.py └── visualize │ ├── __init__.py │ ├── plot.py │ └── tensorboard.py ├── grad_norm.py ├── interfaces ├── __init__.py ├── common.py ├── conv_classifier_interface.py ├── feedforward │ ├── __init__.py │ ├── add_mul.py │ └── tuple_arithmetic.py ├── feedforward_image_classifier_interface.py ├── model_interface.py ├── recurrent │ ├── __init__.py │ ├── add_mul.py │ ├── encoder_decoder_interface.py │ └── tuple_arithmetic.py ├── result.py └── transformer │ ├── __init__.py │ └── encoder_decoder_interface.py ├── layers ├── __init__.py ├── batch_ops.py ├── batchnorm.py ├── masked_conv2d.py ├── masked_layernorm.py ├── masked_linear.py ├── masked_lstm.py ├── masked_module.py └── transformer │ ├── __init__.py │ ├── multi_head_attention.py │ └── transformer.py ├── main.py ├── masked_model.py ├── models ├── __init__.py ├── conv.py ├── encoder_decoder.py ├── feedforward.py ├── lstm.py ├── resnet.py └── transformer_enc_dec.py ├── optimizer ├── __init__.py └── step_lr_sched.py ├── paper ├── .gitignore ├── config.json ├── lib │ ├── __init__.py │ ├── common.py │ ├── config.py │ ├── matplotlib_config.py │ ├── source.py │ └── stat_tracker.py ├── plot_addmul_confusion.py ├── plot_addmul_iou.py ├── plot_addmul_performance.py ├── plot_addmul_weight_proportion.py ├── plot_cifar10_confusion_diff.py ├── plot_cifar10_drop_per_class.py ├── plot_cifar10_drop_statistics.py ├── plot_dm_math.py ├── plot_halfmask.py ├── plot_mask_histogram.py ├── plot_mask_iou.py ├── plot_mask_weight_sensivity.py ├── plot_scan_accuracies.py ├── plot_scan_output_token_removed_percentage.py ├── plot_scan_removed_vs_baseline.py ├── plot_transfer_sharing.py ├── plot_tuple_iou.py ├── plot_tuple_performance.py ├── plot_weight_sharing_vs_size.py └── run_all.sh ├── requirements.txt ├── run.py ├── sweeps ├── addmul_feedforward.yaml ├── addmul_feedforward_big.yaml ├── addmul_feedforward_huge.yaml ├── addmul_ff_alpha_analysis.yaml ├── addmul_rnn.yaml ├── cifar10.yaml ├── cifar10_mask_stability.yaml ├── cifar10_no_dropout.yaml ├── cifar10_resnet.yaml ├── dm_math │ ├── dm_math_add_or_sub.yaml │ ├── dm_math_diff.yaml │ ├── dm_math_lin1d.yaml │ ├── dm_math_polycollect.yaml │ └── dm_math_sort.yaml ├── scan.yaml ├── scan_baseline.yaml ├── trafo_scan.yaml ├── transfer_sharing.yaml ├── transfer_sharing_prefer_old.yaml ├── transfer_sharing_prefer_old_even_more.yaml ├── tuple_feedforward_big.yaml ├── tuple_feedforward_big_copyweight.yaml ├── tuple_feedforward_big_first_full_mask.yaml ├── tuple_feedforward_small_halfmask.yaml ├── tuple_rnn.yaml └── tuple_rnn_first_full_mask.yaml └── tasks ├── __init__.py ├── add_mul.py ├── add_mul_ff.py ├── cifar10_class_removal.py ├── cifar10_cos_distance.py ├── cifar10_mask_stability.py ├── cifar10_resnet_high_performance.py ├── dm_math.py ├── permuted_mnist.py ├── scan.py ├── scan_transformer.py ├── task.py ├── transformer_task.py ├── tuple.py ├── tuple_ff.py └── tuple_ff_copyweight.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/README.md -------------------------------------------------------------------------------- /data_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/data_parallel.py -------------------------------------------------------------------------------- /dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/__init__.py -------------------------------------------------------------------------------- /dataset/dm_math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/dm_math.py -------------------------------------------------------------------------------- /dataset/double_op.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/double_op.py -------------------------------------------------------------------------------- /dataset/helpers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/helpers/__init__.py -------------------------------------------------------------------------------- /dataset/helpers/split_digits.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/helpers/split_digits.py -------------------------------------------------------------------------------- /dataset/image/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/image/__init__.py -------------------------------------------------------------------------------- /dataset/image/cifar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/image/cifar.py -------------------------------------------------------------------------------- /dataset/image/classification_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/image/classification_dataset.py -------------------------------------------------------------------------------- /dataset/image/convert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/image/convert.py -------------------------------------------------------------------------------- /dataset/image/permuted_mnist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/image/permuted_mnist.py -------------------------------------------------------------------------------- /dataset/scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/scan.py -------------------------------------------------------------------------------- /dataset/sequence.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/sequence.py -------------------------------------------------------------------------------- /dataset/tuple_arithmetic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/dataset/tuple_arithmetic.py -------------------------------------------------------------------------------- /draw.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/draw.py -------------------------------------------------------------------------------- /framework/.gitignore: -------------------------------------------------------------------------------- 1 | .idea 2 | __pycache__ 3 | -------------------------------------------------------------------------------- /framework/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/__init__.py -------------------------------------------------------------------------------- /framework/data_structures/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/data_structures/__init__.py -------------------------------------------------------------------------------- /framework/data_structures/dotdict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/data_structures/dotdict.py -------------------------------------------------------------------------------- /framework/data_structures/vocabulary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/data_structures/vocabulary.py -------------------------------------------------------------------------------- /framework/helpers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/helpers/__init__.py -------------------------------------------------------------------------------- /framework/helpers/argument_parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/helpers/argument_parser.py -------------------------------------------------------------------------------- /framework/helpers/saver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/helpers/saver.py -------------------------------------------------------------------------------- /framework/helpers/training_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/helpers/training_helper.py -------------------------------------------------------------------------------- /framework/layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/layers/__init__.py -------------------------------------------------------------------------------- /framework/layers/gumbel_sigmoid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/layers/gumbel_sigmoid.py -------------------------------------------------------------------------------- /framework/layers/positional_encoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/layers/positional_encoding.py -------------------------------------------------------------------------------- /framework/loader/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/loader/__init__.py -------------------------------------------------------------------------------- /framework/loader/collate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/loader/collate.py -------------------------------------------------------------------------------- /framework/loader/sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/loader/sampler.py -------------------------------------------------------------------------------- /framework/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/__init__.py -------------------------------------------------------------------------------- /framework/utils/average.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/average.py -------------------------------------------------------------------------------- /framework/utils/download.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/download.py -------------------------------------------------------------------------------- /framework/utils/gpu_allocator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/gpu_allocator.py -------------------------------------------------------------------------------- /framework/utils/lockfile.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/lockfile.py -------------------------------------------------------------------------------- /framework/utils/lstm_init.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/lstm_init.py -------------------------------------------------------------------------------- /framework/utils/parallel_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/parallel_map.py -------------------------------------------------------------------------------- /framework/utils/port.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/port.py -------------------------------------------------------------------------------- /framework/utils/process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/process.py -------------------------------------------------------------------------------- /framework/utils/seed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/seed.py -------------------------------------------------------------------------------- /framework/utils/set_lr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/set_lr.py -------------------------------------------------------------------------------- /framework/utils/time_meter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/time_meter.py -------------------------------------------------------------------------------- /framework/utils/universal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/utils/universal.py -------------------------------------------------------------------------------- /framework/visualize/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/visualize/__init__.py -------------------------------------------------------------------------------- /framework/visualize/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/visualize/plot.py -------------------------------------------------------------------------------- /framework/visualize/tensorboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/framework/visualize/tensorboard.py -------------------------------------------------------------------------------- /grad_norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/grad_norm.py -------------------------------------------------------------------------------- /interfaces/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/__init__.py -------------------------------------------------------------------------------- /interfaces/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/common.py -------------------------------------------------------------------------------- /interfaces/conv_classifier_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/conv_classifier_interface.py -------------------------------------------------------------------------------- /interfaces/feedforward/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/feedforward/__init__.py -------------------------------------------------------------------------------- /interfaces/feedforward/add_mul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/feedforward/add_mul.py -------------------------------------------------------------------------------- /interfaces/feedforward/tuple_arithmetic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/feedforward/tuple_arithmetic.py -------------------------------------------------------------------------------- /interfaces/feedforward_image_classifier_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/feedforward_image_classifier_interface.py -------------------------------------------------------------------------------- /interfaces/model_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/model_interface.py -------------------------------------------------------------------------------- /interfaces/recurrent/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/recurrent/__init__.py -------------------------------------------------------------------------------- /interfaces/recurrent/add_mul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/recurrent/add_mul.py -------------------------------------------------------------------------------- /interfaces/recurrent/encoder_decoder_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/recurrent/encoder_decoder_interface.py -------------------------------------------------------------------------------- /interfaces/recurrent/tuple_arithmetic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/recurrent/tuple_arithmetic.py -------------------------------------------------------------------------------- /interfaces/result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/result.py -------------------------------------------------------------------------------- /interfaces/transformer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/transformer/__init__.py -------------------------------------------------------------------------------- /interfaces/transformer/encoder_decoder_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/interfaces/transformer/encoder_decoder_interface.py -------------------------------------------------------------------------------- /layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/__init__.py -------------------------------------------------------------------------------- /layers/batch_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/batch_ops.py -------------------------------------------------------------------------------- /layers/batchnorm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/batchnorm.py -------------------------------------------------------------------------------- /layers/masked_conv2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/masked_conv2d.py -------------------------------------------------------------------------------- /layers/masked_layernorm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/masked_layernorm.py -------------------------------------------------------------------------------- /layers/masked_linear.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/masked_linear.py -------------------------------------------------------------------------------- /layers/masked_lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/masked_lstm.py -------------------------------------------------------------------------------- /layers/masked_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/masked_module.py -------------------------------------------------------------------------------- /layers/transformer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/transformer/__init__.py -------------------------------------------------------------------------------- /layers/transformer/multi_head_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/transformer/multi_head_attention.py -------------------------------------------------------------------------------- /layers/transformer/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/layers/transformer/transformer.py -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/main.py -------------------------------------------------------------------------------- /masked_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/masked_model.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/models/__init__.py -------------------------------------------------------------------------------- /models/conv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/models/conv.py -------------------------------------------------------------------------------- /models/encoder_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/models/encoder_decoder.py -------------------------------------------------------------------------------- /models/feedforward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/models/feedforward.py -------------------------------------------------------------------------------- /models/lstm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/models/lstm.py -------------------------------------------------------------------------------- /models/resnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/models/resnet.py -------------------------------------------------------------------------------- /models/transformer_enc_dec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/models/transformer_enc_dec.py -------------------------------------------------------------------------------- /optimizer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/optimizer/__init__.py -------------------------------------------------------------------------------- /optimizer/step_lr_sched.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/optimizer/step_lr_sched.py -------------------------------------------------------------------------------- /paper/.gitignore: -------------------------------------------------------------------------------- 1 | wandb 2 | out -------------------------------------------------------------------------------- /paper/config.json: -------------------------------------------------------------------------------- 1 | { 2 | "wandb_project": "username/modules" 3 | } 4 | -------------------------------------------------------------------------------- /paper/lib/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/lib/__init__.py -------------------------------------------------------------------------------- /paper/lib/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/lib/common.py -------------------------------------------------------------------------------- /paper/lib/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/lib/config.py -------------------------------------------------------------------------------- /paper/lib/matplotlib_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/lib/matplotlib_config.py -------------------------------------------------------------------------------- /paper/lib/source.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/lib/source.py -------------------------------------------------------------------------------- /paper/lib/stat_tracker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/lib/stat_tracker.py -------------------------------------------------------------------------------- /paper/plot_addmul_confusion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_addmul_confusion.py -------------------------------------------------------------------------------- /paper/plot_addmul_iou.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_addmul_iou.py -------------------------------------------------------------------------------- /paper/plot_addmul_performance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_addmul_performance.py -------------------------------------------------------------------------------- /paper/plot_addmul_weight_proportion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_addmul_weight_proportion.py -------------------------------------------------------------------------------- /paper/plot_cifar10_confusion_diff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_cifar10_confusion_diff.py -------------------------------------------------------------------------------- /paper/plot_cifar10_drop_per_class.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_cifar10_drop_per_class.py -------------------------------------------------------------------------------- /paper/plot_cifar10_drop_statistics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_cifar10_drop_statistics.py -------------------------------------------------------------------------------- /paper/plot_dm_math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_dm_math.py -------------------------------------------------------------------------------- /paper/plot_halfmask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_halfmask.py -------------------------------------------------------------------------------- /paper/plot_mask_histogram.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_mask_histogram.py -------------------------------------------------------------------------------- /paper/plot_mask_iou.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_mask_iou.py -------------------------------------------------------------------------------- /paper/plot_mask_weight_sensivity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_mask_weight_sensivity.py -------------------------------------------------------------------------------- /paper/plot_scan_accuracies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_scan_accuracies.py -------------------------------------------------------------------------------- /paper/plot_scan_output_token_removed_percentage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_scan_output_token_removed_percentage.py -------------------------------------------------------------------------------- /paper/plot_scan_removed_vs_baseline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_scan_removed_vs_baseline.py -------------------------------------------------------------------------------- /paper/plot_transfer_sharing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_transfer_sharing.py -------------------------------------------------------------------------------- /paper/plot_tuple_iou.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_tuple_iou.py -------------------------------------------------------------------------------- /paper/plot_tuple_performance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_tuple_performance.py -------------------------------------------------------------------------------- /paper/plot_weight_sharing_vs_size.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/plot_weight_sharing_vs_size.py -------------------------------------------------------------------------------- /paper/run_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/paper/run_all.sh -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/requirements.txt -------------------------------------------------------------------------------- /run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/run.py -------------------------------------------------------------------------------- /sweeps/addmul_feedforward.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/addmul_feedforward.yaml -------------------------------------------------------------------------------- /sweeps/addmul_feedforward_big.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/addmul_feedforward_big.yaml -------------------------------------------------------------------------------- /sweeps/addmul_feedforward_huge.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/addmul_feedforward_huge.yaml -------------------------------------------------------------------------------- /sweeps/addmul_ff_alpha_analysis.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/addmul_ff_alpha_analysis.yaml -------------------------------------------------------------------------------- /sweeps/addmul_rnn.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/addmul_rnn.yaml -------------------------------------------------------------------------------- /sweeps/cifar10.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/cifar10.yaml -------------------------------------------------------------------------------- /sweeps/cifar10_mask_stability.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/cifar10_mask_stability.yaml -------------------------------------------------------------------------------- /sweeps/cifar10_no_dropout.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/cifar10_no_dropout.yaml -------------------------------------------------------------------------------- /sweeps/cifar10_resnet.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/cifar10_resnet.yaml -------------------------------------------------------------------------------- /sweeps/dm_math/dm_math_add_or_sub.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/dm_math/dm_math_add_or_sub.yaml -------------------------------------------------------------------------------- /sweeps/dm_math/dm_math_diff.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/dm_math/dm_math_diff.yaml -------------------------------------------------------------------------------- /sweeps/dm_math/dm_math_lin1d.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/dm_math/dm_math_lin1d.yaml -------------------------------------------------------------------------------- /sweeps/dm_math/dm_math_polycollect.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/dm_math/dm_math_polycollect.yaml -------------------------------------------------------------------------------- /sweeps/dm_math/dm_math_sort.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/dm_math/dm_math_sort.yaml -------------------------------------------------------------------------------- /sweeps/scan.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/scan.yaml -------------------------------------------------------------------------------- /sweeps/scan_baseline.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/scan_baseline.yaml -------------------------------------------------------------------------------- /sweeps/trafo_scan.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/trafo_scan.yaml -------------------------------------------------------------------------------- /sweeps/transfer_sharing.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/transfer_sharing.yaml -------------------------------------------------------------------------------- /sweeps/transfer_sharing_prefer_old.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/transfer_sharing_prefer_old.yaml -------------------------------------------------------------------------------- /sweeps/transfer_sharing_prefer_old_even_more.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/transfer_sharing_prefer_old_even_more.yaml -------------------------------------------------------------------------------- /sweeps/tuple_feedforward_big.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/tuple_feedforward_big.yaml -------------------------------------------------------------------------------- /sweeps/tuple_feedforward_big_copyweight.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/tuple_feedforward_big_copyweight.yaml -------------------------------------------------------------------------------- /sweeps/tuple_feedforward_big_first_full_mask.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/tuple_feedforward_big_first_full_mask.yaml -------------------------------------------------------------------------------- /sweeps/tuple_feedforward_small_halfmask.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/tuple_feedforward_small_halfmask.yaml -------------------------------------------------------------------------------- /sweeps/tuple_rnn.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/tuple_rnn.yaml -------------------------------------------------------------------------------- /sweeps/tuple_rnn_first_full_mask.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/sweeps/tuple_rnn_first_full_mask.yaml -------------------------------------------------------------------------------- /tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/__init__.py -------------------------------------------------------------------------------- /tasks/add_mul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/add_mul.py -------------------------------------------------------------------------------- /tasks/add_mul_ff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/add_mul_ff.py -------------------------------------------------------------------------------- /tasks/cifar10_class_removal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/cifar10_class_removal.py -------------------------------------------------------------------------------- /tasks/cifar10_cos_distance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/cifar10_cos_distance.py -------------------------------------------------------------------------------- /tasks/cifar10_mask_stability.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/cifar10_mask_stability.py -------------------------------------------------------------------------------- /tasks/cifar10_resnet_high_performance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/cifar10_resnet_high_performance.py -------------------------------------------------------------------------------- /tasks/dm_math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/dm_math.py -------------------------------------------------------------------------------- /tasks/permuted_mnist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/permuted_mnist.py -------------------------------------------------------------------------------- /tasks/scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/scan.py -------------------------------------------------------------------------------- /tasks/scan_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/scan_transformer.py -------------------------------------------------------------------------------- /tasks/task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/task.py -------------------------------------------------------------------------------- /tasks/transformer_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/transformer_task.py -------------------------------------------------------------------------------- /tasks/tuple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/tuple.py -------------------------------------------------------------------------------- /tasks/tuple_ff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/tuple_ff.py -------------------------------------------------------------------------------- /tasks/tuple_ff_copyweight.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RobertCsordas/modules/HEAD/tasks/tuple_ff_copyweight.py --------------------------------------------------------------------------------