├── 1_run_mae.py ├── 2_train_sat.py ├── LICENSE ├── README.md ├── config ├── mae │ ├── mae_base.yaml │ ├── mae_small.yaml │ └── mae_tiny.yaml └── sat │ ├── balanced_sat_s_1s.yaml │ ├── balanced_sat_s_2s.yaml │ ├── balanced_sat_t_1s.yaml │ └── balanced_sat_t_2s.yaml ├── dataset.py ├── datasets ├── __init__.py ├── audioset │ ├── 1_download_audioset.sh │ └── 2_prepare_data.sh └── utils │ ├── dump_audio_to_hdf5.py │ └── prepare_label_list.py ├── inference.py ├── models ├── __init__.py ├── audiotransformer.py ├── checkpoints.py ├── layers.py └── mae.py ├── requirements.txt ├── samples ├── jkLRith2wcc.wav └── mg4kDY_hy6o.wav └── utils.py /1_run_mae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/1_run_mae.py -------------------------------------------------------------------------------- /2_train_sat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/2_train_sat.py -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/README.md -------------------------------------------------------------------------------- /config/mae/mae_base.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/config/mae/mae_base.yaml -------------------------------------------------------------------------------- /config/mae/mae_small.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/config/mae/mae_small.yaml -------------------------------------------------------------------------------- /config/mae/mae_tiny.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/config/mae/mae_tiny.yaml -------------------------------------------------------------------------------- /config/sat/balanced_sat_s_1s.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/config/sat/balanced_sat_s_1s.yaml -------------------------------------------------------------------------------- /config/sat/balanced_sat_s_2s.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/config/sat/balanced_sat_s_2s.yaml -------------------------------------------------------------------------------- /config/sat/balanced_sat_t_1s.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/config/sat/balanced_sat_t_1s.yaml -------------------------------------------------------------------------------- /config/sat/balanced_sat_t_2s.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/config/sat/balanced_sat_t_2s.yaml -------------------------------------------------------------------------------- /dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/dataset.py -------------------------------------------------------------------------------- /datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /datasets/audioset/1_download_audioset.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/datasets/audioset/1_download_audioset.sh -------------------------------------------------------------------------------- /datasets/audioset/2_prepare_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/datasets/audioset/2_prepare_data.sh -------------------------------------------------------------------------------- /datasets/utils/dump_audio_to_hdf5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/datasets/utils/dump_audio_to_hdf5.py -------------------------------------------------------------------------------- /datasets/utils/prepare_label_list.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/datasets/utils/prepare_label_list.py -------------------------------------------------------------------------------- /inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/inference.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/models/__init__.py -------------------------------------------------------------------------------- /models/audiotransformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/models/audiotransformer.py -------------------------------------------------------------------------------- /models/checkpoints.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/models/checkpoints.py -------------------------------------------------------------------------------- /models/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/models/layers.py -------------------------------------------------------------------------------- /models/mae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/models/mae.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/requirements.txt -------------------------------------------------------------------------------- /samples/jkLRith2wcc.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/samples/jkLRith2wcc.wav -------------------------------------------------------------------------------- /samples/mg4kDY_hy6o.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/samples/mg4kDY_hy6o.wav -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RicherMans/SAT/HEAD/utils.py --------------------------------------------------------------------------------