├── .github └── workflows │ ├── autoblack.yml │ └── sphinx.yml ├── LICENSE ├── README.md ├── clap ├── __init__.py ├── datasets.py ├── layers │ ├── __init__.py │ ├── attentions │ │ ├── __init__.py │ │ ├── attention.py │ │ ├── cvt_attention.py │ │ └── talking_heads.py │ ├── feedforwards │ │ ├── __init__.py │ │ ├── ff.py │ │ └── leff.py │ ├── normalizations │ │ ├── __init__.py │ │ └── layerscale.py │ ├── position_embed.py │ ├── regularization │ │ ├── __init__.py │ │ └── stochastic_depth.py │ ├── squeeze_excite.py │ └── stems │ │ ├── __init__.py │ │ ├── image_to_token.py │ │ └── patch_embed.py ├── models.py └── trunks │ ├── __init__.py │ ├── cait.py │ ├── create_trunk.py │ ├── mlp_mixer.py │ ├── tnt.py │ ├── transformer.py │ └── vit.py ├── configs ├── model │ ├── audio │ │ ├── cait.yaml │ │ ├── mixer.yaml │ │ ├── tnt.yaml │ │ └── vit.yaml │ └── text │ │ └── transformer.yaml ├── optimizer │ └── standard.yaml ├── preprocessing │ └── dataset │ │ └── commonvoice.yaml └── training │ └── standard.yaml ├── preprocess.py ├── setup.py └── train.py /.github/workflows/autoblack.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/.github/workflows/autoblack.yml -------------------------------------------------------------------------------- /.github/workflows/sphinx.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/.github/workflows/sphinx.yml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/README.md -------------------------------------------------------------------------------- /clap/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/__init__.py -------------------------------------------------------------------------------- /clap/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/datasets.py -------------------------------------------------------------------------------- /clap/layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/__init__.py -------------------------------------------------------------------------------- /clap/layers/attentions/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/attentions/__init__.py -------------------------------------------------------------------------------- /clap/layers/attentions/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/attentions/attention.py -------------------------------------------------------------------------------- /clap/layers/attentions/cvt_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/attentions/cvt_attention.py -------------------------------------------------------------------------------- /clap/layers/attentions/talking_heads.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/attentions/talking_heads.py -------------------------------------------------------------------------------- /clap/layers/feedforwards/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/feedforwards/__init__.py -------------------------------------------------------------------------------- /clap/layers/feedforwards/ff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/feedforwards/ff.py -------------------------------------------------------------------------------- /clap/layers/feedforwards/leff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/feedforwards/leff.py -------------------------------------------------------------------------------- /clap/layers/normalizations/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/normalizations/__init__.py -------------------------------------------------------------------------------- /clap/layers/normalizations/layerscale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/normalizations/layerscale.py -------------------------------------------------------------------------------- /clap/layers/position_embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/position_embed.py -------------------------------------------------------------------------------- /clap/layers/regularization/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/regularization/__init__.py -------------------------------------------------------------------------------- /clap/layers/regularization/stochastic_depth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/regularization/stochastic_depth.py -------------------------------------------------------------------------------- /clap/layers/squeeze_excite.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/squeeze_excite.py -------------------------------------------------------------------------------- /clap/layers/stems/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/stems/__init__.py -------------------------------------------------------------------------------- /clap/layers/stems/image_to_token.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/stems/image_to_token.py -------------------------------------------------------------------------------- /clap/layers/stems/patch_embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/layers/stems/patch_embed.py -------------------------------------------------------------------------------- /clap/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/models.py -------------------------------------------------------------------------------- /clap/trunks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/trunks/__init__.py -------------------------------------------------------------------------------- /clap/trunks/cait.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/trunks/cait.py -------------------------------------------------------------------------------- /clap/trunks/create_trunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/trunks/create_trunk.py -------------------------------------------------------------------------------- /clap/trunks/mlp_mixer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/trunks/mlp_mixer.py -------------------------------------------------------------------------------- /clap/trunks/tnt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/trunks/tnt.py -------------------------------------------------------------------------------- /clap/trunks/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/trunks/transformer.py -------------------------------------------------------------------------------- /clap/trunks/vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/clap/trunks/vit.py -------------------------------------------------------------------------------- /configs/model/audio/cait.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/model/audio/cait.yaml -------------------------------------------------------------------------------- /configs/model/audio/mixer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/model/audio/mixer.yaml -------------------------------------------------------------------------------- /configs/model/audio/tnt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/model/audio/tnt.yaml -------------------------------------------------------------------------------- /configs/model/audio/vit.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/model/audio/vit.yaml -------------------------------------------------------------------------------- /configs/model/text/transformer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/model/text/transformer.yaml -------------------------------------------------------------------------------- /configs/optimizer/standard.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/optimizer/standard.yaml -------------------------------------------------------------------------------- /configs/preprocessing/dataset/commonvoice.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/preprocessing/dataset/commonvoice.yaml -------------------------------------------------------------------------------- /configs/training/standard.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/configs/training/standard.yaml -------------------------------------------------------------------------------- /preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/preprocess.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/setup.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cfoster0/CLAP/HEAD/train.py --------------------------------------------------------------------------------