├── chat_gradio.py ├── config.py ├── dataloader.py ├── download_mmlu.py ├── evaluation.py ├── finetune.py ├── loss ├── instruct_retriever_tv2_110M_8B_loss1.28.txt ├── plot_instruct_loss.py ├── plot_loss.py ├── retriever_110M_100B_loss2.94.txt ├── retriever_35M_42B_loss3.29.txt ├── retriever_small_loss3.49.txt ├── retriever_small_step8w_batch256_loss3.48.txt ├── retriever_small_step8w_loss3.51.txt ├── retriever_small_step8w_mlp_soft_silu__intersize_loss3.40.txt ├── retriever_small_step8w_mlp_soft_silu__intersize_rotary_loss3.36.txt ├── retriever_small_step8w_mlp_soft_silu_loss3.44.txt ├── retriever_tv2_110M_78B_loss2.66.txt └── retriever_tv2_396M_96B_loss2.40.txt ├── main.py ├── mmlu_categories.py ├── model.py ├── preprocess.py ├── text.txt ├── tokenization.py ├── tokenization_v2.py └── tokenizer_models ├── tokenizer_300G.json ├── tokenizer_gwb.json ├── tokenizer_u32.json └── tokenizer_v2_600G.json /chat_gradio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/chat_gradio.py -------------------------------------------------------------------------------- /config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/config.py -------------------------------------------------------------------------------- /dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/dataloader.py -------------------------------------------------------------------------------- /download_mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/download_mmlu.py -------------------------------------------------------------------------------- /evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/evaluation.py -------------------------------------------------------------------------------- /finetune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/finetune.py -------------------------------------------------------------------------------- /loss/instruct_retriever_tv2_110M_8B_loss1.28.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/instruct_retriever_tv2_110M_8B_loss1.28.txt -------------------------------------------------------------------------------- /loss/plot_instruct_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/plot_instruct_loss.py -------------------------------------------------------------------------------- /loss/plot_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/plot_loss.py -------------------------------------------------------------------------------- /loss/retriever_110M_100B_loss2.94.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_110M_100B_loss2.94.txt -------------------------------------------------------------------------------- /loss/retriever_35M_42B_loss3.29.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_35M_42B_loss3.29.txt -------------------------------------------------------------------------------- /loss/retriever_small_loss3.49.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_small_loss3.49.txt -------------------------------------------------------------------------------- /loss/retriever_small_step8w_batch256_loss3.48.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_small_step8w_batch256_loss3.48.txt -------------------------------------------------------------------------------- /loss/retriever_small_step8w_loss3.51.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_small_step8w_loss3.51.txt -------------------------------------------------------------------------------- /loss/retriever_small_step8w_mlp_soft_silu__intersize_loss3.40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_small_step8w_mlp_soft_silu__intersize_loss3.40.txt -------------------------------------------------------------------------------- /loss/retriever_small_step8w_mlp_soft_silu__intersize_rotary_loss3.36.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_small_step8w_mlp_soft_silu__intersize_rotary_loss3.36.txt -------------------------------------------------------------------------------- /loss/retriever_small_step8w_mlp_soft_silu_loss3.44.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_small_step8w_mlp_soft_silu_loss3.44.txt -------------------------------------------------------------------------------- /loss/retriever_tv2_110M_78B_loss2.66.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_tv2_110M_78B_loss2.66.txt -------------------------------------------------------------------------------- /loss/retriever_tv2_396M_96B_loss2.40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/loss/retriever_tv2_396M_96B_loss2.40.txt -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/main.py -------------------------------------------------------------------------------- /mmlu_categories.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/mmlu_categories.py -------------------------------------------------------------------------------- /model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/model.py -------------------------------------------------------------------------------- /preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/preprocess.py -------------------------------------------------------------------------------- /text.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/text.txt -------------------------------------------------------------------------------- /tokenization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/tokenization.py -------------------------------------------------------------------------------- /tokenization_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/tokenization_v2.py -------------------------------------------------------------------------------- /tokenizer_models/tokenizer_300G.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/tokenizer_models/tokenizer_300G.json -------------------------------------------------------------------------------- /tokenizer_models/tokenizer_gwb.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/tokenizer_models/tokenizer_gwb.json -------------------------------------------------------------------------------- /tokenizer_models/tokenizer_u32.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/tokenizer_models/tokenizer_u32.json -------------------------------------------------------------------------------- /tokenizer_models/tokenizer_v2_600G.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaibowen/Retriever/HEAD/tokenizer_models/tokenizer_v2_600G.json --------------------------------------------------------------------------------