├── .gitattributes ├── .gitignore ├── LICENSE ├── NOTICE ├── README.md ├── configs ├── gpt2_tiny_v1.json ├── gpt_neo_small_v1.json ├── gpt_neo_small_v2.json ├── gpt_neo_tiny_v1.json └── gpt_neo_tiny_v2.json ├── data_processing ├── calc_ngrams.py ├── clean_ficbook.py ├── convert_math.py ├── convert_mc4.py ├── convert_opensubtitles.py ├── convert_pikabu.py ├── convert_wiki.py ├── convert_yandex_q.py ├── create_ficbook.py ├── create_habr.py ├── create_librusec.py ├── create_ru_news.py ├── create_stackoverflow.py ├── create_stihi.py ├── exact_undup.py ├── filter_with_tokenizer.py ├── hf_to_instruct.py ├── lang_detector.py ├── merge.py ├── parse_fb2.py ├── parse_zip_fb2.py ├── requirements.txt ├── run.sh ├── save_hf.py ├── save_mc4.py ├── split.py ├── undup.py └── util.py ├── requirements.txt ├── resources ├── mc4_bad_hosts.txt ├── mc4_good_hosts.txt ├── mc4_news_hosts.txt └── mc4_ru_bad_words.txt ├── rulm ├── generate.py ├── jsonl_loader.py ├── preprocess.py ├── train.py ├── train_tokenizer.py └── util.py ├── self_instruct ├── .gitattributes ├── README.md ├── configs │ ├── fred_deepspeed.json │ ├── gigasaiga_13b.json │ ├── llama2_13b_rsg.json │ ├── llama2_13b_rsg_rcb.json │ ├── llama2_13b_rsg_rucos.json │ ├── llama2_13b_rsg_russe.json │ ├── llama2_13b_rsg_terra.json │ ├── llama_13b_lora.json │ ├── llama_13b_rsg.json │ ├── llama_13b_rsg_rucos.json │ ├── llama_13b_rsg_russe.json │ ├── llama_7b_lora.json │ ├── mistral_7b_128k.json │ ├── mistral_7b_rsg.json │ ├── mistral_7b_rsg_danetqa.json │ ├── mistral_7b_rsg_parus.json │ ├── mistral_7b_rsg_rucos.json │ ├── mistral_7b_rsg_russe.json │ ├── mistral_7b_rsg_terra.json │ ├── mpt_30b.json │ ├── mpt_7b_8k.json │ ├── mpt_7b_storywriter.json │ ├── mt0_large_deepspeed.json │ ├── mt0_xl_lora.json │ ├── mt0_xxl_deepspeed.json │ ├── mt0_xxl_mt_lora.json │ ├── rugpt_large_plain.json │ ├── rugpt_medium_plain.json │ ├── rut5_base_plain.json │ ├── rut5_large_plain.json │ ├── saicuna_13b.json │ ├── saiga2_13b.json │ ├── saiga2_70b.json │ ├── saiga2_7b.json │ ├── saiga_13b.json │ ├── saiga_13b_rsg.json │ ├── saiga_13b_rsg_parus.json │ ├── saiga_13b_rsg_rucos.json │ ├── saiga_13b_rsg_russe.json │ ├── saiga_13b_rsg_rwsd.json │ ├── saiga_30b.json │ ├── saiga_30b_4bit.json │ ├── saiga_65b_4bit.json │ ├── saiga_7b.json │ ├── saiga_aya23_8b_m1.json │ ├── saiga_kto.json │ ├── saiga_llama3_8b.json │ ├── saiga_llama3_8b_galore.json │ ├── saiga_llama3_8b_lm_head.json │ ├── saiga_llama3_8b_m1.json │ ├── saiga_llama3_8b_m2.json │ ├── saiga_llama3_8b_m3.json │ ├── saiga_llama3_8b_sfr.json │ ├── saiga_mistral_7b.json │ ├── saiga_orpo.json │ ├── saiga_reward.json │ └── xglm_3B_deepspeed.json ├── crowd │ ├── aggregate.py │ ├── examples │ │ ├── honey.jsonl │ │ └── training.json │ ├── pool_settings.json │ ├── settings.json │ └── upload.py ├── data │ ├── .gitattributes │ ├── en_chargen_seed.jsonl │ ├── gpt4_evals │ │ └── saiga_vs_vicuna.jsonl │ ├── lmsys_clean_ru_queries_chatgpt_3_5_answers.jsonl │ ├── lmsys_clean_ru_queries_chatgpt_4_answers.jsonl │ ├── lmsys_clean_ru_queries_llama_3_8b_answers.jsonl │ ├── lmsys_clean_ru_queries_saiga_llama3_8b_answers.jsonl │ ├── lmsys_clean_ru_queries_suzume_answers.jsonl │ ├── output.json │ ├── preferences_prompts.jsonl │ ├── preferences_prompts_gemma2_9b_it_abliterated_answers.jsonl │ ├── preferences_prompts_gpt4_4o_answers.jsonl │ ├── preferences_prompts_saiga_gemma2_9b_sft_m2_d8_answers.jsonl │ ├── preferences_prompts_saiga_llama3_8b_v6_answers.jsonl │ ├── preferences_prompts_saiga_phi3_medium_sft_m1_d2_awq_4bit_answers.jsonl │ ├── ru_alpaca_seed_tasks.jsonl │ ├── ru_chargen_seed.jsonl │ ├── saiga_bot_user_multiturn_prompts.jsonl │ ├── saiga_bot_user_multiturn_prompts_aya_23_8b_answers.jsonl │ ├── saiga_bot_user_multiturn_prompts_chatgpt_3_5_turbo_answers.jsonl │ ├── saiga_bot_user_multiturn_prompts_gpt4_4o_answers.jsonl │ ├── saiga_bot_user_multiturn_prompts_llama3_8b_answers.jsonl │ ├── saiga_bot_user_multiturn_prompts_saiga_llama3_8b_v4_answers.jsonl │ ├── saiga_bot_user_multiturn_prompts_saiga_llama3_8b_v5_answers.jsonl │ ├── saiga_bot_user_multiturn_prompts_sfr_answers.jsonl │ ├── tasks.jsonl │ ├── tasks_aya_23_8b_answers.jsonl │ ├── tasks_chatgpt_3_5_turbo_answers.jsonl │ ├── tasks_chatgpt_4_turbo_answers.jsonl │ ├── tasks_gemma_2_9b_it_abliterated_answers.jsonl │ ├── tasks_gemma_2_9b_it_abliterated_v2_answers.jsonl │ ├── tasks_gemma_2_9b_it_answers.jsonl │ ├── tasks_llama3_70b_answers.jsonl │ ├── tasks_llama3_8b_answers.jsonl │ ├── tasks_saicuna_13b_answers.jsonl │ ├── tasks_saiga2_13b_answers.jsonl │ ├── tasks_saiga2_7b_answers.jsonl │ ├── tasks_saiga_aya_23_35b_sft_m1_d5_answers.jsonl │ ├── tasks_saiga_aya_23_35b_sft_m1_d5_awq_4bit_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m2_d7_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d10_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d11_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d12_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d9_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_kto_m1_d13_answers.jsonl │ ├── tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_kto_m2_d13_answers.jsonl │ ├── tasks_saiga_gemma2_9b_sft_m1_d7_answers.jsonl │ ├── tasks_saiga_gemma2_9b_sft_m2_d8_answers.jsonl │ ├── tasks_saiga_kto_v4_answers.json │ ├── tasks_saiga_kto_v4_answers.jsonl │ ├── tasks_saiga_kto_v5_answers.jsonl │ ├── tasks_saiga_llama3_70b_sft_m1_d5_abliterated_answers.jsonl │ ├── tasks_saiga_llama3_70b_sft_m1_d5_abliterated_awq_4bit_answers.jsonl │ ├── tasks_saiga_llama3_70b_sft_m1_d5_abliterated_gptq_3bit_answers.jsonl │ ├── tasks_saiga_llama3_70b_sft_m1_d5_abliterated_gptq_4bit_answers.jsonl │ ├── tasks_saiga_llama3_70b_sft_m1_d5_abliterated_kto_m1_d2_answers.jsonl │ ├── tasks_saiga_llama3_70b_sft_m1_d5_abliterated_kto_m1_d2_awq_4bit_answers.jsonl │ ├── tasks_saiga_llama3_70b_sft_m1_d5_answers.jsonl │ ├── tasks_saiga_llama3_8b_abliterated_sft_m11_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_abliterated_sft_m11_d7_kto_m7_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_answers.jsonl │ ├── tasks_saiga_llama3_8b_kto_m1_d2_answers.jsonl │ ├── tasks_saiga_llama3_8b_m1_d1_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m10_d1_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m10_d1_kto_m2_d2_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_abliterated_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m3_d2_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d2_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d3_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d4_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m6_d5_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m6_d6_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d5_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d7_abliterated_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d7_abliterated_dpo_m1_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d7_abliterated_dpo_m2_d8_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d7_abliterated_kto_m5_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d7_abliterated_kto_m7_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m11_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m12_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m13_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m14_d7_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m3_d4_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m5_d1_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m5_d2_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m6_d1_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m7_d1_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m8_d1_answers.jsonl │ ├── tasks_saiga_llama3_8b_sft_m9_d1_answers.jsonl │ ├── tasks_saiga_llama3_8b_slim_answers.jsonl │ ├── tasks_saiga_llama3_8b_v4_answers.jsonl │ ├── tasks_saiga_llama3_8b_v5_vllm_answers.jsonl │ ├── tasks_saiga_mistral_7b_answers.jsonl │ ├── tasks_saiga_phi3_medium_m1_d2_awq_answers.jsonl │ ├── tasks_saiga_phi3_medium_sft_m1_d2_answers.jsonl │ ├── tasks_saiga_phi3_medium_sft_m1_d2_kto_m1_d2_answers.jsonl │ ├── tasks_saiga_phi3_medium_sft_m1_d2_kto_m1_d2_awq_4bit_answers.jsonl │ ├── tasks_saiga_phi3_medium_sft_m1_d2_kto_m5_d7_answers.jsonl │ ├── tasks_saiga_phi3_medium_sft_m2_d2_answers.jsonl │ ├── tasks_saiga_suzume_8b_answers.jsonl │ ├── tasks_saiga_tlite_8b_abliterated_sft_m1_d9_answers.jsonl │ ├── tasks_saiga_tlite_8b_abliterated_sft_m1_d9_kto_m1_d13_answers.jsonl │ ├── tasks_saiga_yi_9b_answers.jsonl │ ├── tasks_sfr_answers.jsonl │ ├── tasks_suzume_8b_answers.jsonl │ ├── tasks_suzume_orpo_borda_half_answers.jsonl │ ├── tasks_t_lite_abliterated_answers.jsonl │ ├── tasks_t_lite_answers.jsonl │ ├── tasks_vicuna_13b_v1_5_answers.jsonl │ ├── user_oriented_ru.jsonl │ ├── user_oriented_ru_v2.jsonl │ ├── user_rualpaca13b_answers.jsonl │ ├── user_rualpaca7b_answers.jsonl │ ├── user_saiga13b_answers.jsonl │ ├── user_saiga30b_answers.jsonl │ ├── user_saiga7b_answers.jsonl │ ├── user_v2_den4ik_fred_answers.jsonl │ ├── user_v2_den4ik_fred_new_answers.jsonl │ ├── user_v2_gigasaiga_answers.jsonl │ ├── user_v2_gigasaiga_v2_answers.jsonl │ ├── user_v2_gpt4_answers.jsonl │ ├── user_v2_saiga13b_answers.jsonl │ ├── user_v2_saiga13b_v2_answers.jsonl │ ├── user_v2_saiga2_13b_answers.jsonl │ ├── user_v2_saiga2_70b_answers.jsonl │ ├── user_v2_saiga2_70b_v2_answers.jsonl │ ├── user_v2_saiga2_7b_answers.jsonl │ ├── user_v2_saiga2_7b_fp16_answers.jsonl │ ├── user_v2_saiga2_7b_v2_answers.jsonl │ ├── user_v2_saiga30b_answers.jsonl │ ├── user_v2_saiga30b_v2_answers.jsonl │ ├── user_v2_saiga30b_v3_answers.jsonl │ ├── user_v2_saiga30bq4_1_answers.jsonl │ ├── user_v2_saiga65b_answers.jsonl │ ├── user_v2_saiga7b_fast_answers.jsonl │ ├── user_v2_saiga7b_v2_answers.jsonl │ ├── user_v2_saiga7b_v4_answers.jsonl │ ├── user_v2_saiga7b_v5_answers.jsonl │ ├── user_v2_turbo_answers.jsonl │ ├── user_v2_vicuna_13b_v1_5_answers.jsonl │ ├── vicuna_den4ik_fred_answers.jsonl │ ├── vicuna_den4ik_fred_new_answers.jsonl │ ├── vicuna_gigasaiga_answers.jsonl │ ├── vicuna_gigasaiga_v2_answers.jsonl │ ├── vicuna_gpt4_answers.jsonl │ ├── vicuna_question_ru.jsonl │ ├── vicuna_rualpaca13b_answers.jsonl │ ├── vicuna_rualpaca7b_answers.jsonl │ ├── vicuna_saiga13b_answers.jsonl │ ├── vicuna_saiga13b_v2_answers.jsonl │ ├── vicuna_saiga2_13b_answers.jsonl │ ├── vicuna_saiga2_70b_answers.jsonl │ ├── vicuna_saiga2_70b_v2_answers.jsonl │ ├── vicuna_saiga2_7b_answers.jsonl │ ├── vicuna_saiga2_7b_fp16_answers.jsonl │ ├── vicuna_saiga2_7b_v2_answers.jsonl │ ├── vicuna_saiga30b_answers.jsonl │ ├── vicuna_saiga30b_v2_answers.jsonl │ ├── vicuna_saiga30b_v3_answers.jsonl │ ├── vicuna_saiga30bq4_1_answers.jsonl │ ├── vicuna_saiga65b_answers.jsonl │ ├── vicuna_saiga7b_answers.jsonl │ ├── vicuna_saiga7b_fast_answer.jsonl │ ├── vicuna_saiga7b_v4_answers.jsonl │ ├── vicuna_saiga7b_v5_answers.jsonl │ ├── vicuna_turbo_answers.jsonl │ └── vicuna_vicuna_13b_v1_5_answers.jsonl ├── dataset_configs │ ├── pref_d1.json │ ├── pref_d2.json │ ├── sft_d1.json │ ├── sft_d2.json │ ├── sft_d3.json │ └── sft_d4.json ├── eval.sh ├── external_prompts │ ├── char_image_prompt.txt │ ├── custom_exec.txt │ ├── en_char.txt │ ├── en_char_chat.txt │ ├── en_char_topics.txt │ ├── ru_char.txt │ ├── ru_char_chat.txt │ ├── ru_char_topics.txt │ ├── ru_chat.txt │ ├── ru_exec.txt │ ├── ru_gen_settings.json │ ├── ru_instruct.txt │ ├── ru_sbs.txt │ ├── ru_wizard_breadth.txt │ ├── ru_wizard_depth.txt │ ├── ru_wizard_depth_methods.txt │ ├── ru_wizard_elimination.txt │ ├── ru_wizard_few_shot.txt │ ├── ru_wizard_json.txt │ └── ru_wizard_xml.txt ├── internal_prompts │ ├── chatml.json │ ├── gigasaiga.json │ ├── llama3.json │ ├── saiga_v2.json │ └── vicuna.json ├── models │ └── lid.176.bin ├── src │ ├── analyze_alpaca_eval.py │ ├── anthropic_wrapper.py │ ├── benchmarks │ │ ├── eval_lora_rsg.py │ │ ├── eval_zs_rsg.py │ │ └── eval_zs_tape.py │ ├── bot │ │ ├── calc_sbs_agreement.py │ │ ├── convert_to_db.py │ │ ├── get_markup.py │ │ ├── get_stat.py │ │ ├── merge.py │ │ ├── run.py │ │ └── run_sbs.py │ ├── data_processing │ │ ├── annotate_meta_claude.py │ │ ├── bad_substrings.py │ │ ├── clean_user_conversations.py │ │ ├── clean_wizard_instructions.py │ │ ├── compose_pref_dataset.py │ │ ├── compose_sft_dataset.py │ │ ├── convert_rsg.py │ │ ├── convert_to_char_card.py │ │ ├── create_chat_set.py │ │ ├── create_instruct_set.py │ │ ├── create_short_chat_set.py │ │ ├── embedder.py │ │ ├── exec_instructions.py │ │ ├── fetch_chat_seeds.py │ │ ├── fetch_new_multiturn_queries.py │ │ ├── fetch_new_queries.py │ │ ├── fetch_reward.py │ │ ├── fetch_slim.py │ │ ├── fetch_tagengo.py │ │ ├── fetch_wildchat.py │ │ ├── filter_claude.py │ │ ├── generate_char_chats.py │ │ ├── generate_char_image_prompts.py │ │ ├── generate_char_topics.py │ │ ├── generate_chars.py │ │ ├── generate_chat.py │ │ ├── generate_instructions.py │ │ ├── get_oasst_ru.py │ │ ├── get_oasst_ru_v2.py │ │ ├── improve_instructions.py │ │ ├── infer_kandinsky.py │ │ ├── lang_detector.py │ │ ├── postprocess_chat.py │ │ ├── process_annotations.py │ │ ├── to_parquet.py │ │ ├── to_preferences.py │ │ └── to_reward_dataset.py │ ├── dataset.py │ ├── infer_chatgpt.py │ ├── infer_fred.py │ ├── infer_llama3.py │ ├── infer_saiga.py │ ├── infer_saiga_llamacpp.py │ ├── infer_saiga_vllm.py │ ├── interact.py │ ├── interact_llama3_llamacpp.py │ ├── interact_llamacpp.py │ ├── interact_mistral_llamacpp.py │ ├── sbs │ │ ├── create_pairs.py │ │ ├── eval_gpt.py │ │ ├── pairs_config.json │ │ └── prompt.jinja │ ├── to_alpaca_eval.py │ ├── tools │ │ ├── convert_json2jsonl.py │ │ ├── convert_to_native.py │ │ ├── ingest.py │ │ └── merge_lora.py │ ├── train.py │ ├── train_kto.py │ ├── train_orpo.py │ ├── train_reward.py │ ├── train_unsloth.py │ └── util │ │ ├── chat.py │ │ ├── dl.py │ │ ├── generate.py │ │ ├── io.py │ │ ├── langdetect.py │ │ ├── load.py │ │ └── openai.py ├── tests │ └── test_fix_tokenizer.py └── tune_llama_7b.ipynb └── setup.py /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/.gitattributes -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/LICENSE -------------------------------------------------------------------------------- /NOTICE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/NOTICE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/README.md -------------------------------------------------------------------------------- /configs/gpt2_tiny_v1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/configs/gpt2_tiny_v1.json -------------------------------------------------------------------------------- /configs/gpt_neo_small_v1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/configs/gpt_neo_small_v1.json -------------------------------------------------------------------------------- /configs/gpt_neo_small_v2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/configs/gpt_neo_small_v2.json -------------------------------------------------------------------------------- /configs/gpt_neo_tiny_v1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/configs/gpt_neo_tiny_v1.json -------------------------------------------------------------------------------- /configs/gpt_neo_tiny_v2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/configs/gpt_neo_tiny_v2.json -------------------------------------------------------------------------------- /data_processing/calc_ngrams.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/calc_ngrams.py -------------------------------------------------------------------------------- /data_processing/clean_ficbook.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/clean_ficbook.py -------------------------------------------------------------------------------- /data_processing/convert_math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/convert_math.py -------------------------------------------------------------------------------- /data_processing/convert_mc4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/convert_mc4.py -------------------------------------------------------------------------------- /data_processing/convert_opensubtitles.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/convert_opensubtitles.py -------------------------------------------------------------------------------- /data_processing/convert_pikabu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/convert_pikabu.py -------------------------------------------------------------------------------- /data_processing/convert_wiki.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/convert_wiki.py -------------------------------------------------------------------------------- /data_processing/convert_yandex_q.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/convert_yandex_q.py -------------------------------------------------------------------------------- /data_processing/create_ficbook.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/create_ficbook.py -------------------------------------------------------------------------------- /data_processing/create_habr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/create_habr.py -------------------------------------------------------------------------------- /data_processing/create_librusec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/create_librusec.py -------------------------------------------------------------------------------- /data_processing/create_ru_news.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/create_ru_news.py -------------------------------------------------------------------------------- /data_processing/create_stackoverflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/create_stackoverflow.py -------------------------------------------------------------------------------- /data_processing/create_stihi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/create_stihi.py -------------------------------------------------------------------------------- /data_processing/exact_undup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/exact_undup.py -------------------------------------------------------------------------------- /data_processing/filter_with_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/filter_with_tokenizer.py -------------------------------------------------------------------------------- /data_processing/hf_to_instruct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/hf_to_instruct.py -------------------------------------------------------------------------------- /data_processing/lang_detector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/lang_detector.py -------------------------------------------------------------------------------- /data_processing/merge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/merge.py -------------------------------------------------------------------------------- /data_processing/parse_fb2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/parse_fb2.py -------------------------------------------------------------------------------- /data_processing/parse_zip_fb2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/parse_zip_fb2.py -------------------------------------------------------------------------------- /data_processing/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/requirements.txt -------------------------------------------------------------------------------- /data_processing/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/run.sh -------------------------------------------------------------------------------- /data_processing/save_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/save_hf.py -------------------------------------------------------------------------------- /data_processing/save_mc4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/save_mc4.py -------------------------------------------------------------------------------- /data_processing/split.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/split.py -------------------------------------------------------------------------------- /data_processing/undup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/undup.py -------------------------------------------------------------------------------- /data_processing/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/data_processing/util.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/requirements.txt -------------------------------------------------------------------------------- /resources/mc4_bad_hosts.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/resources/mc4_bad_hosts.txt -------------------------------------------------------------------------------- /resources/mc4_good_hosts.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/resources/mc4_good_hosts.txt -------------------------------------------------------------------------------- /resources/mc4_news_hosts.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/resources/mc4_news_hosts.txt -------------------------------------------------------------------------------- /resources/mc4_ru_bad_words.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/resources/mc4_ru_bad_words.txt -------------------------------------------------------------------------------- /rulm/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/rulm/generate.py -------------------------------------------------------------------------------- /rulm/jsonl_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/rulm/jsonl_loader.py -------------------------------------------------------------------------------- /rulm/preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/rulm/preprocess.py -------------------------------------------------------------------------------- /rulm/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/rulm/train.py -------------------------------------------------------------------------------- /rulm/train_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/rulm/train_tokenizer.py -------------------------------------------------------------------------------- /rulm/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/rulm/util.py -------------------------------------------------------------------------------- /self_instruct/.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/.gitattributes -------------------------------------------------------------------------------- /self_instruct/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/README.md -------------------------------------------------------------------------------- /self_instruct/configs/fred_deepspeed.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/fred_deepspeed.json -------------------------------------------------------------------------------- /self_instruct/configs/gigasaiga_13b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/gigasaiga_13b.json -------------------------------------------------------------------------------- /self_instruct/configs/llama2_13b_rsg.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama2_13b_rsg.json -------------------------------------------------------------------------------- /self_instruct/configs/llama2_13b_rsg_rcb.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama2_13b_rsg_rcb.json -------------------------------------------------------------------------------- /self_instruct/configs/llama2_13b_rsg_rucos.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama2_13b_rsg_rucos.json -------------------------------------------------------------------------------- /self_instruct/configs/llama2_13b_rsg_russe.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama2_13b_rsg_russe.json -------------------------------------------------------------------------------- /self_instruct/configs/llama2_13b_rsg_terra.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama2_13b_rsg_terra.json -------------------------------------------------------------------------------- /self_instruct/configs/llama_13b_lora.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama_13b_lora.json -------------------------------------------------------------------------------- /self_instruct/configs/llama_13b_rsg.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama_13b_rsg.json -------------------------------------------------------------------------------- /self_instruct/configs/llama_13b_rsg_rucos.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama_13b_rsg_rucos.json -------------------------------------------------------------------------------- /self_instruct/configs/llama_13b_rsg_russe.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama_13b_rsg_russe.json -------------------------------------------------------------------------------- /self_instruct/configs/llama_7b_lora.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/llama_7b_lora.json -------------------------------------------------------------------------------- /self_instruct/configs/mistral_7b_128k.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mistral_7b_128k.json -------------------------------------------------------------------------------- /self_instruct/configs/mistral_7b_rsg.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mistral_7b_rsg.json -------------------------------------------------------------------------------- /self_instruct/configs/mistral_7b_rsg_danetqa.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mistral_7b_rsg_danetqa.json -------------------------------------------------------------------------------- /self_instruct/configs/mistral_7b_rsg_parus.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mistral_7b_rsg_parus.json -------------------------------------------------------------------------------- /self_instruct/configs/mistral_7b_rsg_rucos.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mistral_7b_rsg_rucos.json -------------------------------------------------------------------------------- /self_instruct/configs/mistral_7b_rsg_russe.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mistral_7b_rsg_russe.json -------------------------------------------------------------------------------- /self_instruct/configs/mistral_7b_rsg_terra.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mistral_7b_rsg_terra.json -------------------------------------------------------------------------------- /self_instruct/configs/mpt_30b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mpt_30b.json -------------------------------------------------------------------------------- /self_instruct/configs/mpt_7b_8k.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mpt_7b_8k.json -------------------------------------------------------------------------------- /self_instruct/configs/mpt_7b_storywriter.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mpt_7b_storywriter.json -------------------------------------------------------------------------------- /self_instruct/configs/mt0_large_deepspeed.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mt0_large_deepspeed.json -------------------------------------------------------------------------------- /self_instruct/configs/mt0_xl_lora.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mt0_xl_lora.json -------------------------------------------------------------------------------- /self_instruct/configs/mt0_xxl_deepspeed.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mt0_xxl_deepspeed.json -------------------------------------------------------------------------------- /self_instruct/configs/mt0_xxl_mt_lora.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/mt0_xxl_mt_lora.json -------------------------------------------------------------------------------- /self_instruct/configs/rugpt_large_plain.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/rugpt_large_plain.json -------------------------------------------------------------------------------- /self_instruct/configs/rugpt_medium_plain.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/rugpt_medium_plain.json -------------------------------------------------------------------------------- /self_instruct/configs/rut5_base_plain.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/rut5_base_plain.json -------------------------------------------------------------------------------- /self_instruct/configs/rut5_large_plain.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/rut5_large_plain.json -------------------------------------------------------------------------------- /self_instruct/configs/saicuna_13b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saicuna_13b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga2_13b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga2_13b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga2_70b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga2_70b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga2_7b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga2_7b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_13b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_13b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_13b_rsg.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_13b_rsg.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_13b_rsg_parus.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_13b_rsg_parus.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_13b_rsg_rucos.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_13b_rsg_rucos.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_13b_rsg_russe.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_13b_rsg_russe.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_13b_rsg_rwsd.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_13b_rsg_rwsd.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_30b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_30b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_30b_4bit.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_30b_4bit.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_65b_4bit.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_65b_4bit.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_7b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_7b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_aya23_8b_m1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_aya23_8b_m1.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_kto.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_kto.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_llama3_8b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_llama3_8b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_llama3_8b_galore.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_llama3_8b_galore.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_llama3_8b_lm_head.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_llama3_8b_lm_head.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_llama3_8b_m1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_llama3_8b_m1.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_llama3_8b_m2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_llama3_8b_m2.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_llama3_8b_m3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_llama3_8b_m3.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_llama3_8b_sfr.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_llama3_8b_sfr.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_mistral_7b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_mistral_7b.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_orpo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_orpo.json -------------------------------------------------------------------------------- /self_instruct/configs/saiga_reward.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/saiga_reward.json -------------------------------------------------------------------------------- /self_instruct/configs/xglm_3B_deepspeed.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/configs/xglm_3B_deepspeed.json -------------------------------------------------------------------------------- /self_instruct/crowd/aggregate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/crowd/aggregate.py -------------------------------------------------------------------------------- /self_instruct/crowd/examples/honey.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/crowd/examples/honey.jsonl -------------------------------------------------------------------------------- /self_instruct/crowd/examples/training.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/crowd/examples/training.json -------------------------------------------------------------------------------- /self_instruct/crowd/pool_settings.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/crowd/pool_settings.json -------------------------------------------------------------------------------- /self_instruct/crowd/settings.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/crowd/settings.json -------------------------------------------------------------------------------- /self_instruct/crowd/upload.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/crowd/upload.py -------------------------------------------------------------------------------- /self_instruct/data/.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/.gitattributes -------------------------------------------------------------------------------- /self_instruct/data/en_chargen_seed.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/en_chargen_seed.jsonl -------------------------------------------------------------------------------- /self_instruct/data/gpt4_evals/saiga_vs_vicuna.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/gpt4_evals/saiga_vs_vicuna.jsonl -------------------------------------------------------------------------------- /self_instruct/data/lmsys_clean_ru_queries_chatgpt_3_5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/lmsys_clean_ru_queries_chatgpt_3_5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/lmsys_clean_ru_queries_chatgpt_4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/lmsys_clean_ru_queries_chatgpt_4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/lmsys_clean_ru_queries_llama_3_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/lmsys_clean_ru_queries_llama_3_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/lmsys_clean_ru_queries_saiga_llama3_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/lmsys_clean_ru_queries_saiga_llama3_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/lmsys_clean_ru_queries_suzume_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/lmsys_clean_ru_queries_suzume_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/output.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/output.json -------------------------------------------------------------------------------- /self_instruct/data/preferences_prompts.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/preferences_prompts.jsonl -------------------------------------------------------------------------------- /self_instruct/data/preferences_prompts_gemma2_9b_it_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/preferences_prompts_gemma2_9b_it_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/preferences_prompts_gpt4_4o_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/preferences_prompts_gpt4_4o_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/preferences_prompts_saiga_gemma2_9b_sft_m2_d8_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/preferences_prompts_saiga_gemma2_9b_sft_m2_d8_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/preferences_prompts_saiga_llama3_8b_v6_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/preferences_prompts_saiga_llama3_8b_v6_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/preferences_prompts_saiga_phi3_medium_sft_m1_d2_awq_4bit_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/preferences_prompts_saiga_phi3_medium_sft_m1_d2_awq_4bit_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/ru_alpaca_seed_tasks.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/ru_alpaca_seed_tasks.jsonl -------------------------------------------------------------------------------- /self_instruct/data/ru_chargen_seed.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/ru_chargen_seed.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts_aya_23_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts_aya_23_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts_chatgpt_3_5_turbo_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts_chatgpt_3_5_turbo_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts_gpt4_4o_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts_gpt4_4o_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts_llama3_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts_llama3_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts_saiga_llama3_8b_v4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts_saiga_llama3_8b_v4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts_saiga_llama3_8b_v5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts_saiga_llama3_8b_v5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/saiga_bot_user_multiturn_prompts_sfr_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/saiga_bot_user_multiturn_prompts_sfr_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_aya_23_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_aya_23_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_chatgpt_3_5_turbo_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_chatgpt_3_5_turbo_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_chatgpt_4_turbo_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_chatgpt_4_turbo_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_gemma_2_9b_it_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_gemma_2_9b_it_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_gemma_2_9b_it_abliterated_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_gemma_2_9b_it_abliterated_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_gemma_2_9b_it_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_gemma_2_9b_it_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_llama3_70b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_llama3_70b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_llama3_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_llama3_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saicuna_13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saicuna_13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga2_13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga2_13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga2_7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga2_7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_aya_23_35b_sft_m1_d5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_aya_23_35b_sft_m1_d5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_aya_23_35b_sft_m1_d5_awq_4bit_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_aya_23_35b_sft_m1_d5_awq_4bit_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d10_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d10_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d11_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d11_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d12_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d12_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d9_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_abliterated_kto_m1_d9_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m2_d9_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_kto_m1_d13_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_kto_m1_d13_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_kto_m2_d13_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_abliterated_sft_m3_d9_abliterated_kto_m2_d13_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_sft_m1_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_sft_m1_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_gemma2_9b_sft_m2_d8_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_gemma2_9b_sft_m2_d8_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_kto_v4_answers.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_kto_v4_answers.json -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_kto_v4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_kto_v4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_kto_v5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_kto_v5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_awq_4bit_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_awq_4bit_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_gptq_3bit_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_gptq_3bit_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_gptq_4bit_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_gptq_4bit_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_kto_m1_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_kto_m1_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_kto_m1_d2_awq_4bit_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_abliterated_kto_m1_d2_awq_4bit_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_70b_sft_m1_d5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_abliterated_sft_m11_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_abliterated_sft_m11_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_abliterated_sft_m11_d7_kto_m7_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_abliterated_sft_m11_d7_kto_m7_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_kto_m1_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_kto_m1_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_m1_d1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_m1_d1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m10_d1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m10_d1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m10_d1_kto_m2_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m10_d1_kto_m2_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m3_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m3_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d3_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d3_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m5_d4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m6_d5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m6_d5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m6_d6_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_abliterated_kto_m6_d6_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_dpo_m1_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_dpo_m1_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_dpo_m2_d8_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_dpo_m2_d8_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_kto_m5_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_kto_m5_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_kto_m7_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_abliterated_kto_m7_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m11_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m12_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m12_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m13_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m13_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m14_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m14_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m3_d4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m3_d4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m5_d1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m5_d1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m5_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m5_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m6_d1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m6_d1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m7_d1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m7_d1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m8_d1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m8_d1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_sft_m9_d1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_sft_m9_d1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_slim_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_slim_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_v4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_v4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_llama3_8b_v5_vllm_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_llama3_8b_v5_vllm_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_mistral_7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_mistral_7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_phi3_medium_m1_d2_awq_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_phi3_medium_m1_d2_awq_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_kto_m1_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_kto_m1_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_kto_m1_d2_awq_4bit_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_kto_m1_d2_awq_4bit_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_kto_m5_d7_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_phi3_medium_sft_m1_d2_kto_m5_d7_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_phi3_medium_sft_m2_d2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_phi3_medium_sft_m2_d2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_suzume_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_suzume_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_tlite_8b_abliterated_sft_m1_d9_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_tlite_8b_abliterated_sft_m1_d9_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_tlite_8b_abliterated_sft_m1_d9_kto_m1_d13_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_tlite_8b_abliterated_sft_m1_d9_kto_m1_d13_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_saiga_yi_9b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_saiga_yi_9b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_sfr_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_sfr_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_suzume_8b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_suzume_8b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_suzume_orpo_borda_half_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_suzume_orpo_borda_half_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_t_lite_abliterated_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_t_lite_abliterated_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_t_lite_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_t_lite_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/tasks_vicuna_13b_v1_5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/tasks_vicuna_13b_v1_5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_oriented_ru.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_oriented_ru.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_oriented_ru_v2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_oriented_ru_v2.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_rualpaca13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_rualpaca13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_rualpaca7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_rualpaca7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_saiga13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_saiga13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_saiga30b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_saiga30b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_saiga7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_saiga7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_den4ik_fred_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_den4ik_fred_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_den4ik_fred_new_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_den4ik_fred_new_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_gigasaiga_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_gigasaiga_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_gigasaiga_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_gigasaiga_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_gpt4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_gpt4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga13b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga13b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga2_13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga2_13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga2_70b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga2_70b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga2_70b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga2_70b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga2_7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga2_7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga2_7b_fp16_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga2_7b_fp16_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga2_7b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga2_7b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga30b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga30b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga30b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga30b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga30b_v3_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga30b_v3_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga30bq4_1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga30bq4_1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga65b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga65b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga7b_fast_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga7b_fast_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga7b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga7b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga7b_v4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga7b_v4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_saiga7b_v5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_saiga7b_v5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_turbo_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_turbo_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/user_v2_vicuna_13b_v1_5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/user_v2_vicuna_13b_v1_5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_den4ik_fred_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_den4ik_fred_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_den4ik_fred_new_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_den4ik_fred_new_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_gigasaiga_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_gigasaiga_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_gigasaiga_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_gigasaiga_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_gpt4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_gpt4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_question_ru.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_question_ru.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_rualpaca13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_rualpaca13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_rualpaca7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_rualpaca7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga13b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga13b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga2_13b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga2_13b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga2_70b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga2_70b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga2_70b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga2_70b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga2_7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga2_7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga2_7b_fp16_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga2_7b_fp16_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga2_7b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga2_7b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga30b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga30b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga30b_v2_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga30b_v2_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga30b_v3_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga30b_v3_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga30bq4_1_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga30bq4_1_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga65b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga65b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga7b_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga7b_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga7b_fast_answer.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga7b_fast_answer.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga7b_v4_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga7b_v4_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_saiga7b_v5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_saiga7b_v5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_turbo_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_turbo_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/data/vicuna_vicuna_13b_v1_5_answers.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/data/vicuna_vicuna_13b_v1_5_answers.jsonl -------------------------------------------------------------------------------- /self_instruct/dataset_configs/pref_d1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/dataset_configs/pref_d1.json -------------------------------------------------------------------------------- /self_instruct/dataset_configs/pref_d2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/dataset_configs/pref_d2.json -------------------------------------------------------------------------------- /self_instruct/dataset_configs/sft_d1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/dataset_configs/sft_d1.json -------------------------------------------------------------------------------- /self_instruct/dataset_configs/sft_d2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/dataset_configs/sft_d2.json -------------------------------------------------------------------------------- /self_instruct/dataset_configs/sft_d3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/dataset_configs/sft_d3.json -------------------------------------------------------------------------------- /self_instruct/dataset_configs/sft_d4.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/dataset_configs/sft_d4.json -------------------------------------------------------------------------------- /self_instruct/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/eval.sh -------------------------------------------------------------------------------- /self_instruct/external_prompts/char_image_prompt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/char_image_prompt.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/custom_exec.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/custom_exec.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/en_char.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/en_char.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/en_char_chat.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/en_char_chat.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/en_char_topics.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/en_char_topics.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_char.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_char.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_char_chat.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_char_chat.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_char_topics.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_char_topics.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_chat.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_chat.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_exec.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_exec.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_gen_settings.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_gen_settings.json -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_instruct.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_instruct.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_sbs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_sbs.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_wizard_breadth.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_wizard_breadth.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_wizard_depth.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_wizard_depth.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_wizard_depth_methods.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_wizard_depth_methods.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_wizard_elimination.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_wizard_elimination.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_wizard_few_shot.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_wizard_few_shot.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_wizard_json.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_wizard_json.txt -------------------------------------------------------------------------------- /self_instruct/external_prompts/ru_wizard_xml.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/external_prompts/ru_wizard_xml.txt -------------------------------------------------------------------------------- /self_instruct/internal_prompts/chatml.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/internal_prompts/chatml.json -------------------------------------------------------------------------------- /self_instruct/internal_prompts/gigasaiga.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/internal_prompts/gigasaiga.json -------------------------------------------------------------------------------- /self_instruct/internal_prompts/llama3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/internal_prompts/llama3.json -------------------------------------------------------------------------------- /self_instruct/internal_prompts/saiga_v2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/internal_prompts/saiga_v2.json -------------------------------------------------------------------------------- /self_instruct/internal_prompts/vicuna.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/internal_prompts/vicuna.json -------------------------------------------------------------------------------- /self_instruct/models/lid.176.bin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/models/lid.176.bin -------------------------------------------------------------------------------- /self_instruct/src/analyze_alpaca_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/analyze_alpaca_eval.py -------------------------------------------------------------------------------- /self_instruct/src/anthropic_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/anthropic_wrapper.py -------------------------------------------------------------------------------- /self_instruct/src/benchmarks/eval_lora_rsg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/benchmarks/eval_lora_rsg.py -------------------------------------------------------------------------------- /self_instruct/src/benchmarks/eval_zs_rsg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/benchmarks/eval_zs_rsg.py -------------------------------------------------------------------------------- /self_instruct/src/benchmarks/eval_zs_tape.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/benchmarks/eval_zs_tape.py -------------------------------------------------------------------------------- /self_instruct/src/bot/calc_sbs_agreement.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/bot/calc_sbs_agreement.py -------------------------------------------------------------------------------- /self_instruct/src/bot/convert_to_db.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/bot/convert_to_db.py -------------------------------------------------------------------------------- /self_instruct/src/bot/get_markup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/bot/get_markup.py -------------------------------------------------------------------------------- /self_instruct/src/bot/get_stat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/bot/get_stat.py -------------------------------------------------------------------------------- /self_instruct/src/bot/merge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/bot/merge.py -------------------------------------------------------------------------------- /self_instruct/src/bot/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/bot/run.py -------------------------------------------------------------------------------- /self_instruct/src/bot/run_sbs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/bot/run_sbs.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/annotate_meta_claude.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/annotate_meta_claude.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/bad_substrings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/bad_substrings.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/clean_user_conversations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/clean_user_conversations.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/clean_wizard_instructions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/clean_wizard_instructions.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/compose_pref_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/compose_pref_dataset.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/compose_sft_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/compose_sft_dataset.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/convert_rsg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/convert_rsg.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/convert_to_char_card.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/convert_to_char_card.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/create_chat_set.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/create_chat_set.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/create_instruct_set.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/create_instruct_set.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/create_short_chat_set.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/create_short_chat_set.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/embedder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/embedder.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/exec_instructions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/exec_instructions.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/fetch_chat_seeds.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/fetch_chat_seeds.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/fetch_new_multiturn_queries.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/fetch_new_multiturn_queries.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/fetch_new_queries.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/fetch_new_queries.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/fetch_reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/fetch_reward.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/fetch_slim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/fetch_slim.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/fetch_tagengo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/fetch_tagengo.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/fetch_wildchat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/fetch_wildchat.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/filter_claude.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/filter_claude.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/generate_char_chats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/generate_char_chats.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/generate_char_image_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/generate_char_image_prompts.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/generate_char_topics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/generate_char_topics.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/generate_chars.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/generate_chars.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/generate_chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/generate_chat.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/generate_instructions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/generate_instructions.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/get_oasst_ru.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/get_oasst_ru.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/get_oasst_ru_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/get_oasst_ru_v2.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/improve_instructions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/improve_instructions.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/infer_kandinsky.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/infer_kandinsky.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/lang_detector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/lang_detector.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/postprocess_chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/postprocess_chat.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/process_annotations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/process_annotations.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/to_parquet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/to_parquet.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/to_preferences.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/to_preferences.py -------------------------------------------------------------------------------- /self_instruct/src/data_processing/to_reward_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/data_processing/to_reward_dataset.py -------------------------------------------------------------------------------- /self_instruct/src/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/dataset.py -------------------------------------------------------------------------------- /self_instruct/src/infer_chatgpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/infer_chatgpt.py -------------------------------------------------------------------------------- /self_instruct/src/infer_fred.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/infer_fred.py -------------------------------------------------------------------------------- /self_instruct/src/infer_llama3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/infer_llama3.py -------------------------------------------------------------------------------- /self_instruct/src/infer_saiga.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/infer_saiga.py -------------------------------------------------------------------------------- /self_instruct/src/infer_saiga_llamacpp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/infer_saiga_llamacpp.py -------------------------------------------------------------------------------- /self_instruct/src/infer_saiga_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/infer_saiga_vllm.py -------------------------------------------------------------------------------- /self_instruct/src/interact.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/interact.py -------------------------------------------------------------------------------- /self_instruct/src/interact_llama3_llamacpp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/interact_llama3_llamacpp.py -------------------------------------------------------------------------------- /self_instruct/src/interact_llamacpp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/interact_llamacpp.py -------------------------------------------------------------------------------- /self_instruct/src/interact_mistral_llamacpp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/interact_mistral_llamacpp.py -------------------------------------------------------------------------------- /self_instruct/src/sbs/create_pairs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/sbs/create_pairs.py -------------------------------------------------------------------------------- /self_instruct/src/sbs/eval_gpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/sbs/eval_gpt.py -------------------------------------------------------------------------------- /self_instruct/src/sbs/pairs_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/sbs/pairs_config.json -------------------------------------------------------------------------------- /self_instruct/src/sbs/prompt.jinja: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/sbs/prompt.jinja -------------------------------------------------------------------------------- /self_instruct/src/to_alpaca_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/to_alpaca_eval.py -------------------------------------------------------------------------------- /self_instruct/src/tools/convert_json2jsonl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/tools/convert_json2jsonl.py -------------------------------------------------------------------------------- /self_instruct/src/tools/convert_to_native.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/tools/convert_to_native.py -------------------------------------------------------------------------------- /self_instruct/src/tools/ingest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/tools/ingest.py -------------------------------------------------------------------------------- /self_instruct/src/tools/merge_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/tools/merge_lora.py -------------------------------------------------------------------------------- /self_instruct/src/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/train.py -------------------------------------------------------------------------------- /self_instruct/src/train_kto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/train_kto.py -------------------------------------------------------------------------------- /self_instruct/src/train_orpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/train_orpo.py -------------------------------------------------------------------------------- /self_instruct/src/train_reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/train_reward.py -------------------------------------------------------------------------------- /self_instruct/src/train_unsloth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/train_unsloth.py -------------------------------------------------------------------------------- /self_instruct/src/util/chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/util/chat.py -------------------------------------------------------------------------------- /self_instruct/src/util/dl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/util/dl.py -------------------------------------------------------------------------------- /self_instruct/src/util/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/util/generate.py -------------------------------------------------------------------------------- /self_instruct/src/util/io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/util/io.py -------------------------------------------------------------------------------- /self_instruct/src/util/langdetect.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/util/langdetect.py -------------------------------------------------------------------------------- /self_instruct/src/util/load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/util/load.py -------------------------------------------------------------------------------- /self_instruct/src/util/openai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/src/util/openai.py -------------------------------------------------------------------------------- /self_instruct/tests/test_fix_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/tests/test_fix_tokenizer.py -------------------------------------------------------------------------------- /self_instruct/tune_llama_7b.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/self_instruct/tune_llama_7b.ipynb -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IlyaGusev/rulm/HEAD/setup.py --------------------------------------------------------------------------------