├── .github └── ISSUE_TEMPLATE │ ├── bug_report.yml │ ├── config.yml │ ├── feature_request.yml │ └── study_feedback.yml ├── .gitignore ├── README.md ├── code ├── C11 │ ├── 03_peft_pythia-2.8b.ipynb │ ├── 04_dataset_gen.ipynb │ ├── 04_qwen2.5_qlora.ipynb │ ├── 04_qwen2.5_test.ipynb │ └── data │ │ ├── blackwukong.md │ │ ├── wukong_base_20251109_201117.jsonl │ │ └── wukong_dataset_20251109_215706.jsonl ├── C14 │ ├── 01_main.py │ ├── 01_test.py │ └── ner_deployment │ │ ├── Dockerfile │ │ ├── checkpoints │ │ └── config.json │ │ ├── data │ │ ├── categories.json │ │ └── vocabulary.json │ │ ├── docker-compose.yml │ │ ├── main.py │ │ ├── predict.py │ │ ├── pyproject.toml │ │ └── src │ │ ├── __init__.py │ │ ├── tokenizer │ │ ├── __init__.py │ │ ├── base.py │ │ ├── char_tokenizer.py │ │ └── vocabulary.py │ │ └── utils │ │ ├── __init__.py │ │ └── file_io.py ├── C2 │ ├── 01_jieba.py │ ├── 04_gensim.ipynb │ ├── user_dict.txt │ └── user_pos_dict.txt ├── C3 │ ├── 01_RNN.py │ └── 02_LSTM.py ├── C4 │ ├── 01_Seq2Seq.py │ ├── 02_attention.py │ └── 03_Self-Attention.py ├── C5 │ ├── 01_bert_usage.py │ ├── 02_gpt_usage.py │ ├── 03_bucket_id.py │ ├── 03_t5_usage.py │ ├── 04_hf_usage.ipynb │ └── cat.jpg ├── C6 │ ├── MoE │ │ ├── main.py │ │ └── src │ │ │ ├── __init__.py │ │ │ ├── attention.py │ │ │ ├── ffn.py │ │ │ ├── norm.py │ │ │ ├── rope.py │ │ │ └── transformer.py │ └── llama2 │ │ ├── main.py │ │ └── src │ │ ├── __init__.py │ │ ├── attention.py │ │ ├── ffn.py │ │ ├── norm.py │ │ ├── rope.py │ │ └── transformer.py ├── C7 │ ├── 01_text_classification.ipynb │ ├── 02_lstm_text_classification.ipynb │ └── 03_bert_text_classification.ipynb └── C8 │ ├── 01_build_category.py │ ├── 02_build_vocabulary.py │ ├── 03_data_loader.py │ ├── 04_model.py │ ├── 05_train.py │ ├── 06_predict.py │ ├── data │ ├── CMeEE-V2_dev.json │ ├── CMeEE-V2_train.json │ ├── categories.json │ └── vocabulary.json │ └── src │ ├── configs │ ├── __init__.py │ └── configs.py │ ├── data │ ├── __init__.py │ ├── data_loader.py │ └── dataset.py │ ├── loss │ ├── __init__.py │ └── ner_loss.py │ ├── metrics │ ├── __init__.py │ └── entity_metrics.py │ ├── models │ ├── __init__.py │ ├── base.py │ └── ner_model.py │ ├── tokenizer │ ├── __init__.py │ ├── base.py │ ├── char_tokenizer.py │ └── vocabulary.py │ ├── trainer │ ├── __init__.py │ └── trainer.py │ └── utils │ ├── __init__.py │ ├── early_stop.py │ ├── file_io.py │ └── logger.py ├── docs ├── .nojekyll ├── README.md ├── _sidebar.md ├── chapter1 │ ├── 01_nlp_intro.md │ └── images │ │ └── 1_1_1.gif ├── chapter11 │ ├── 01_PEFT.md │ ├── 02_lora.md │ ├── 03_peft_lora.md │ ├── 04_qwen2.5_qlora.md │ └── images │ │ ├── 11_1_1.png │ │ ├── 11_1_2.png │ │ ├── 11_1_3.png │ │ ├── 11_1_4.png │ │ ├── 11_1_5.png │ │ ├── 11_1_6.png │ │ ├── 11_2_1.svg │ │ ├── 11_2_2.png │ │ ├── 11_2_3.png │ │ ├── 11_2_4.png │ │ ├── 11_3_1.png │ │ ├── 11_4_1.png │ │ └── 11_4_2.svg ├── chapter12 │ ├── 01_RLHF.md │ ├── 02_llama_factory.md │ └── images │ │ ├── 12_1_1.png │ │ ├── 12_1_2.png │ │ ├── 12_1_3.png │ │ ├── 12_1_4.png │ │ ├── 12_1_5.png │ │ ├── 12_1_6.png │ │ ├── 12_1_7.png │ │ ├── 12_1_8.png │ │ ├── 12_2_1.png │ │ ├── 12_2_10.png │ │ ├── 12_2_11.png │ │ ├── 12_2_2.png │ │ ├── 12_2_3.png │ │ ├── 12_2_4.png │ │ ├── 12_2_5.png │ │ ├── 12_2_6.png │ │ ├── 12_2_7.png │ │ ├── 12_2_8.png │ │ └── 12_2_9.png ├── chapter14 │ ├── 01_fastapi.md │ ├── 02_uv_linux.md │ ├── 03_docker_deploy.md │ └── images │ │ ├── 14_1_1.png │ │ ├── 14_1_2.png │ │ ├── 14_1_3.png │ │ ├── 14_2_1.png │ │ ├── 14_2_10.png │ │ ├── 14_2_11.png │ │ ├── 14_2_12.png │ │ ├── 14_2_2.png │ │ ├── 14_2_3.png │ │ ├── 14_2_4.png │ │ ├── 14_2_5.png │ │ ├── 14_2_6.png │ │ ├── 14_2_7.png │ │ ├── 14_2_8.png │ │ ├── 14_2_9.png │ │ ├── 14_3_1.png │ │ ├── 14_3_2.png │ │ ├── 14_3_3.png │ │ ├── 14_3_4.png │ │ ├── 14_3_5.png │ │ ├── 14_3_6.png │ │ ├── 14_3_7.png │ │ ├── 14_3_8.png │ │ └── 14_3_9.png ├── chapter16 │ ├── 01_LLM_safety_overview.md │ ├── 02_threat_modeling_analysis.md │ └── images │ │ ├── 16_1_1.png │ │ ├── 16_1_2.png │ │ ├── 16_1_3.png │ │ └── 16_1_4.png ├── chapter2 │ ├── 03_tokenization.md │ ├── 04_word_vector.md │ ├── 05_Word2Vec.md │ ├── 06_gensim.md │ └── images │ │ ├── 2_1_1.svg │ │ ├── 2_3_1.gif │ │ └── 2_3_2.svg ├── chapter3 │ ├── 08_RNN.md │ ├── 09_LSTM&GRU.md │ └── images │ │ ├── 3_1_1.svg │ │ ├── 3_2_1.svg │ │ └── 3_2_2.svg ├── chapter4 │ ├── 10_seq2seq.md │ ├── 11_attention.md │ ├── 12_transformer.md │ └── images │ │ ├── 4_1_1.svg │ │ ├── 4_2_1.svg │ │ └── 4_3_1.svg ├── chapter5 │ ├── 13_Bert.md │ ├── 14_GPT.md │ ├── 15_T5.md │ ├── 16_HuggingFace.md │ └── images │ │ ├── 5_1_1.png │ │ ├── 5_1_2.svg │ │ ├── 5_1_3.svg │ │ ├── 5_2_1.png │ │ ├── 5_3_1.png │ │ ├── 5_3_2.png │ │ └── 5_4_1.png ├── chapter6 │ ├── 17_handcraft_llama2.md │ ├── 18_MoE.md │ └── images │ │ ├── 6_1_1.svg │ │ ├── 6_1_2.png │ │ ├── 6_2_1.png │ │ ├── 6_2_10.png │ │ ├── 6_2_11.png │ │ ├── 6_2_12.png │ │ ├── 6_2_13.svg │ │ ├── 6_2_2.png │ │ ├── 6_2_3.png │ │ ├── 6_2_4.png │ │ ├── 6_2_5.png │ │ ├── 6_2_6.png │ │ ├── 6_2_7.png │ │ ├── 6_2_8.png │ │ └── 6_2_9.png ├── chapter7 │ ├── 01_text_classification.md │ ├── 02_lstm_text_classification.md │ ├── 03_bert_text_classification.md │ └── images │ │ ├── 7_1_1.png │ │ ├── 7_1_2.png │ │ ├── 7_1_3.png │ │ ├── 7_2_1.png │ │ ├── 7_2_2.png │ │ └── 7_3_1.png ├── chapter8 │ ├── 01_named_entity_recognition.md │ ├── 02_data_processing.md │ ├── 03_model_building_and_training.md │ ├── 04_evaluation_and_prediction.md │ └── images │ │ ├── 8_2_1.png │ │ ├── 8_2_2.png │ │ └── 8_3_1.png ├── index.html ├── logo.svg └── 约定.md └── logo.svg /.github/ISSUE_TEMPLATE/bug_report.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/.github/ISSUE_TEMPLATE/bug_report.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/config.yml: -------------------------------------------------------------------------------- 1 | blank_issues_enabled: false 2 | 3 | 4 | -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/feature_request.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/.github/ISSUE_TEMPLATE/feature_request.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/study_feedback.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/.github/ISSUE_TEMPLATE/study_feedback.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/README.md -------------------------------------------------------------------------------- /code/C11/03_peft_pythia-2.8b.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C11/03_peft_pythia-2.8b.ipynb -------------------------------------------------------------------------------- /code/C11/04_dataset_gen.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C11/04_dataset_gen.ipynb -------------------------------------------------------------------------------- /code/C11/04_qwen2.5_qlora.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C11/04_qwen2.5_qlora.ipynb -------------------------------------------------------------------------------- /code/C11/04_qwen2.5_test.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C11/04_qwen2.5_test.ipynb -------------------------------------------------------------------------------- /code/C11/data/blackwukong.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C11/data/blackwukong.md -------------------------------------------------------------------------------- /code/C11/data/wukong_base_20251109_201117.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C11/data/wukong_base_20251109_201117.jsonl -------------------------------------------------------------------------------- /code/C11/data/wukong_dataset_20251109_215706.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C11/data/wukong_dataset_20251109_215706.jsonl -------------------------------------------------------------------------------- /code/C14/01_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/01_main.py -------------------------------------------------------------------------------- /code/C14/01_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/01_test.py -------------------------------------------------------------------------------- /code/C14/ner_deployment/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/Dockerfile -------------------------------------------------------------------------------- /code/C14/ner_deployment/checkpoints/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/checkpoints/config.json -------------------------------------------------------------------------------- /code/C14/ner_deployment/data/categories.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/data/categories.json -------------------------------------------------------------------------------- /code/C14/ner_deployment/data/vocabulary.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/data/vocabulary.json -------------------------------------------------------------------------------- /code/C14/ner_deployment/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/docker-compose.yml -------------------------------------------------------------------------------- /code/C14/ner_deployment/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/main.py -------------------------------------------------------------------------------- /code/C14/ner_deployment/predict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/predict.py -------------------------------------------------------------------------------- /code/C14/ner_deployment/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/pyproject.toml -------------------------------------------------------------------------------- /code/C14/ner_deployment/src/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C14/ner_deployment/src/tokenizer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C14/ner_deployment/src/tokenizer/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/src/tokenizer/base.py -------------------------------------------------------------------------------- /code/C14/ner_deployment/src/tokenizer/char_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/src/tokenizer/char_tokenizer.py -------------------------------------------------------------------------------- /code/C14/ner_deployment/src/tokenizer/vocabulary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/src/tokenizer/vocabulary.py -------------------------------------------------------------------------------- /code/C14/ner_deployment/src/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C14/ner_deployment/src/utils/file_io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C14/ner_deployment/src/utils/file_io.py -------------------------------------------------------------------------------- /code/C2/01_jieba.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C2/01_jieba.py -------------------------------------------------------------------------------- /code/C2/04_gensim.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C2/04_gensim.ipynb -------------------------------------------------------------------------------- /code/C2/user_dict.txt: -------------------------------------------------------------------------------- 1 | 九头虫 2 | 奔波儿灞 -------------------------------------------------------------------------------- /code/C2/user_pos_dict.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C2/user_pos_dict.txt -------------------------------------------------------------------------------- /code/C3/01_RNN.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C3/01_RNN.py -------------------------------------------------------------------------------- /code/C3/02_LSTM.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C3/02_LSTM.py -------------------------------------------------------------------------------- /code/C4/01_Seq2Seq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C4/01_Seq2Seq.py -------------------------------------------------------------------------------- /code/C4/02_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C4/02_attention.py -------------------------------------------------------------------------------- /code/C4/03_Self-Attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C4/03_Self-Attention.py -------------------------------------------------------------------------------- /code/C5/01_bert_usage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C5/01_bert_usage.py -------------------------------------------------------------------------------- /code/C5/02_gpt_usage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C5/02_gpt_usage.py -------------------------------------------------------------------------------- /code/C5/03_bucket_id.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C5/03_bucket_id.py -------------------------------------------------------------------------------- /code/C5/03_t5_usage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C5/03_t5_usage.py -------------------------------------------------------------------------------- /code/C5/04_hf_usage.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C5/04_hf_usage.ipynb -------------------------------------------------------------------------------- /code/C5/cat.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C5/cat.jpg -------------------------------------------------------------------------------- /code/C6/MoE/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/MoE/main.py -------------------------------------------------------------------------------- /code/C6/MoE/src/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/MoE/src/__init__.py -------------------------------------------------------------------------------- /code/C6/MoE/src/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/MoE/src/attention.py -------------------------------------------------------------------------------- /code/C6/MoE/src/ffn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/MoE/src/ffn.py -------------------------------------------------------------------------------- /code/C6/MoE/src/norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/MoE/src/norm.py -------------------------------------------------------------------------------- /code/C6/MoE/src/rope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/MoE/src/rope.py -------------------------------------------------------------------------------- /code/C6/MoE/src/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/MoE/src/transformer.py -------------------------------------------------------------------------------- /code/C6/llama2/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/llama2/main.py -------------------------------------------------------------------------------- /code/C6/llama2/src/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/llama2/src/__init__.py -------------------------------------------------------------------------------- /code/C6/llama2/src/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/llama2/src/attention.py -------------------------------------------------------------------------------- /code/C6/llama2/src/ffn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/llama2/src/ffn.py -------------------------------------------------------------------------------- /code/C6/llama2/src/norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/llama2/src/norm.py -------------------------------------------------------------------------------- /code/C6/llama2/src/rope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/llama2/src/rope.py -------------------------------------------------------------------------------- /code/C6/llama2/src/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C6/llama2/src/transformer.py -------------------------------------------------------------------------------- /code/C7/01_text_classification.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C7/01_text_classification.ipynb -------------------------------------------------------------------------------- /code/C7/02_lstm_text_classification.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C7/02_lstm_text_classification.ipynb -------------------------------------------------------------------------------- /code/C7/03_bert_text_classification.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C7/03_bert_text_classification.ipynb -------------------------------------------------------------------------------- /code/C8/01_build_category.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/01_build_category.py -------------------------------------------------------------------------------- /code/C8/02_build_vocabulary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/02_build_vocabulary.py -------------------------------------------------------------------------------- /code/C8/03_data_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/03_data_loader.py -------------------------------------------------------------------------------- /code/C8/04_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/04_model.py -------------------------------------------------------------------------------- /code/C8/05_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/05_train.py -------------------------------------------------------------------------------- /code/C8/06_predict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/06_predict.py -------------------------------------------------------------------------------- /code/C8/data/CMeEE-V2_dev.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/data/CMeEE-V2_dev.json -------------------------------------------------------------------------------- /code/C8/data/CMeEE-V2_train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/data/CMeEE-V2_train.json -------------------------------------------------------------------------------- /code/C8/data/categories.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/data/categories.json -------------------------------------------------------------------------------- /code/C8/data/vocabulary.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/data/vocabulary.json -------------------------------------------------------------------------------- /code/C8/src/configs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/configs/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/configs/configs.py -------------------------------------------------------------------------------- /code/C8/src/data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/data/data_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/data/data_loader.py -------------------------------------------------------------------------------- /code/C8/src/data/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/data/dataset.py -------------------------------------------------------------------------------- /code/C8/src/loss/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/loss/ner_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/loss/ner_loss.py -------------------------------------------------------------------------------- /code/C8/src/metrics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/metrics/entity_metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/metrics/entity_metrics.py -------------------------------------------------------------------------------- /code/C8/src/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/models/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/models/base.py -------------------------------------------------------------------------------- /code/C8/src/models/ner_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/models/ner_model.py -------------------------------------------------------------------------------- /code/C8/src/tokenizer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/tokenizer/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/tokenizer/base.py -------------------------------------------------------------------------------- /code/C8/src/tokenizer/char_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/tokenizer/char_tokenizer.py -------------------------------------------------------------------------------- /code/C8/src/tokenizer/vocabulary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/tokenizer/vocabulary.py -------------------------------------------------------------------------------- /code/C8/src/trainer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/trainer/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/trainer/trainer.py -------------------------------------------------------------------------------- /code/C8/src/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /code/C8/src/utils/early_stop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/utils/early_stop.py -------------------------------------------------------------------------------- /code/C8/src/utils/file_io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/utils/file_io.py -------------------------------------------------------------------------------- /code/C8/src/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/code/C8/src/utils/logger.py -------------------------------------------------------------------------------- /docs/.nojekyll: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/README.md -------------------------------------------------------------------------------- /docs/_sidebar.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/_sidebar.md -------------------------------------------------------------------------------- /docs/chapter1/01_nlp_intro.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter1/01_nlp_intro.md -------------------------------------------------------------------------------- /docs/chapter1/images/1_1_1.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter1/images/1_1_1.gif -------------------------------------------------------------------------------- /docs/chapter11/01_PEFT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/01_PEFT.md -------------------------------------------------------------------------------- /docs/chapter11/02_lora.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/02_lora.md -------------------------------------------------------------------------------- /docs/chapter11/03_peft_lora.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/03_peft_lora.md -------------------------------------------------------------------------------- /docs/chapter11/04_qwen2.5_qlora.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/04_qwen2.5_qlora.md -------------------------------------------------------------------------------- /docs/chapter11/images/11_1_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_1_1.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_1_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_1_2.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_1_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_1_3.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_1_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_1_4.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_1_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_1_5.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_1_6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_1_6.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_2_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_2_1.svg -------------------------------------------------------------------------------- /docs/chapter11/images/11_2_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_2_2.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_2_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_2_3.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_2_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_2_4.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_3_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_3_1.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_4_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_4_1.png -------------------------------------------------------------------------------- /docs/chapter11/images/11_4_2.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter11/images/11_4_2.svg -------------------------------------------------------------------------------- /docs/chapter12/01_RLHF.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/01_RLHF.md -------------------------------------------------------------------------------- /docs/chapter12/02_llama_factory.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/02_llama_factory.md -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_1.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_2.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_3.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_4.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_5.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_6.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_7.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_1_8.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_1_8.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_1.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_10.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_10.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_11.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_11.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_2.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_3.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_4.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_5.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_6.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_7.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_8.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_8.png -------------------------------------------------------------------------------- /docs/chapter12/images/12_2_9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter12/images/12_2_9.png -------------------------------------------------------------------------------- /docs/chapter14/01_fastapi.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/01_fastapi.md -------------------------------------------------------------------------------- /docs/chapter14/02_uv_linux.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/02_uv_linux.md -------------------------------------------------------------------------------- /docs/chapter14/03_docker_deploy.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/03_docker_deploy.md -------------------------------------------------------------------------------- /docs/chapter14/images/14_1_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_1_1.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_1_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_1_2.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_1_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_1_3.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_1.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_10.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_10.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_11.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_11.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_12.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_2.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_3.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_4.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_5.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_6.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_7.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_8.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_8.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_2_9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_2_9.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_1.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_2.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_3.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_4.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_5.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_6.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_7.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_8.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_8.png -------------------------------------------------------------------------------- /docs/chapter14/images/14_3_9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter14/images/14_3_9.png -------------------------------------------------------------------------------- /docs/chapter16/01_LLM_safety_overview.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter16/01_LLM_safety_overview.md -------------------------------------------------------------------------------- /docs/chapter16/02_threat_modeling_analysis.md: -------------------------------------------------------------------------------- 1 | # 第二节 威胁建模分析 2 | -------------------------------------------------------------------------------- /docs/chapter16/images/16_1_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter16/images/16_1_1.png -------------------------------------------------------------------------------- /docs/chapter16/images/16_1_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter16/images/16_1_2.png -------------------------------------------------------------------------------- /docs/chapter16/images/16_1_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter16/images/16_1_3.png -------------------------------------------------------------------------------- /docs/chapter16/images/16_1_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter16/images/16_1_4.png -------------------------------------------------------------------------------- /docs/chapter2/03_tokenization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter2/03_tokenization.md -------------------------------------------------------------------------------- /docs/chapter2/04_word_vector.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter2/04_word_vector.md -------------------------------------------------------------------------------- /docs/chapter2/05_Word2Vec.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter2/05_Word2Vec.md -------------------------------------------------------------------------------- /docs/chapter2/06_gensim.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter2/06_gensim.md -------------------------------------------------------------------------------- /docs/chapter2/images/2_1_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter2/images/2_1_1.svg -------------------------------------------------------------------------------- /docs/chapter2/images/2_3_1.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter2/images/2_3_1.gif -------------------------------------------------------------------------------- /docs/chapter2/images/2_3_2.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter2/images/2_3_2.svg -------------------------------------------------------------------------------- /docs/chapter3/08_RNN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter3/08_RNN.md -------------------------------------------------------------------------------- /docs/chapter3/09_LSTM&GRU.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter3/09_LSTM&GRU.md -------------------------------------------------------------------------------- /docs/chapter3/images/3_1_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter3/images/3_1_1.svg -------------------------------------------------------------------------------- /docs/chapter3/images/3_2_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter3/images/3_2_1.svg -------------------------------------------------------------------------------- /docs/chapter3/images/3_2_2.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter3/images/3_2_2.svg -------------------------------------------------------------------------------- /docs/chapter4/10_seq2seq.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter4/10_seq2seq.md -------------------------------------------------------------------------------- /docs/chapter4/11_attention.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter4/11_attention.md -------------------------------------------------------------------------------- /docs/chapter4/12_transformer.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter4/12_transformer.md -------------------------------------------------------------------------------- /docs/chapter4/images/4_1_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter4/images/4_1_1.svg -------------------------------------------------------------------------------- /docs/chapter4/images/4_2_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter4/images/4_2_1.svg -------------------------------------------------------------------------------- /docs/chapter4/images/4_3_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter4/images/4_3_1.svg -------------------------------------------------------------------------------- /docs/chapter5/13_Bert.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/13_Bert.md -------------------------------------------------------------------------------- /docs/chapter5/14_GPT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/14_GPT.md -------------------------------------------------------------------------------- /docs/chapter5/15_T5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/15_T5.md -------------------------------------------------------------------------------- /docs/chapter5/16_HuggingFace.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/16_HuggingFace.md -------------------------------------------------------------------------------- /docs/chapter5/images/5_1_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/images/5_1_1.png -------------------------------------------------------------------------------- /docs/chapter5/images/5_1_2.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/images/5_1_2.svg -------------------------------------------------------------------------------- /docs/chapter5/images/5_1_3.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/images/5_1_3.svg -------------------------------------------------------------------------------- /docs/chapter5/images/5_2_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/images/5_2_1.png -------------------------------------------------------------------------------- /docs/chapter5/images/5_3_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/images/5_3_1.png -------------------------------------------------------------------------------- /docs/chapter5/images/5_3_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/images/5_3_2.png -------------------------------------------------------------------------------- /docs/chapter5/images/5_4_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter5/images/5_4_1.png -------------------------------------------------------------------------------- /docs/chapter6/17_handcraft_llama2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/17_handcraft_llama2.md -------------------------------------------------------------------------------- /docs/chapter6/18_MoE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/18_MoE.md -------------------------------------------------------------------------------- /docs/chapter6/images/6_1_1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_1_1.svg -------------------------------------------------------------------------------- /docs/chapter6/images/6_1_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_1_2.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_1.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_10.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_10.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_11.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_11.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_12.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_13.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_13.svg -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_2.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_3.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_4.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_5.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_6.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_7.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_8.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_8.png -------------------------------------------------------------------------------- /docs/chapter6/images/6_2_9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter6/images/6_2_9.png -------------------------------------------------------------------------------- /docs/chapter7/01_text_classification.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/01_text_classification.md -------------------------------------------------------------------------------- /docs/chapter7/02_lstm_text_classification.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/02_lstm_text_classification.md -------------------------------------------------------------------------------- /docs/chapter7/03_bert_text_classification.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/03_bert_text_classification.md -------------------------------------------------------------------------------- /docs/chapter7/images/7_1_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/images/7_1_1.png -------------------------------------------------------------------------------- /docs/chapter7/images/7_1_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/images/7_1_2.png -------------------------------------------------------------------------------- /docs/chapter7/images/7_1_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/images/7_1_3.png -------------------------------------------------------------------------------- /docs/chapter7/images/7_2_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/images/7_2_1.png -------------------------------------------------------------------------------- /docs/chapter7/images/7_2_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/images/7_2_2.png -------------------------------------------------------------------------------- /docs/chapter7/images/7_3_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter7/images/7_3_1.png -------------------------------------------------------------------------------- /docs/chapter8/01_named_entity_recognition.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter8/01_named_entity_recognition.md -------------------------------------------------------------------------------- /docs/chapter8/02_data_processing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter8/02_data_processing.md -------------------------------------------------------------------------------- /docs/chapter8/03_model_building_and_training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter8/03_model_building_and_training.md -------------------------------------------------------------------------------- /docs/chapter8/04_evaluation_and_prediction.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter8/04_evaluation_and_prediction.md -------------------------------------------------------------------------------- /docs/chapter8/images/8_2_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter8/images/8_2_1.png -------------------------------------------------------------------------------- /docs/chapter8/images/8_2_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter8/images/8_2_2.png -------------------------------------------------------------------------------- /docs/chapter8/images/8_3_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/chapter8/images/8_3_1.png -------------------------------------------------------------------------------- /docs/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/index.html -------------------------------------------------------------------------------- /docs/logo.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/logo.svg -------------------------------------------------------------------------------- /docs/约定.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/docs/约定.md -------------------------------------------------------------------------------- /logo.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/datawhalechina/base-nlp/HEAD/logo.svg --------------------------------------------------------------------------------