goodmodeler committed on
Commit
635940d
·
1 Parent(s): a7af970

MOD: update readme

Browse files
Files changed (1) hide show
  1. README.md +12 -14
README.md CHANGED
@@ -49,25 +49,23 @@ export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
49
  pipeline:
50
  # 1 Fully Fine‑tune image model with ZeRO
51
  accelerate launch --deepspeed_config_file=ds_config_zero3.json train_lora.py
52
- python train_lora.py
53
 
54
- # 2 SFT 120B OSS 语言模型 with QLoRA
55
- python sft_train.py
56
 
57
- # 3 distill 120B OSS模型给20B OSS模型
58
- 用 Teacher 生成 Response,student模型用LoRA fine tuning
59
-
60
- # 4 Build RAG index
61
- python build_embeddings.py
62
 
63
- # 5 收集偏好 训练 reward model
64
- python reward_model.py
 
65
 
66
- # 6 PPO RLHF 微调20B OSS model
67
- python ppo_tune.py
68
 
69
- # 7 Inference with RAG
70
- python rag_infer.py
71
 
72
 
73
  system flow:
 
49
  pipeline:
50
  # 1 Fully Fine‑tune image model with ZeRO
51
  accelerate launch --deepspeed_config_file=ds_config_zero3.json train_lora.py
52
+ fully_fine_tine_stablediffusion
53
 
54
+ # 2 SFT 120B OSS 语言模型 with QLoRA
55
+ lauguage_model_fine_tuning
56
 
57
+ # 3 RLHF PPO 120B OSS 语言模型 with QLoRA: 训练 reward model
58
+ lauguage_model_fine_tuning
 
 
 
59
 
60
+ # 4 distill 120B OSS模型给20B OSS模型
61
+ lauguage_model_fine_tuning
62
+ 用 Teacher 生成 Response,student 模型用 LoRA fine-tuning
63
 
64
+ # 5 Build RAG index embedding table
65
+ retrieval_augmented_generation
66
 
67
+ # 6 Inference with RAG
68
+ inference.py
69
 
70
 
71
  system flow: