julycoding
diff --git a/‎applications/DeepSpeed-Chat/.gitignore‎
Lines changed: 137 additions & 0 deletions b/‎applications/DeepSpeed-Chat/.gitignore‎
Lines changed: 137 additions & 0 deletions
diff --git a/‎applications/DeepSpeed-Chat/README.md‎
Lines changed: 10 additions & 5 deletions b/‎applications/DeepSpeed-Chat/README.md‎
Lines changed: 10 additions & 5 deletions
diff --git a/‎…ing/step3_rlhf_finetuning/ppo_trainer.py‎ ‎…eepSpeed-Chat/dschat/rlhf/ppo_trainer.py‎applications/DeepSpeed-Chat/training/step3_rlhf_finetuning/ppo_trainer.py renamed to applications/DeepSpeed-Chat/dschat/rlhf/ppo_trainer.py
Lines changed: 1 addition & 6 deletions b/‎…ing/step3_rlhf_finetuning/ppo_trainer.py‎ ‎…eepSpeed-Chat/dschat/rlhf/ppo_trainer.py‎applications/DeepSpeed-Chat/training/step3_rlhf_finetuning/ppo_trainer.py renamed to applications/DeepSpeed-Chat/dschat/rlhf/ppo_trainer.py
Lines changed: 1 addition & 6 deletions
diff --git a/‎…ing/step3_rlhf_finetuning/rlhf_engine.py‎ ‎…eepSpeed-Chat/dschat/rlhf/rlhf_engine.py‎applications/DeepSpeed-Chat/training/step3_rlhf_finetuning/rlhf_engine.py renamed to applications/DeepSpeed-Chat/dschat/rlhf/rlhf_engine.py
Lines changed: 4 additions & 4 deletions b/‎…ing/step3_rlhf_finetuning/rlhf_engine.py‎ ‎…eepSpeed-Chat/dschat/rlhf/rlhf_engine.py‎applications/DeepSpeed-Chat/training/step3_rlhf_finetuning/rlhf_engine.py renamed to applications/DeepSpeed-Chat/dschat/rlhf/rlhf_engine.py
Lines changed: 4 additions & 4 deletions
diff --git a/‎…d-Chat/training/utils/data/data_utils.py‎ ‎…eed-Chat/dschat/utils/data/data_utils.py‎applications/DeepSpeed-Chat/training/utils/data/data_utils.py renamed to applications/DeepSpeed-Chat/dschat/utils/data/data_utils.py
Lines changed: 1 addition & 1 deletion b/‎…d-Chat/training/utils/data/data_utils.py‎ ‎…eed-Chat/dschat/utils/data/data_utils.py‎applications/DeepSpeed-Chat/training/utils/data/data_utils.py renamed to applications/DeepSpeed-Chat/dschat/utils/data/data_utils.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎…Chat/training/utils/data/raw_datasets.py‎ ‎…d-Chat/dschat/utils/data/raw_datasets.py‎applications/DeepSpeed-Chat/training/utils/data/raw_datasets.py renamed to applications/DeepSpeed-Chat/dschat/utils/data/raw_datasets.py b/‎…Chat/training/utils/data/raw_datasets.py‎ ‎…d-Chat/dschat/utils/data/raw_datasets.py‎applications/DeepSpeed-Chat/training/utils/data/raw_datasets.py renamed to applications/DeepSpeed-Chat/dschat/utils/data/raw_datasets.py
diff --git a/‎…eepSpeed-Chat/training/utils/ds_utils.py‎ ‎…/DeepSpeed-Chat/dschat/utils/ds_utils.py‎applications/DeepSpeed-Chat/training/utils/ds_utils.py renamed to applications/DeepSpeed-Chat/dschat/utils/ds_utils.py b/‎…eepSpeed-Chat/training/utils/ds_utils.py‎ ‎…/DeepSpeed-Chat/dschat/utils/ds_utils.py‎applications/DeepSpeed-Chat/training/utils/ds_utils.py renamed to applications/DeepSpeed-Chat/dschat/utils/ds_utils.py
diff --git a/‎…Chat/training/utils/model/model_utils.py‎ ‎…d-Chat/dschat/utils/model/model_utils.py‎applications/DeepSpeed-Chat/training/utils/model/model_utils.py renamed to applications/DeepSpeed-Chat/dschat/utils/model/model_utils.py
Lines changed: 2 additions & 3 deletions b/‎…Chat/training/utils/model/model_utils.py‎ ‎…d-Chat/dschat/utils/model/model_utils.py‎applications/DeepSpeed-Chat/training/utils/model/model_utils.py renamed to applications/DeepSpeed-Chat/dschat/utils/model/model_utils.py
Lines changed: 2 additions & 3 deletions
diff --git a/‎…hat/training/utils/model/reward_model.py‎ ‎…-Chat/dschat/utils/model/reward_model.py‎applications/DeepSpeed-Chat/training/utils/model/reward_model.py renamed to applications/DeepSpeed-Chat/dschat/utils/model/reward_model.py b/‎…hat/training/utils/model/reward_model.py‎ ‎…-Chat/dschat/utils/model/reward_model.py‎applications/DeepSpeed-Chat/training/utils/model/reward_model.py renamed to applications/DeepSpeed-Chat/dschat/utils/model/reward_model.py
diff --git a/‎…Speed-Chat/training/utils/module/lora.py‎ ‎…epSpeed-Chat/dschat/utils/module/lora.py‎applications/DeepSpeed-Chat/training/utils/module/lora.py renamed to applications/DeepSpeed-Chat/dschat/utils/module/lora.py b/‎…Speed-Chat/training/utils/module/lora.py‎ ‎…epSpeed-Chat/dschat/utils/module/lora.py‎applications/DeepSpeed-Chat/training/utils/module/lora.py renamed to applications/DeepSpeed-Chat/dschat/utils/module/lora.py
@@ -0,0 +1,137 @@
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+pip-wheel-metadata/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other info into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# IPython
+profile_default/
+ipython_config.py
+
+# pyenv
+.python-version
+
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow
+__pypackages__/
+
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Pyre type checker
+.pyre/
+
+results/
+outputs/
+
+.amltconfig
+.test_output
+*.hdf5
+*.h5
@@ -33,20 +33,24 @@ A fast, affordable, scalable and open system framework for enabling end-to-end R
 <!-- markdown-toc start - Don't edit this section. Run M-x markdown-toc-refresh-toc -->
 ## Table of Contents
 
+- [🐕DeepSpeed-Chat: Easy, Fast and Affordable RLHF Training of ChatGPT-like Models at All Scales🐕](#deepspeed-chat-easy-fast-and-affordable-rlhf-training-of-chatgpt-like-models-at-all-scales)
+- [Table of Contents](#table-of-contents)
 - [📰 Latest News 📰](#-latest-news-)
-- [🚀 What is DeepSpeed Chat 🚀️](#-what-is-deepspeed-chat-)
+- [🚀 What is DeepSpeed Chat 🚀](#-what-is-deepspeed-chat-)
 - [🧨 Capabilities 🧨](#-capabilities-)
 - [☕ Quick Start ☕](#-quick-start-)
   - [🐼 Installation](#-installation)
-  - [🐼 Single Script for Training 3-Step RLHF Pipeline](#-one-single-script-completes-all-three-stages-of-rlhf-training-and-generate-your-first-chatgpt-model)
+  - [🐼 One Single Script Completes All Three Steps of RLHF Training and Generate Your First ChatGPT Model](#-one-single-script-completes-all-three-steps-of-rlhf-training-and-generate-your-first-chatgpt-model)
   - [🐼 Demonstration: Individual Step Fine-Tuning](#-demonstration-individual-step-fine-tuning)
     - [🕐 Step 1 - Supervised Fine-Tuning](#-step-1---supervised-fine-tuning)
     - [🕑 Step 2 - Reward Model](#-step-2---reward-model)
     - [🕒 Step 3 - Reinforcement Learning with Human Feedback](#-step-3---reinforcement-learning-with-human-feedback)
-   - [🐼 Adding and using your own datasets in DeepSpeed-Chat](#-adding-and-using-your-own-datasets-in-deepspeed-chat)
-   - [🐼 Customizing RLHF training pipeline via DeepSpeed-Chat’s APIs](#-customizing-your-own-rlhf-training-pipeline-using-deepspeed-chats-rlhf-apis)
-   - [🐼 Serving Your Model: Plug-in and Test!](#-serving-plug-in-your-final-model-trained-by-deepspeed-chat-and-test-it-out)  
+  - [🐼 Adding and using your own datasets in DeepSpeed-Chat](#-adding-and-using-your-own-datasets-in-deepspeed-chat)
+  - [🐼 Customizing your own RLHF training pipeline using DeepSpeed-Chat’s RLHF APIs](#-customizing-your-own-rlhf-training-pipeline-using-deepspeed-chats-rlhf-apis)
+  - [🐼 Serving: Plug-in your final model trained by DeepSpeed-Chat and test it out!](#-serving-plug-in-your-final-model-trained-by-deepspeed-chat-and-test-it-out)
 - [🔥 Training Performance Evaluation 🔥](#-training-performance-evaluation-)
+  - [🐲 Superior Model Scale and Low Training Cost](#-superior-model-scale-and-low-training-cost)
+  - [🐲 Throughput and Model Size Scalability Comparisons with Existing RLHF Systems](#-throughput-and-model-size-scalability-comparisons-with-existing-rlhf-systems)
 - [😽 Supported Models 😽](#-supported-models-)
 - [🔬 Build Pipeline Status 🔬](#-build-pipeline-status-)
 - [⚓ Documentation and Tutorial ⚓](#-documentation-and-tutorial-)
@@ -119,6 +123,7 @@ pip install deepspeed>=0.9.0
 git clone https://github.com/microsoft/DeepSpeedExamples.git
 cd DeepSpeedExamples/applications/DeepSpeed-Chat/
 pip install -r requirements.txt
+pip install -e .
 ```
 
 ### 🐼 One Single Script Completes All Three Steps of RLHF Training and Generate Your First ChatGPT Model
 
@@ -4,17 +4,12 @@
 # DeepSpeed Team
 import torch
 import torch.nn.functional as F
-import sys
-import os
 import time
 import deepspeed
 from deepspeed.runtime.zero.partition_parameters import ZeroParamStatus
 from deepspeed.accelerator import get_accelerator
 
-sys.path.append(
-    os.path.abspath(os.path.join(os.path.dirname(__file__), os.path.pardir)))
-
-from utils.utils import print_rank_0
+from dschat.utils.utils import print_rank_0
 
 
 def print_all_ranks(tag, value, rank):
 
@@ -9,10 +9,10 @@
 from deepspeed.ops.adam import DeepSpeedCPUAdam
 from transformers import AutoModelForCausalLM, get_scheduler
 
-from utils.ds_utils import get_train_ds_config, get_eval_ds_config
-from utils.module.lora import convert_linear_layer_to_lora, only_optimize_lora_parameters, make_model_gradient_checkpointing_compatible
-from utils.model.model_utils import create_hf_model, create_critic_model
-from utils.utils import get_optimizer_grouped_parameters
+from dschat.utils.ds_utils import get_train_ds_config, get_eval_ds_config
+from dschat.utils.module.lora import convert_linear_layer_to_lora, only_optimize_lora_parameters, make_model_gradient_checkpointing_compatible
+from dschat.utils.model.model_utils import create_hf_model, create_critic_model
+from dschat.utils.utils import get_optimizer_grouped_parameters
 """
 TODOs:
   * support HF models for critic (for debugging), must be a previously saved ckpt from step-2
 
@@ -14,7 +14,7 @@
 import os
 import hashlib
 from itertools import chain
-from . import raw_datasets
+from dschat.utils.data import raw_datasets
 from deepspeed.accelerator import get_accelerator
 
 
 
@@ -12,9 +12,8 @@
 from huggingface_hub import snapshot_download
 from transformers.deepspeed import HfDeepSpeedConfig
 
-from .reward_model import RewardModel
-from ..utils import load_state_dict_into_model
-from ..utils import print_rank_0
+from dschat.utils.model.reward_model import RewardModel
+from dschat.utils.utils import load_state_dict_into_model, print_rank_0
 
 
 def configure_dropout(model_config, dropout):