NVIDIA / NeMo-Aligner

Scalable toolkit for efficient model alignment
Apache License 2.0
507 stars 55 forks source link

DPO Training error: NameError: name 'RetroConfig' is not defined #262

Closed sunilitggu closed 1 month ago

sunilitggu commented 1 month ago

I followed the steps provided for DPO training at https://docs.nvidia.com/nemo-framework/user-guide/latest/modelalignment/dpo.html and the training script fails at import time with the error below.

```
Starting training ***STARTING****

Starting training
Traceback (most recent call last):
  File "/vast/core42-nlp/users/sunil.sahu/projects/llm/dpo_training/NeMo-Aligner/examples/nlp/gpt/train_gpt_dpo.py", line 22, in <module>
    from nemo_aligner.algorithms.dpo import DPOTrainer, dpo_custom_collate
  File "/vast/core42-nlp/users/sunil.sahu/projects/llm/dpo_training/NeMo-Aligner/nemo_aligner/algorithms/dpo.py", line 22, in <module>
    from nemo.collections.nlp.data.language_modeling.megatron.megatron_batch_samplers import (
  File "/opt/NeMo/nemo/collections/nlp/__init__.py", line 15, in <module>
    from nemo.collections.nlp import data, losses, models, modules
  File "/opt/NeMo/nemo/collections/nlp/models/__init__.py", line 28, in <module>
    from nemo.collections.nlp.models.language_modeling import MegatronGPTPromptLearningModel
  File "/opt/NeMo/nemo/collections/nlp/models/language_modeling/__init__.py", line 20, in <module>
    from nemo.collections.nlp.models.language_modeling.megatron_retro_model import MegatronRetroModel
  File "/opt/NeMo/nemo/collections/nlp/models/language_modeling/megatron_retro_model.py", line 37, in <module>
    from nemo.collections.nlp.data.language_modeling.megatron.retro_dataset import build_train_valid_test_datasets
  File "/opt/NeMo/nemo/collections/nlp/data/language_modeling/megatron/retro_dataset.py", line 55, in <module>
    class RETRODataset(Dataset):
  File "/opt/NeMo/nemo/collections/nlp/data/language_modeling/megatron/retro_dataset.py", line 56, in RETRODataset
    def __init__(self, cfg, retro_config: RetroConfig, tokenizer, mcore_retro_dataset, number_samples_with_neighbors):
NameError: name 'RetroConfig' is not defined
```

(The identical traceback was printed by each of the 8 ranks and their output was interleaved in the log; it is shown once here.)

sunilitggu commented 1 month ago

NA