import os

try:
    from transformers import Seq2SeqTrainer
except ImportError:
    # Fall back to a bare base class so this module can still be imported
    # when transformers is not installed.
    Seq2SeqTrainer = object


class TrainerForAuto(Seq2SeqTrainer):
    """A Trainer that dispatches to Seq2SeqTrainer or the plain Trainer.

    When ``self._is_seq2seq`` is truthy, generation-specific arguments are
    forwarded to ``Seq2SeqTrainer``; otherwise calls skip ``Seq2SeqTrainer``
    in the MRO and go straight to ``transformers.Trainer``.
    """

    def predict(
        self,
        test_dataset,
        ignore_keys=None,
        metric_key_prefix=None,
        max_length=None,
        num_beams=None,
    ):
        if getattr(self, "_is_seq2seq", None):
            return super().predict(
                test_dataset,
                ignore_keys,
                metric_key_prefix,
                max_length,
                num_beams,
            )
        else:
            # Bypass Seq2SeqTrainer in the MRO: transformers.Trainer.predict
            # does not accept the generation arguments.
            return super(Seq2SeqTrainer, self).predict(
                test_dataset, ignore_keys, metric_key_prefix
            )

    def prediction_step(
        self,
        model,
        inputs,
        prediction_loss_only,
        ignore_keys,
    ):
        if getattr(self, "_is_seq2seq", None):
            return super().prediction_step(
                model, inputs, prediction_loss_only, ignore_keys
            )
        else:
            return super(Seq2SeqTrainer, self).prediction_step(
                model, inputs, prediction_loss_only, ignore_keys
            )
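
    # Illustrative use of the `_is_seq2seq` switch (assumed caller behavior,
    # not defined in this module): the driver that constructs the trainer is
    # expected to set the flag before predict/evaluate are called, e.g.
    #
    #     trainer = TrainerForAuto(model=model, args=training_args, ...)
    #     trainer._is_seq2seq = True  # route calls through Seq2SeqTrainer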

    def evaluate(
        self,
        eval_dataset=None,
        ignore_keys=None,
        metric_key_prefix="eval",
    ):
        """Override transformers.Trainer.evaluate, recording metrics and the checkpoint path."""
        from transformers.trainer_utils import PREFIX_CHECKPOINT_DIR

        ckpt_dir = os.path.join(
            self.args.output_dir, f"{PREFIX_CHECKPOINT_DIR}-{self.state.global_step}"
        )
        eval_dataset = eval_dataset if eval_dataset is not None else self.eval_dataset
        # For seq2seq tasks (e.g., summarization), forward the generation
        # arguments to Seq2SeqTrainer.evaluate; otherwise bypass Seq2SeqTrainer
        # and call transformers.Trainer.evaluate directly.
        if getattr(self, "_is_seq2seq", None):
            metrics = eval_dataset and super().evaluate(
                eval_dataset,
                ignore_keys,
                metric_key_prefix,
                max_length=self.args.generation_max_length,
                num_beams=self.args.generation_num_beams,
            )
        else:
            metrics = eval_dataset and super(Seq2SeqTrainer, self).evaluate(
                eval_dataset,
                ignore_keys,
                metric_key_prefix,
            )
        if metrics:
            # Strip the "eval_" prefix so metric names are uniform downstream.
            for key in list(metrics.keys()):
                if key.startswith("eval_"):
                    metrics[key[5:]] = metrics.pop(key)
        # Record the mapping from checkpoint directory to global step and
        # metrics, creating the bookkeeping dicts on first use.
        if hasattr(self, "ckpt_to_global_step"):
            self.ckpt_to_global_step[ckpt_dir] = self.state.global_step
            if metrics:
                self.ckpt_to_metric[ckpt_dir] = metrics
        else:
            self.ckpt_to_global_step = {ckpt_dir: self.state.global_step}
            self.ckpt_to_metric = {ckpt_dir: metrics} if metrics else {}
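

# Illustrative sketch (not from the original module) of how a caller might use
# the bookkeeping that `evaluate` maintains to pick the best checkpoint; the
# `metric_name` and `greater_is_better` parameters are assumptions made for
# this example (note the "eval_" prefix has already been stripped from keys):
#
#     def best_checkpoint(trainer, metric_name="loss", greater_is_better=False):
#         scored = {
#             ckpt: m[metric_name]
#             for ckpt, m in trainer.ckpt_to_metric.items()
#             if metric_name in m
#         }
#         pick = max if greater_is_better else min
#         return pick(scored, key=scored.get)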

# TODO: for SUMMARIZATION tasks a dedicated Seq2SeqTrainerForAuto subclass is
# needed; the draft below has not been verified, so debug it before
# uncommenting:
# class Seq2SeqTrainerForAuto(TrainerForAuto):
#     def evaluate(self, eval_dataset=None, ignore_keys=None, metric_key_prefix="eval"):
#         """Override TrainerForAuto.evaluate, forcing the seq2seq code path."""
#         self._is_seq2seq = True
#         TrainerForAuto.evaluate(self, eval_dataset, ignore_keys, metric_key_prefix)
#         # alternatively:
#         # super(TrainerForAuto, self).evaluate(
#         #     eval_dataset, ignore_keys, metric_key_prefix
#         # )

# TODO: for QUESTIONANSWERING tasks, uncomment the class below and adapt the
# code in https://github.com/huggingface/transformers/blob/master/examples/pytorch/question-answering/trainer_qa.py#L28
# class QATrainerForAuto(TrainerForAuto):
#     pass

# TODO: for QUESTIONANSWERING tasks, do the answer post-processing here.
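
# A minimal commented sketch of what that QA post-processing hook could look
# like, adapted from the trainer_qa.py example linked above; it is an
# assumption rather than part of this module, and `eval_examples` /
# `post_process_function` are hypothetical caller-supplied arguments:
#
#     class QATrainerForAuto(TrainerForAuto):
#         def __init__(self, *args, eval_examples=None, post_process_function=None, **kwargs):
#             super().__init__(*args, **kwargs)
#             self.eval_examples = eval_examples
#             self.post_process_function = post_process_function
#
#         def evaluate(self, eval_dataset=None, ignore_keys=None, metric_key_prefix="eval"):
#             eval_dataset = eval_dataset if eval_dataset is not None else self.eval_dataset
#             # Temporarily disable compute_metrics so the prediction loop
#             # returns raw start/end logits (the same trick trainer_qa.py uses).
#             compute_metrics, self.compute_metrics = self.compute_metrics, None
#             try:
#                 output = self.predict(eval_dataset, ignore_keys, metric_key_prefix)
#             finally:
#                 self.compute_metrics = compute_metrics
#             if self.post_process_function is not None and compute_metrics is not None:
#                 # Map the raw logits back to answer strings, then score them.
#                 eval_preds = self.post_process_function(
#                     self.eval_examples, eval_dataset, output.predictions
#                 )
#                 return compute_metrics(eval_preds)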