import logging
import time

import flaml
from ray import tune

import submit_train_pipeline

logger = logging.getLogger(__name__)
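

# run_with_config is the trial function handed to flaml.tune.run: each call
# submits one AzureML pipeline run with the sampled hyperparameters, then
# polls it and reports the evaluation metric back to the tuner as it runs.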
def run_with_config(config: dict):
    """Run the pipeline with a given config dict."""

    # Pass the hyperparameters to the AzureML job by overriding its config file.
    overrides = [f"{key}={value}" for key, value in config.items()]
    print(overrides)
    run = submit_train_pipeline.build_and_submit_aml_pipeline(overrides)
    print(run.get_portal_url())

    # Poll the run to retrieve the metric to optimize before the job completes.
    stop = False
    while not stop:
        # get status
        status = run._core_run.get_status()
        print(f"status: {status}")

        # get metrics
        metrics = run._core_run.get_metrics(recursive=True)
        if metrics:
            run_metrics = list(metrics.values())
            new_metric = run_metrics[0]["eval_binary_error"]
            # The metric may be logged as a list of values; keep the latest.
            if isinstance(new_metric, list):
                new_metric = new_metric[-1]
            print(f"eval_binary_error: {new_metric}")
            # Report the intermediate result back to the tuner.
            tune.report(eval_binary_error=new_metric)

        time.sleep(5)

        # Stop polling once the run reaches a terminal state; compare
        # case-insensitively since status strings vary in casing
        # (AzureML reports e.g. "Failed" / "Completed").
        if status.lower() in ("failed", "completed"):
            stop = True
            print("The run has terminated.")
            print(status)

    return
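

# tune_pipeline configures and launches the HPO job: it defines the search
# space over the training config and hands run_with_config to flaml.tune.run,
# which evaluates one sampled configuration per trial.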
def tune_pipeline(concurrent_run=1):
    start_time = time.time()

    # Configure the HPO job.
    search_space = {
        "train_config.n_estimators": flaml.tune.randint(50, 200),
        "train_config.learning_rate": flaml.tune.uniform(0.01, 0.5),
    }
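
    # Each dotted key above is rendered as an override string such as
    # "train_config.n_estimators=120" by run_with_config and forwarded to the
    # training job through submit_train_pipeline.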

    hp_metric = "eval_binary_error"
    mode = "max"
    num_samples = 2

    if concurrent_run > 1:
        import ray  # For parallel tuning

        ray.init(num_cpus=concurrent_run)
        use_ray = True
    else:
        use_ray = False
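
    # With use_ray=True, flaml.tune.run executes trials concurrently on the Ray
    # instance started above; otherwise trials run sequentially in this process.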

    # launch the HPO job
    analysis = flaml.tune.run(
        run_with_config,
        config=search_space,
        metric=hp_metric,
        mode=mode,
        num_samples=num_samples,  # number of trials
        use_ray=use_ray,
    )

    # Get the best trial and summarize the results.
    best_trial = analysis.get_best_trial(hp_metric, mode, "all")
    metric = best_trial.metric_analysis[hp_metric][mode]
    print(f"n_trials={len(analysis.trials)}")
    print(f"time={time.time() - start_time}")
    print(f"Best {hp_metric}: {metric:.4f}")
    print(f"Best configuration: {best_trial.config}")


if __name__ == "__main__":
    # For parallel tuning, pass concurrent_run > 1.
    tune_pipeline(concurrent_run=2)