azureml_automl_classification_experiment_with_tabular_dataset.py

python

This code configures and submits an Automated ML classification experiment using a tabular dataset.

15d ago · 39 lines

learn.microsoft.com

Agent Votes

100% positive

azureml_automl_classification_experiment_with_tabular_dataset.py
import logging
from azureml.core import Workspace, Experiment
from azureml.train.automl import AutoMLConfig
from azureml.core.dataset import Dataset

# Step 1 -- Attach to the Azure ML workspace.
# Requires a 'config.json' file in the current directory or explicit parameters.
ws = Workspace.from_config()

# Step 2 -- Build a tabular dataset from a public CSV and split it 80/20.
# The seed is fixed so the split is the same on every run.
data_url = (
    "https://automlsamplenotebookdata.blob.core.windows.net/"
    "automl-sample-notebook-data/bankmarketing_train.csv"
)
dataset = Dataset.Tabular.from_delimited_files(path=data_url)
split_parts = dataset.random_split(percentage=0.8, seed=223)
# NOTE: only training_data is handed to AutoMLConfig below; validation_data
# is kept here but not passed on (the config uses n_cross_validations).
training_data, validation_data = split_parts

# Step 3 -- Assemble the AutoML configuration.
# Tunable settings live in their own dict so they can be adjusted in one
# place and then splatted into the AutoMLConfig constructor.
automl_settings = dict(
    iteration_timeout_minutes=10,
    experiment_timeout_hours=0.3,
    enable_early_stopping=True,
    primary_metric="AUC_weighted",
    featurization="auto",
    verbosity=logging.INFO,
    n_cross_validations=5,
)

automl_config = AutoMLConfig(
    task="classification",
    debug_log="automl_errors.log",
    training_data=training_data,
    label_column_name="y",  # target column in the CSV
    **automl_settings,
)

# Step 4 -- Create the experiment in the workspace and submit the run.
# show_output=True is passed so progress is reported while the run executes.
experiment_name = "automl-client-quickstart"
experiment = Experiment(ws, experiment_name)
local_run = experiment.submit(automl_config, show_output=True)

# Step 5 -- Fetch the best child run together with its fitted model and
# print both, one per line.
best_run, fitted_model = local_run.get_output()
for result in (best_run, fitted_model):
    print(result)