|
- import pandas as pd
-
- from searcher import schemas as schemas_utils
- from searcher.utils import generate_dataset_problem, evaluate_pipeline
-
- table_path = 'datasets/yahoo_sub_5.csv'
- target_index = 6 # what column is the target
-
- #table_path = 'datasets/NAB/realTweets/labeled_Twitter_volume_IBM.csv' # The path of the dataset
- time_limit = 30 # How many seconds you wanna search
- #metric = 'F1' # F1 on label 1
- metric = 'F1_MACRO' # F1 on both label 0 and 1
-
- # Read data and generate dataset and problem
- df = pd.read_csv(table_path)
- dataset, problem_description = generate_dataset_problem(df, target_index=target_index, metric=metric)
-
- # Load the default pipeline
- pipeline = schemas_utils.load_default_pipeline()
-
- # Run the pipeline
- pipeline_result = evaluate_pipeline(problem_description, dataset, pipeline)
- print(pipeline_result)
|