# BASIC
pu_params:
    classifiers: [ExtraTreesClassifier, RandomForestClassifier, SVC, GradientBoostingClassifier, DNN, XGBoost]
    iterations: 10 
    nthreads: 4 

run_steps:
    run_boruta: False 
    run_unsupervised: True 

# ADVANCED
run_advanced:
    include_disease_features: True
    generic_classifier: None # None (default), All (default for Generic), AD, AR, AD_only, AR_only
    hide_seed_genes_ratio: 0 # default: 0 (keep all seed genes)
    seed_pos_ratio: 0.8 
    random_seeds: False

supervised_filters:
    feature_selection: None # Options: boruta, None
    boruta_iterations: 20
    boruta_decision_thres: 90 
    add_original_features_in_stacking: True 
    test_size: 0.2 
    balancing_ratio: 1.5 
    random_fold_split: True # use False for parameter GridSearch and debugging
    kfold: 10 

static:
    Y_label: known_gene
    gene_name: Gene_Name
    data_dir: ./data

eda_filters:
    drop_missing_data_features: True
    discard_highly_correlated: True
    drop_gene_len_features: False
    manual_feature_selection: False
    create_plots: True

eda_parameters:
    high_corr_thres: 0.8
    missing_data_thres: 0.25
