diff --git a/docs/sphinx-builddir/doctrees/environment.pickle b/docs/sphinx-builddir/doctrees/environment.pickle index fa4f775..3d5a972 100644 Binary files a/docs/sphinx-builddir/doctrees/environment.pickle and b/docs/sphinx-builddir/doctrees/environment.pickle differ diff --git a/docs/sphinx-builddir/doctrees/nbsphinx/notebooks/QSARtuna_Tutorial.ipynb b/docs/sphinx-builddir/doctrees/nbsphinx/notebooks/QSARtuna_Tutorial.ipynb index 3968fe6..030a871 100644 --- a/docs/sphinx-builddir/doctrees/nbsphinx/notebooks/QSARtuna_Tutorial.ipynb +++ b/docs/sphinx-builddir/doctrees/nbsphinx/notebooks/QSARtuna_Tutorial.ipynb @@ -893,7 +893,7 @@ "text": [ "[I 2024-08-27 14:01:27,262] A new study created in memory with name: my_study_stratified_split\n", "[I 2024-08-27 14:01:27,303] A new study created in memory with name: study_name_0\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 14:01:27,408] Trial 0 finished with value: -3999.9364276424735 and parameters: {'algorithm_name': 'SVR', 'SVR_algorithm_hash': 'ea7ccc7ef4a9329af0d4e39eb6184933', 'gamma__ea7ccc7ef4a9329af0d4e39eb6184933': 0.11270803112210707, 'C__ea7ccc7ef4a9329af0d4e39eb6184933': 43.81076443656638, 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3999.9364276424735.\n", "[I 2024-08-27 14:01:27,485] Trial 1 finished with value: -1856.4459752935309 and parameters: {'algorithm_name': 'PLSRegression', 'PLSRegression_algorithm_hash': '9f2f76e479633c0bf18cf2912fed9eda', 'n_components__9f2f76e479633c0bf18cf2912fed9eda': 4, 'descriptor': '{\"name\": \"MACCS_keys\", \"parameters\": {}}'}. Best is trial 1 with value: -1856.4459752935309.\n", @@ -1726,9 +1726,9 @@ "Traceback (most recent call last):\n", " File \"/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/optuna/study/_optimize.py\", line 196, in _run_trial\n", " value_or_values = func(trial)\n", - " File \"/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/objective.py\", line 128, in __call__\n", + " File \"/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/objective.py\", line 128, in __call__\n", " self._validate_algos()\n", - " File \"/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/objective.py\", line 270, in _validate_algos\n", + " File \"/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/objective.py\", line 270, in _validate_algos\n", " raise ValueError(\n", "ValueError: PRFClassifier supplied but response column outside [0.0-1.0] acceptable range. Response max: 9.7, response min: 5.3 \n", "[W 2024-08-27 14:02:47,253] Trial 0 failed with value None.\n" @@ -3388,7 +3388,7 @@ "[I 2024-08-27 14:09:24,367] A new study created in memory with name: my_study\n", "[I 2024-08-27 14:09:24,410] A new study created in memory with name: study_name_0\n", "INFO:root:Enqueued ChemProp manual trial with sensible defaults: {'activation__fd833c2dde0b7147e6516ea5eebb2657': 'ReLU', 'aggregation__fd833c2dde0b7147e6516ea5eebb2657': 'mean', 'aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657': 100, 'batch_size__fd833c2dde0b7147e6516ea5eebb2657': 50, 'depth__fd833c2dde0b7147e6516ea5eebb2657': 3, 'dropout__fd833c2dde0b7147e6516ea5eebb2657': 0.0, 'features_generator__fd833c2dde0b7147e6516ea5eebb2657': 'none', 'ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300, 'ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657': 2, 'final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300, 'init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657': -3, 'warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657': 0.1, 'algorithm_name': 'ChemPropClassifier', 'ChemPropClassifier_algorithm_hash': 'fd833c2dde0b7147e6516ea5eebb2657'}\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:859)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:859)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 14:16:18,484] Trial 0 finished with value: 0.65625 and parameters: {'algorithm_name': 'ChemPropClassifier', 'ChemPropClassifier_algorithm_hash': 'fd833c2dde0b7147e6516ea5eebb2657', 'activation__fd833c2dde0b7147e6516ea5eebb2657': , 'aggregation__fd833c2dde0b7147e6516ea5eebb2657': , 'aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657': 100.0, 'batch_size__fd833c2dde0b7147e6516ea5eebb2657': 50.0, 'depth__fd833c2dde0b7147e6516ea5eebb2657': 3.0, 'dropout__fd833c2dde0b7147e6516ea5eebb2657': 0.0, 'ensemble_size__fd833c2dde0b7147e6516ea5eebb2657': 5, 'epochs__fd833c2dde0b7147e6516ea5eebb2657': 4, 'features_generator__fd833c2dde0b7147e6516ea5eebb2657': , 'ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657': 2.0, 'final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657': -3, 'warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657': 0.1, 'descriptor': '{\"name\": \"SmilesFromFile\", \"parameters\": {}}'}. Best is trial 0 with value: 0.65625.\n", " \r" @@ -4745,7 +4745,7 @@ "text": [ "[I 2024-08-27 15:09:26,977] A new study created in memory with name: non-transform_example\n", "[I 2024-08-27 15:09:26,979] A new study created in memory with name: study_name_0\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 15:09:27,144] Trial 0 finished with value: -3501.942111261296 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 5, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", "[I 2024-08-27 15:09:27,220] Trial 1 finished with value: -5451.207265576796 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 7, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", @@ -11399,7 +11399,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "The AutoML daemon functionaility in Qptuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", + "The AutoML daemon functionaility in QSARtuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", "\n", "* __Automated Data Preparation__: Automated process of preparing data for model training, including cleaning, feature extraction, formatting and quorum checks, streamlining data preprocessing\n", "\n", @@ -11407,9 +11407,9 @@ "\n", "* __Scalable and Efficient with Dynamic Resource Allocation__: Workflow designed to handle large datasets (with multiple prediction tasks) and dynamically utilize CPU/GPU/memory HPC resources\n", "\n", - "* __Customizable SLURM and Qptuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining Qptuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", + "* __Customizable SLURM and QSARtuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining QSARtuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", "\n", - "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported Qptuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", + "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported QSARtuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", "\n", "* __Automatic Job Resubmission__: In case of SLURM job failures, the code provides functionality to automatically resubmit failed jobs with modified resource allocations, enhancing the robustness of the model training process\n", "\n", @@ -11417,7 +11417,7 @@ "\n", "* __Dry Run Mode__: Dry run mode option enables users to simulate the process without actually submitting jobs, useful for verifying configurations and testing the workflow\n", "\n", - "The following is an example from the Qptuna unit tests:" + "The following is an example from the QSARtuna unit tests:" ] }, { @@ -11534,7 +11534,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "Qptuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", + "QSARtuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", "\n", "Exports are expected to be temporal in nature, with the naming convention `%Y-%m-%d` (see [here](https://docs.python.org/3/library/datetime.html#strftime-and-strptime-behavior) for details). Data can be exported in two ways:\n", "\n", @@ -11605,7 +11605,7 @@ "Then our configuration would be:\n", "\n", "```\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"../tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\ # username should be accurate to monitor jobs\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n", @@ -11690,7 +11690,7 @@ " \"--n-cores\",\n", " \"1\",\n", " \"--dry-run\", # The dry-run option is enabled, so the AutoML pipeline does not submit to SLURM\n", - " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe Qptuna AutoML behaviour \n", + " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe QSARtuna AutoML behaviour \n", " \"--slurm-al-pool\",\n", " \"../tests/data/DRD2/subset-1000/train.csv\",\n", " \"--slurm-al-smiles-csv-column\",\n", @@ -11733,11 +11733,11 @@ "* resulting folder `data/TID1` comprises the following processed data:\n", " * `TID1.csv` : molecular property data set ready for modelling\n", " * `TID1.json`: config for an initial round of model training\n", - " * `TID1.sh`: used to run run Qptuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", + " * `TID1.sh`: used to run run QSARtuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", " * `.24_01_01` lock file initiated to track the status of the training at this timepoint\n", "* `processed_timepoints.json` is created to track which timepoints are processed\n", "\n", - "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the Qptuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", + "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the QSARtuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", "\n", "Running the AutoML workflow does a dry-run check of the status of the run:" ] @@ -11817,7 +11817,7 @@ "ml Miniconda3\n", "conda activate my_env_with_qsartuna\n", "\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"/tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n", diff --git a/docs/sphinx-builddir/doctrees/notebooks/QPTUNA_Tutorial.doctree b/docs/sphinx-builddir/doctrees/notebooks/QPTUNA_Tutorial.doctree index ed11d05..650f5c2 100644 Binary files a/docs/sphinx-builddir/doctrees/notebooks/QPTUNA_Tutorial.doctree and b/docs/sphinx-builddir/doctrees/notebooks/QPTUNA_Tutorial.doctree differ diff --git a/docs/sphinx-builddir/doctrees/notebooks/QSARtuna_Tutorial.doctree b/docs/sphinx-builddir/doctrees/notebooks/QSARtuna_Tutorial.doctree index 223c382..1728af8 100644 Binary files a/docs/sphinx-builddir/doctrees/notebooks/QSARtuna_Tutorial.doctree and b/docs/sphinx-builddir/doctrees/notebooks/QSARtuna_Tutorial.doctree differ diff --git a/docs/sphinx-builddir/doctrees/optunaz.doctree b/docs/sphinx-builddir/doctrees/optunaz.doctree index 76e5f30..382e53a 100644 Binary files a/docs/sphinx-builddir/doctrees/optunaz.doctree and b/docs/sphinx-builddir/doctrees/optunaz.doctree differ diff --git a/docs/sphinx-builddir/html/_sources/notebooks/QSARtuna_Tutorial.ipynb.txt b/docs/sphinx-builddir/html/_sources/notebooks/QSARtuna_Tutorial.ipynb.txt index 3968fe6..030a871 100644 --- a/docs/sphinx-builddir/html/_sources/notebooks/QSARtuna_Tutorial.ipynb.txt +++ b/docs/sphinx-builddir/html/_sources/notebooks/QSARtuna_Tutorial.ipynb.txt @@ -893,7 +893,7 @@ "text": [ "[I 2024-08-27 14:01:27,262] A new study created in memory with name: my_study_stratified_split\n", "[I 2024-08-27 14:01:27,303] A new study created in memory with name: study_name_0\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 14:01:27,408] Trial 0 finished with value: -3999.9364276424735 and parameters: {'algorithm_name': 'SVR', 'SVR_algorithm_hash': 'ea7ccc7ef4a9329af0d4e39eb6184933', 'gamma__ea7ccc7ef4a9329af0d4e39eb6184933': 0.11270803112210707, 'C__ea7ccc7ef4a9329af0d4e39eb6184933': 43.81076443656638, 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3999.9364276424735.\n", "[I 2024-08-27 14:01:27,485] Trial 1 finished with value: -1856.4459752935309 and parameters: {'algorithm_name': 'PLSRegression', 'PLSRegression_algorithm_hash': '9f2f76e479633c0bf18cf2912fed9eda', 'n_components__9f2f76e479633c0bf18cf2912fed9eda': 4, 'descriptor': '{\"name\": \"MACCS_keys\", \"parameters\": {}}'}. Best is trial 1 with value: -1856.4459752935309.\n", @@ -1726,9 +1726,9 @@ "Traceback (most recent call last):\n", " File \"/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/optuna/study/_optimize.py\", line 196, in _run_trial\n", " value_or_values = func(trial)\n", - " File \"/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/objective.py\", line 128, in __call__\n", + " File \"/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/objective.py\", line 128, in __call__\n", " self._validate_algos()\n", - " File \"/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/objective.py\", line 270, in _validate_algos\n", + " File \"/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/objective.py\", line 270, in _validate_algos\n", " raise ValueError(\n", "ValueError: PRFClassifier supplied but response column outside [0.0-1.0] acceptable range. Response max: 9.7, response min: 5.3 \n", "[W 2024-08-27 14:02:47,253] Trial 0 failed with value None.\n" @@ -3388,7 +3388,7 @@ "[I 2024-08-27 14:09:24,367] A new study created in memory with name: my_study\n", "[I 2024-08-27 14:09:24,410] A new study created in memory with name: study_name_0\n", "INFO:root:Enqueued ChemProp manual trial with sensible defaults: {'activation__fd833c2dde0b7147e6516ea5eebb2657': 'ReLU', 'aggregation__fd833c2dde0b7147e6516ea5eebb2657': 'mean', 'aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657': 100, 'batch_size__fd833c2dde0b7147e6516ea5eebb2657': 50, 'depth__fd833c2dde0b7147e6516ea5eebb2657': 3, 'dropout__fd833c2dde0b7147e6516ea5eebb2657': 0.0, 'features_generator__fd833c2dde0b7147e6516ea5eebb2657': 'none', 'ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300, 'ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657': 2, 'final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300, 'init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657': -3, 'warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657': 0.1, 'algorithm_name': 'ChemPropClassifier', 'ChemPropClassifier_algorithm_hash': 'fd833c2dde0b7147e6516ea5eebb2657'}\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:859)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:859)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 14:16:18,484] Trial 0 finished with value: 0.65625 and parameters: {'algorithm_name': 'ChemPropClassifier', 'ChemPropClassifier_algorithm_hash': 'fd833c2dde0b7147e6516ea5eebb2657', 'activation__fd833c2dde0b7147e6516ea5eebb2657': , 'aggregation__fd833c2dde0b7147e6516ea5eebb2657': , 'aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657': 100.0, 'batch_size__fd833c2dde0b7147e6516ea5eebb2657': 50.0, 'depth__fd833c2dde0b7147e6516ea5eebb2657': 3.0, 'dropout__fd833c2dde0b7147e6516ea5eebb2657': 0.0, 'ensemble_size__fd833c2dde0b7147e6516ea5eebb2657': 5, 'epochs__fd833c2dde0b7147e6516ea5eebb2657': 4, 'features_generator__fd833c2dde0b7147e6516ea5eebb2657': , 'ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657': 2.0, 'final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657': -3, 'warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657': 0.1, 'descriptor': '{\"name\": \"SmilesFromFile\", \"parameters\": {}}'}. Best is trial 0 with value: 0.65625.\n", " \r" @@ -4745,7 +4745,7 @@ "text": [ "[I 2024-08-27 15:09:26,977] A new study created in memory with name: non-transform_example\n", "[I 2024-08-27 15:09:26,979] A new study created in memory with name: study_name_0\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 15:09:27,144] Trial 0 finished with value: -3501.942111261296 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 5, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", "[I 2024-08-27 15:09:27,220] Trial 1 finished with value: -5451.207265576796 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 7, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", @@ -11399,7 +11399,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "The AutoML daemon functionaility in Qptuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", + "The AutoML daemon functionaility in QSARtuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", "\n", "* __Automated Data Preparation__: Automated process of preparing data for model training, including cleaning, feature extraction, formatting and quorum checks, streamlining data preprocessing\n", "\n", @@ -11407,9 +11407,9 @@ "\n", "* __Scalable and Efficient with Dynamic Resource Allocation__: Workflow designed to handle large datasets (with multiple prediction tasks) and dynamically utilize CPU/GPU/memory HPC resources\n", "\n", - "* __Customizable SLURM and Qptuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining Qptuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", + "* __Customizable SLURM and QSARtuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining QSARtuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", "\n", - "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported Qptuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", + "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported QSARtuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", "\n", "* __Automatic Job Resubmission__: In case of SLURM job failures, the code provides functionality to automatically resubmit failed jobs with modified resource allocations, enhancing the robustness of the model training process\n", "\n", @@ -11417,7 +11417,7 @@ "\n", "* __Dry Run Mode__: Dry run mode option enables users to simulate the process without actually submitting jobs, useful for verifying configurations and testing the workflow\n", "\n", - "The following is an example from the Qptuna unit tests:" + "The following is an example from the QSARtuna unit tests:" ] }, { @@ -11534,7 +11534,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "Qptuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", + "QSARtuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", "\n", "Exports are expected to be temporal in nature, with the naming convention `%Y-%m-%d` (see [here](https://docs.python.org/3/library/datetime.html#strftime-and-strptime-behavior) for details). Data can be exported in two ways:\n", "\n", @@ -11605,7 +11605,7 @@ "Then our configuration would be:\n", "\n", "```\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"../tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\ # username should be accurate to monitor jobs\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n", @@ -11690,7 +11690,7 @@ " \"--n-cores\",\n", " \"1\",\n", " \"--dry-run\", # The dry-run option is enabled, so the AutoML pipeline does not submit to SLURM\n", - " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe Qptuna AutoML behaviour \n", + " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe QSARtuna AutoML behaviour \n", " \"--slurm-al-pool\",\n", " \"../tests/data/DRD2/subset-1000/train.csv\",\n", " \"--slurm-al-smiles-csv-column\",\n", @@ -11733,11 +11733,11 @@ "* resulting folder `data/TID1` comprises the following processed data:\n", " * `TID1.csv` : molecular property data set ready for modelling\n", " * `TID1.json`: config for an initial round of model training\n", - " * `TID1.sh`: used to run run Qptuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", + " * `TID1.sh`: used to run run QSARtuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", " * `.24_01_01` lock file initiated to track the status of the training at this timepoint\n", "* `processed_timepoints.json` is created to track which timepoints are processed\n", "\n", - "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the Qptuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", + "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the QSARtuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", "\n", "Running the AutoML workflow does a dry-run check of the status of the run:" ] @@ -11817,7 +11817,7 @@ "ml Miniconda3\n", "conda activate my_env_with_qsartuna\n", "\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"/tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n", diff --git a/docs/sphinx-builddir/html/notebooks/QSARtuna_Tutorial.html b/docs/sphinx-builddir/html/notebooks/QSARtuna_Tutorial.html index 3ce50ef..a42f003 100644 --- a/docs/sphinx-builddir/html/notebooks/QSARtuna_Tutorial.html +++ b/docs/sphinx-builddir/html/notebooks/QSARtuna_Tutorial.html @@ -1094,7 +1094,7 @@

Configuration example
 [I 2024-08-27 14:01:27,262] A new study created in memory with name: my_study_stratified_split
 [I 2024-08-27 14:01:27,303] A new study created in memory with name: study_name_0
-/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)
+/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)
   return self._cached_call(args, kwargs, shelving=False)[0]
 [I 2024-08-27 14:01:27,408] Trial 0 finished with value: -3999.9364276424735 and parameters: {'algorithm_name': 'SVR', 'SVR_algorithm_hash': 'ea7ccc7ef4a9329af0d4e39eb6184933', 'gamma__ea7ccc7ef4a9329af0d4e39eb6184933': 0.11270803112210707, 'C__ea7ccc7ef4a9329af0d4e39eb6184933': 43.81076443656638, 'descriptor': '{"name": "ECFP", "parameters": {"radius": 3, "nBits": 2048, "returnRdkit": false}}'}. Best is trial 0 with value: -3999.9364276424735.
 [I 2024-08-27 14:01:27,485] Trial 1 finished with value: -1856.4459752935309 and parameters: {'algorithm_name': 'PLSRegression', 'PLSRegression_algorithm_hash': '9f2f76e479633c0bf18cf2912fed9eda', 'n_components__9f2f76e479633c0bf18cf2912fed9eda': 4, 'descriptor': '{"name": "MACCS_keys", "parameters": {}}'}. Best is trial 1 with value: -1856.4459752935309.
@@ -1807,9 +1807,9 @@ 

Interlude: Cautionary advice for PRF ∆y (response column) validityEnsemble uncertainty (ChemProp Only)
 [I 2024-08-27 15:09:26,977] A new study created in memory with name: non-transform_example
 [I 2024-08-27 15:09:26,979] A new study created in memory with name: study_name_0
-/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)
+/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)
   return self._cached_call(args, kwargs, shelving=False)[0]
 [I 2024-08-27 15:09:27,144] Trial 0 finished with value: -3501.942111261296 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 5, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': <RandomForestMaxFeatures.AUTO: 'auto'>, 'descriptor': '{"name": "ECFP", "parameters": {"radius": 3, "nBits": 2048, "returnRdkit": false}}'}. Best is trial 0 with value: -3501.942111261296.
 [I 2024-08-27 15:09:27,220] Trial 1 finished with value: -5451.207265576796 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 7, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': <RandomForestMaxFeatures.AUTO: 'auto'>, 'descriptor': '{"name": "ECFP", "parameters": {"radius": 3, "nBits": 2048, "returnRdkit": false}}'}. Best is trial 0 with value: -3501.942111261296.
@@ -5524,18 +5524,18 @@ 

Precomputed descriptors from a file example

Overview

-

The AutoML daemon functionaility in Qptuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:

+

The AutoML daemon functionaility in QSARtuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:

  • Automated Data Preparation: Automated process of preparing data for model training, including cleaning, feature extraction, formatting and quorum checks, streamlining data preprocessing

  • Model Training with SLURM: Integration with SLURM to dispatch tasks, leveraging distributed computing resources for efficient and scalable model training

  • Scalable and Efficient with Dynamic Resource Allocation: Workflow designed to handle large datasets (with multiple prediction tasks) and dynamically utilize CPU/GPU/memory HPC resources

  • -
  • Customizable SLURM and Qptuna Templates: SLURM templates can be tailored for different use cases. Both initial training and retraining Qptuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate

  • -
  • Metadata, Prediction and Model Tracking: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported Qptuna models, aiding monitoring and evaluating pseudo-prospective model performance over time

  • +
  • Customizable SLURM and QSARtuna Templates: SLURM templates can be tailored for different use cases. Both initial training and retraining QSARtuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate

  • +
  • Metadata, Prediction and Model Tracking: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported QSARtuna models, aiding monitoring and evaluating pseudo-prospective model performance over time

  • Automatic Job Resubmission: In case of SLURM job failures, the code provides functionality to automatically resubmit failed jobs with modified resource allocations, enhancing the robustness of the model training process

  • Parallel Task Processing: Supports for parallel processing training tasks, allowing for efficient handling of multiple retraining tasks simultaneously, reducing overall processing time

  • Dry Run Mode: Dry run mode option enables users to simulate the process without actually submitting jobs, useful for verifying configurations and testing the workflow

-

The following is an example from the Qptuna unit tests:

+

The following is an example from the QSARtuna unit tests:

[102]:
 
@@ -5631,7 +5631,7 @@

Note on High-Performance Computing (HPC) Setup

Data extraction options

-

Qptuna AutoML expects temporal data (--input-data) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns.

+

QSARtuna AutoML expects temporal data (--input-data) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns.

Exports are expected to be temporal in nature, with the naming convention %Y-%m-%d (see here for details). Data can be exported in two ways:

  • 1.) Multiple files: Each extraction date gets an distinct/unique file with %Y-%m-%d format within the filename, which denotes that point in temporal train time, like so:

  • @@ -5680,7 +5680,7 @@

    Walkthough running an AutoML pipeline../tests/data/DRD2/subset-1000/train.csv

Then our configuration would be:

-
qptuna-automl
+
qsartuna-automl
    --input-data "../tests/data/automl/*"  \
    --email <example>@astrazeneca.com  --user_name <example>  \ # username should be accurate to monitor jobs
    --input-smiles-csv-column canonical  --input-activity-csv-column molwt \
@@ -5724,7 +5724,7 @@ 

Walkthough running an AutoML pipeline"--n-cores", "1", "--dry-run", # The dry-run option is enabled, so the AutoML pipeline does not submit to SLURM - "-vv", # Use this CLI option to enable detailed debugging logging to observe Qptuna AutoML behaviour + "-vv", # Use this CLI option to enable detailed debugging logging to observe QSARtuna AutoML behaviour "--slurm-al-pool", "../tests/data/DRD2/subset-1000/train.csv", "--slurm-al-smiles-csv-column", @@ -5796,13 +5796,13 @@

Walkthough running an AutoML pipelineTID1.csv : molecular property data set ready for modelling

  • TID1.json: config for an initial round of model training

  • -
  • TID1.sh: used to run run Qptuna AutoML via an sbatch command, though -- dry-run prevented this happening

  • +
  • TID1.sh: used to run run QSARtuna AutoML via an sbatch command, though -- dry-run prevented this happening

  • .24_01_01 lock file initiated to track the status of the training at this timepoint

  • processed_timepoints.json is created to track which timepoints are processed

  • -

    The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the Qptuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using cron or similar).

    +

    The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the QSARtuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using cron or similar).

    Running the AutoML workflow does a dry-run check of the status of the run:

    [ ]:
    @@ -5851,7 +5851,7 @@ 

    Schedule AutoML as a daemon for up-to-date models, 'aggregation__fd833c2dde0b7147e6516ea5eebb2657': , 'aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657': 100.0, 'batch_size__fd833c2dde0b7147e6516ea5eebb2657': 50.0, 'depth__fd833c2dde0b7147e6516ea5eebb2657': 3.0, 'dropout__fd833c2dde0b7147e6516ea5eebb2657': 0.0, 'ensemble_size__fd833c2dde0b7147e6516ea5eebb2657': 5, 'epochs__fd833c2dde0b7147e6516ea5eebb2657': 4, 'features_generator__fd833c2dde0b7147e6516ea5eebb2657': , 'ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657': 2.0, 'final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657': -3, 'warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657': 0.1, 'descriptor': '{\"name\": \"SmilesFromFile\", \"parameters\": {}}'}. Best is trial 0 with value: 0.65625.\n", " \r" @@ -4745,7 +4745,7 @@ "text": [ "[I 2024-08-27 15:09:26,977] A new study created in memory with name: non-transform_example\n", "[I 2024-08-27 15:09:26,979] A new study created in memory with name: study_name_0\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 15:09:27,144] Trial 0 finished with value: -3501.942111261296 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 5, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", "[I 2024-08-27 15:09:27,220] Trial 1 finished with value: -5451.207265576796 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 7, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", @@ -11399,7 +11399,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "The AutoML daemon functionaility in Qptuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", + "The AutoML daemon functionaility in QSARtuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", "\n", "* __Automated Data Preparation__: Automated process of preparing data for model training, including cleaning, feature extraction, formatting and quorum checks, streamlining data preprocessing\n", "\n", @@ -11407,9 +11407,9 @@ "\n", "* __Scalable and Efficient with Dynamic Resource Allocation__: Workflow designed to handle large datasets (with multiple prediction tasks) and dynamically utilize CPU/GPU/memory HPC resources\n", "\n", - "* __Customizable SLURM and Qptuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining Qptuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", + "* __Customizable SLURM and QSARtuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining QSARtuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", "\n", - "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported Qptuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", + "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported QSARtuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", "\n", "* __Automatic Job Resubmission__: In case of SLURM job failures, the code provides functionality to automatically resubmit failed jobs with modified resource allocations, enhancing the robustness of the model training process\n", "\n", @@ -11417,7 +11417,7 @@ "\n", "* __Dry Run Mode__: Dry run mode option enables users to simulate the process without actually submitting jobs, useful for verifying configurations and testing the workflow\n", "\n", - "The following is an example from the Qptuna unit tests:" + "The following is an example from the QSARtuna unit tests:" ] }, { @@ -11534,7 +11534,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "Qptuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", + "QSARtuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", "\n", "Exports are expected to be temporal in nature, with the naming convention `%Y-%m-%d` (see [here](https://docs.python.org/3/library/datetime.html#strftime-and-strptime-behavior) for details). Data can be exported in two ways:\n", "\n", @@ -11605,7 +11605,7 @@ "Then our configuration would be:\n", "\n", "```\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"../tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\ # username should be accurate to monitor jobs\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n", @@ -11690,7 +11690,7 @@ " \"--n-cores\",\n", " \"1\",\n", " \"--dry-run\", # The dry-run option is enabled, so the AutoML pipeline does not submit to SLURM\n", - " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe Qptuna AutoML behaviour \n", + " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe QSARtuna AutoML behaviour \n", " \"--slurm-al-pool\",\n", " \"../tests/data/DRD2/subset-1000/train.csv\",\n", " \"--slurm-al-smiles-csv-column\",\n", @@ -11733,11 +11733,11 @@ "* resulting folder `data/TID1` comprises the following processed data:\n", " * `TID1.csv` : molecular property data set ready for modelling\n", " * `TID1.json`: config for an initial round of model training\n", - " * `TID1.sh`: used to run run Qptuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", + " * `TID1.sh`: used to run run QSARtuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", " * `.24_01_01` lock file initiated to track the status of the training at this timepoint\n", "* `processed_timepoints.json` is created to track which timepoints are processed\n", "\n", - "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the Qptuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", + "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the QSARtuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", "\n", "Running the AutoML workflow does a dry-run check of the status of the run:" ] @@ -11817,7 +11817,7 @@ "ml Miniconda3\n", "conda activate my_env_with_qsartuna\n", "\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"/tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n", diff --git a/docs/sphinx-builddir/html/optunaz.html b/docs/sphinx-builddir/html/optunaz.html index 9af66b0..33fec51 100644 --- a/docs/sphinx-builddir/html/optunaz.html +++ b/docs/sphinx-builddir/html/optunaz.html @@ -163,7 +163,7 @@

    Submodules

    optunaz.automl module

    -class optunaz.automl.ModelAutoML(output_path=None, input_data=None, n_cores=- 1, email=None, user_name=None, smiles_col=None, activity_col=None, task_col=None, dry_run=False, timestr='20240828-171643')[source]
    +class optunaz.automl.ModelAutoML(output_path=None, input_data=None, n_cores=- 1, email=None, user_name=None, smiles_col=None, activity_col=None, task_col=None, dry_run=False, timestr='20240828-172746')[source]

    Bases: object

    Prepares the data ready for the model training with ModelDispatcher. The ModelAutoML will also store activity for new tasks pending enough data.

    diff --git a/docs/sphinx-builddir/html/searchindex.js b/docs/sphinx-builddir/html/searchindex.js index bb29867..c28ffe8 100644 --- a/docs/sphinx-builddir/html/searchindex.js +++ b/docs/sphinx-builddir/html/searchindex.js @@ -1 +1 @@ -Search.setIndex({"docnames": ["README", "algorithms", "deduplicator", "descriptors", "index", "modules", "notebooks/QPTUNA_Tutorial", "notebooks/QSARtuna_Tutorial", "notebooks/preprocess_data", "optunaz", "optunaz.config", "optunaz.utils", "optunaz.utils.enums", "optunaz.utils.preprocessing", "splitters", "transform"], "filenames": ["README.md", "algorithms.rst", "deduplicator.rst", "descriptors.rst", "index.rst", "modules.rst", "notebooks/QPTUNA_Tutorial.ipynb", "notebooks/QSARtuna_Tutorial.ipynb", "notebooks/preprocess_data.ipynb", "optunaz.rst", "optunaz.config.rst", "optunaz.utils.rst", "optunaz.utils.enums.rst", "optunaz.utils.preprocessing.rst", "splitters.rst", "transform.rst"], "titles": ["QSARtuna \ud80c\udd9b: QSAR using Optimization for Hyperparameter Tuning (formerly Optuna AZ and QPTUNA)", "Available algorithms", "Available deduplicators", "Available descriptors", "Welcome to QSARtuna Documentation!", "optunaz", "QPTUNA CLI Tutorial", "QSARtuna CLI Tutorial", "Preprocessing data for QSARtuna", "optunaz package", "optunaz.config package", "optunaz.utils package", "optunaz.utils.enums package", "optunaz.utils.preprocessing package", "Available splitters", "Available transform"], "terms": {"build": [0, 4, 8, 9, 10, 11, 12], "predict": [0, 1, 3, 5, 6, 7, 8, 10, 11, 12], "compchem": 0, "develop": [0, 3, 7, 9], "uncertainti": [0, 1, 4, 8, 9, 10, 13, 15], "quantif": 0, "explain": [0, 1, 4, 5, 10], "mind": 0, "thi": [0, 1, 3, 4, 8, 9, 10, 11, 12, 13, 14], "librari": [0, 6, 7, 8], "search": [0, 1, 3, 9, 10], "best": [0, 1, 9, 10], "ml": [0, 4, 7, 10], "molecular": [0, 1, 3, 4, 6, 7, 8, 9, 10], "given": [0, 1, 3, 6, 7, 8, 9, 10, 11], "data": [0, 1, 3, 4, 9, 10, 11, 12, 13, 14, 15], "itself": [0, 6, 7], "done": [0, 6, 7], "emploi": [0, 3, 6, 7, 8, 9], "latest": [0, 9, 10], "state": [0, 6, 7, 13], "art": [0, 6, 7], "estim": [0, 1, 3, 4, 9, 10, 12], "packag": [0, 1, 3, 5, 6, 7, 8], "further": [0, 10], "document": [0, 6, 7, 8], "github": [0, 6, 7, 9, 13], "page": [0, 6], "here": [0, 3, 6, 7, 8, 9, 10, 13, 14], "public": [0, 1, 3, 4, 6, 7, 9, 10], "avail": [0, 4, 6, 7, 9, 11], "structur": [0, 1, 3, 6, 7, 8, 9, 10], "around": [0, 6, 7, 8], "train": [0, 1, 3, 4, 8, 9, 10, 11, 12, 13, 14], "mani": [0, 1, 6, 7, 10], "differ": [0, 1, 3, 6, 7, 9, 10, 11, 13], "paramet": [0, 1, 3, 6, 7, 8, 9, 10, 12, 13, 14, 15], "onli": [0, 1, 3, 8, 9, 10, 13, 14], "dataset": [0, 1, 8, 9, 10, 12, 13], "usual": [0, 1, 6, 7, 8, 10], "cross": [0, 1, 6, 7, 10, 13], "valid": [0, 1, 3, 8, 9, 10, 12, 13], "pick": 0, "evalu": [0, 4, 5, 6, 7], "its": [0, 1, 6, 7, 10, 12], "perform": [0, 3, 4, 9, 12, 13, 15], "test": [0, 1, 4, 8, 9, 10, 12, 13, 14], "prod": [0, 6, 7], "re": [0, 6, 7, 9], "merg": [0, 8, 9, 13], "ha": [0, 1, 6, 7, 8, 9, 10, 13], "drawback": [0, 6, 7], "left": [0, 6, 7, 8], "result": [0, 1, 3, 6, 7, 8, 9, 10], "big": [0, 6, 7], "benefit": [0, 6, 7], "final": [0, 1, 6, 7, 10], "all": [0, 1, 3, 6, 7, 8, 9, 10, 12, 13], "let": [0, 6, 7, 8], "s": [0, 6, 7, 8], "look": [0, 1, 6, 7, 8, 10], "trivial": 0, "exampl": [0, 3, 8, 9, 10], "weight": [0, 1, 3, 6, 7, 9, 10, 12], "set": [0, 3, 4, 8, 9, 10, 11, 12, 13, 14], "50": [0, 1, 3, 6, 7, 9, 10], "molecul": [0, 1, 3, 6, 7, 8, 9, 10, 13], "we": [0, 3, 6, 7, 8, 9, 10, 13, 14], "start": [0, 4, 6, 7, 8, 9], "format": [0, 3, 6, 7, 8, 9, 11], "It": [0, 1, 3, 6, 7, 8, 9, 10], "contain": [0, 3, 6, 7, 9, 11], "four": 0, "main": [0, 3, 6, 7, 8, 9], "section": [0, 6, 7, 8], "locat": [0, 6, 7], "column": [0, 3, 8, 9, 11, 12, 13, 14, 15], "detail": [0, 3, 6, 7, 8, 9, 10, 11], "about": [0, 6, 7, 8, 9], "which": [0, 1, 3, 6, 7, 8, 9, 10, 13], "below": [0, 3, 6, 7, 8, 9], "task": [0, 3, 8, 9, 10, 11, 12], "training_dataset_fil": [0, 6, 7, 8, 9], "drd2": [0, 6, 7], "subset": [0, 1, 6, 7, 8, 10], "csv": [0, 3, 4, 6, 7, 9], "input_column": [0, 3, 6, 7, 8, 9, 12], "canon": [0, 6, 7, 9, 13], "response_column": [0, 3, 6, 7, 8, 9, 12], "molwt": [0, 6, 7], "mode": [0, 6, 7, 9, 10, 12], "regress": [0, 1, 8, 10, 12, 13], "cross_valid": [0, 6, 7, 10, 12, 13], "5": [0, 1, 3, 6, 7, 8, 9, 10, 13], "direct": [0, 1, 6, 7, 10, 12], "maxim": [0, 1, 6, 7, 10], "n_trial": [0, 6, 7, 9, 10, 12], "100": [0, 1, 3, 6, 7, 8, 9, 10, 11], "n_startup_tri": [0, 6, 7, 9, 10], "30": [0, 1, 6, 7, 10], "name": [0, 1, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "ecfp": [0, 4, 6, 7, 9, 10, 12], "radiu": [0, 3, 6, 7, 9, 12], "3": [0, 1, 3, 4, 6, 7, 8, 9, 10], "nbit": [0, 3, 6, 7, 9, 10, 12], "2048": [0, 3, 6, 7, 9], "maccs_kei": [0, 4, 6, 7, 9, 12], "randomforestregressor": [0, 4, 6, 7, 10, 12], "max_depth": [0, 1, 10, 12], "low": [0, 1, 3, 6, 7, 8, 9, 10, 12], "2": [0, 1, 3, 4, 6, 7, 8, 9, 10, 13, 14], "high": [0, 1, 3, 4, 9, 10, 12], "32": [0, 1, 6, 7, 10], "n_estim": [0, 1, 6, 7, 10, 12], "10": [0, 1, 3, 6, 7, 8, 9, 10, 13], "250": [0, 1, 6, 7, 10], "max_featur": [0, 1, 10, 12], "auto": [0, 1, 6, 7, 9, 10], "ridg": [0, 4, 6, 7, 10, 12], "alpha": [0, 1, 6, 7, 8, 9, 10, 12], "0": [0, 1, 3, 6, 7, 8, 9, 10, 11, 13, 14], "lasso": [0, 4, 6, 7, 10, 12], "xgbregressor": [0, 4, 6, 7, 10, 12], "learning_r": [0, 1, 10, 12], "1": [0, 1, 3, 4, 6, 7, 8, 9, 10, 11, 13, 14], "specifi": [0, 1, 6, 7, 8, 9, 10, 12], "In": [0, 1, 3, 6, 7, 8, 9, 10], "rel": [0, 6, 7], "path": [0, 1, 3, 6, 7, 8, 9, 10, 11], "folder": [0, 6, 7, 8], "ar": [0, 1, 3, 6, 7, 8, 9, 10, 12, 13, 14], "want": [0, 6, 7, 8], "fold": [0, 1, 6, 7, 8, 10, 13, 14], "valu": [0, 1, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "object": [0, 1, 5, 8, 10, 11, 12, 13], "function": [0, 1, 3, 4, 8, 9, 10, 11, 12, 13, 15], "standard": [0, 1, 8, 10, 13, 15], "scikit": [0, 6, 7, 9, 13, 14], "have": [0, 3, 6, 7, 8, 9, 10, 13], "total": [0, 6, 7, 8], "trial": [0, 1, 10, 11, 12], "first": [0, 1, 3, 6, 7, 8, 9, 10, 13], "startup": [0, 6, 7], "should": [0, 1, 3, 6, 7, 8, 9, 10, 11, 13], "random": [0, 1, 4, 10, 13], "explor": [0, 6, 7], "get": [0, 6, 7, 8, 9], "stuck": 0, "earli": [0, 1, 6, 7, 9, 10], "one": [0, 3, 8, 9, 10, 13, 14], "local": [0, 6, 7], "minimum": [0, 1, 3, 9, 10, 13, 14], "two": [0, 1, 6, 7, 8, 10, 13, 14], "free": [0, 3, 9], "pair": [0, 6, 7, 9], "ani": [0, 3, 6, 7, 8, 9, 10, 13], "when": [0, 1, 6, 7, 8, 9, 10, 11, 13, 14], "our": [0, 6, 7, 8], "time": [0, 1, 3, 8, 9, 10, 11], "creat": [0, 8, 9, 11], "conda": [0, 7], "environ": [0, 3, 6, 7, 9], "instal": [0, 6, 7], "modul": [0, 5, 6, 7], "purg": 0, "load": [0, 1, 6, 7, 8, 9, 10], "miniconda3": [0, 7], "my_env_with_qsartuna": [0, 7], "pip": [0, 6, 7], "activ": [0, 1, 6, 7, 8, 9, 10, 12, 13, 15], "just": [0, 6, 7], "case": [0, 1, 6, 7, 8, 9, 10], "check": [0, 6, 7, 9, 12, 13], "output": [0, 1, 6, 7, 8, 9, 10, 13, 15], "m": [0, 6, 7, 9, 11], "http": [0, 3, 6, 7, 8, 9, 10, 13], "com": [0, 6, 7, 8, 9, 13], "molecularai": [0, 7], "releas": [0, 4, 6, 7], "download": [0, 7], "tar": [0, 6, 7], "gz": [0, 6, 7], "Then": [0, 6, 7], "you": [0, 1, 6, 7, 8, 10], "can": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "insid": [0, 9], "your": [0, 6, 7, 8], "three_step_opt_build_merg": [0, 5, 6, 7], "import": [0, 6, 7], "buildconfig_best": [0, 6, 7, 9], "build_best": [0, 6, 7, 9], "build_merg": [0, 6, 7, 9], "config": [0, 1, 5, 6, 7, 9], "modelmod": [0, 6, 7, 9, 10], "optimizationdirect": [0, 6, 7, 10], "optconfig": [0, 1, 5, 6, 7, 9, 11, 12], "optimizationconfig": [0, 6, 7, 9, 10], "svr": [0, 4, 6, 7, 10, 12], "randomforest": 0, "pl": [0, 1, 10], "dataread": [0, 5, 6, 7], "ecfp_count": [0, 4, 6, 7, 9, 12], "prepar": [0, 4, 8, 9], "new": [0, 1, 3, 6, 7, 8, 9, 10, 11], "studi": [0, 3, 6, 7, 9, 10, 11, 12], "study_nam": [0, 6, 7, 9], "my_studi": [0, 6, 7], "make": [0, 1, 6, 7, 8, 9, 10, 13, 14, 15], "buildconfig": [0, 5, 6, 7, 9, 11], "write": [0, 6, 7, 9], "out": [0, 1, 6, 7, 8, 10], "print": [0, 6, 7, 8], "dump": [0, 6, 7], "indent": [0, 6, 7], "save": [0, 6, 7], "target": [0, 1, 6, 7, 8, 10, 13, 15], "pkl": [0, 1, 6, 7, 10], "deploi": 0, "directli": [0, 6, 7, 8], "To": [0, 6, 7, 8], "follow": [0, 3, 6, 7, 8, 9, 10, 11], "syntax": 0, "schemagen": [0, 5], "regression_drd2_50": 0, "outpath": 0, "accept": [0, 6, 7, 8], "argument": [0, 6, 7, 9], "shell": 0, "h": [0, 3, 6, 7, 8, 9], "usag": [0, 6, 7], "best_buildconfig_outpath": 0, "best_model_outpath": 0, "merged_model_outpath": 0, "cach": [0, 3, 6, 7, 9, 10], "optbuild": [0, 5], "hyper": [0, 6, 7, 10], "help": [0, 6, 7], "show": [0, 6, 7, 8], "messag": [0, 1, 6, 7, 10, 11], "exit": [0, 6, 7], "where": [0, 1, 6, 7, 8, 10], "persist": 0, "turn": [0, 10, 13, 14], "off": [0, 1, 6, 7, 8, 10, 13, 14], "gener": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "requir": [0, 3, 6, 7, 8, 9], "input": [0, 1, 3, 4, 6, 7, 9, 10, 11, 13, 14, 15], "either": [0, 3, 8, 9, 10], "sinc": [0, 3, 6, 7, 8, 9, 13], "long": [0, 8], "avoid": [0, 6, 7, 8, 13], "login": 0, "node": 0, "queue": [0, 6, 7], "instead": [0, 1, 3, 6, 7, 8, 9, 10, 13], "script": [0, 6, 7, 9], "give": [0, 6, 7], "sbatch": [0, 6, 7], "bin": [0, 6, 7, 8, 11, 13, 14], "sh": [0, 6, 7, 11], "ntask": 0, "cpu": [0, 6, 7, 9], "per": [0, 1, 8, 9, 10], "mem": [0, 6, 7, 9], "4g": 0, "partit": [0, 6, 7], "core": [0, 6, 7, 8, 10], "illustr": [0, 6, 7, 8], "how": [0, 1, 3, 6, 7, 8, 9, 10], "chose": 0, "chang": [0, 6, 7], "directori": [0, 6, 7, 9, 11], "cd": 0, "project_fold": 0, "project": [0, 1, 10], "dir": [0, 9], "complet": [0, 3, 6, 7, 9], "pickl": [0, 6, 7], "home": 0, "under": [0, 6, 7], "built": [0, 3, 8, 9, 10], "infer": [0, 3, 6, 7, 8, 9], "smile": [0, 3, 6, 7, 8, 9, 11, 12, 13, 14], "note": [0, 1, 3, 4, 8, 9, 10, 12, 13, 14], "varieti": [0, 6, 7], "model_fil": 0, "input_smiles_csv_fil": 0, "input_smiles_csv_column": [0, 6, 7], "aux": [0, 6, 7, 9, 11], "input_aux_column": 0, "precomput": [0, 3, 8, 9], "input_precomputed_fil": 0, "input_precomputed_input_column": 0, "respons": [0, 3, 8, 9], "input_precomputed_response_column": 0, "output_prediction_csv_column": 0, "output_prediction_csv_fil": 0, "uncertainty_quantil": 0, "optunaaz": 0, "auxiliari": [0, 3, 6, 7, 9, 13, 15], "filenam": [0, 6, 7, 9, 11], "identifi": [0, 3, 6, 7, 8, 9], "must": [0, 1, 6, 7, 10], "provid": [0, 1, 3, 6, 7, 8, 9, 10, 13], "shap": [0, 9], "chemprop": [0, 1, 3, 4, 9, 10], "appli": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14, 15], "threshold": [0, 1, 3, 4, 6, 7, 9, 10, 13, 14, 15], "tri": 0, "dure": [0, 1, 3, 6, 7, 8, 9, 10], "mlflow": [0, 5, 9, 12], "track": [0, 3, 5, 6, 7, 9, 10], "ui": 0, "open": [0, 1, 6, 7, 9, 10], "link": 0, "browser": 0, "If": [0, 1, 3, 6, 7, 9, 10, 13, 14], "scp": [0, 6], "forward": [0, 1, 10], "port": 0, "separ": [0, 3, 8, 9], "ssh": 0, "session": 0, "non": [0, 1, 3, 6, 7, 8, 9, 10], "n": [0, 1, 6, 7, 8, 10, 11], "l": 0, "localhost": 0, "5000": 0, "user": [0, 1, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15], "intranet": 0, "net": [0, 6], "execut": 0, "select": [0, 1, 3, 6, 7, 8, 9, 10], "experi": [0, 8, 11], "after": [0, 1, 3, 6, 7, 8, 9, 10, 11], "choos": [0, 4], "compar": [0, 6, 7], "comparison": [0, 6, 7, 8], "call": [0, 1, 3, 6, 7, 9, 10, 13], "well": [0, 6, 7, 8], "metric": [0, 1, 6, 7, 9, 10, 12], "At": 0, "bottom": 0, "plot": [0, 6, 7, 8, 10, 12], "For": [0, 1, 3, 6, 7, 8, 9, 10, 13], "x": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "axi": [0, 6, 7, 8], "_": [0, 6, 7], "number": [0, 1, 3, 6, 7, 8, 9, 10, 11], "y": [0, 1, 8, 9, 10, 11, 13, 14], "cvmean": 0, "r2": [0, 6, 7, 8, 10], "more": [0, 1, 3, 8, 9, 10, 11], "click": 0, "individu": [0, 1, 6, 7, 8, 10], "There": [0, 1, 6, 7, 8, 10], "access": [0, 3, 9], "an": [0, 1, 3, 4, 8, 9, 10, 11, 13, 14], "daemon": [0, 4], "design": [0, 6, 7], "autom": [0, 4, 8], "dispatch": [0, 6, 7, 9], "job": [0, 6, 7, 8, 9, 11], "schedul": [0, 4, 6], "particularli": [0, 6, 7], "scientist": 0, "research": 0, "who": 0, "work": [0, 6, 7, 8], "larg": [0, 1, 8, 10], "need": [0, 4, 9], "distribut": [0, 1, 6, 7, 8, 10], "comput": [0, 1, 3, 4, 8, 9, 10, 13], "resourc": [0, 6, 7, 9], "code": [0, 3, 6, 7, 8, 9, 11], "streamlin": [0, 6, 7], "manag": 0, "submiss": 0, "while": [0, 3, 6, 7, 8, 9, 13], "ensur": [0, 6, 7, 8, 9, 10], "effici": [0, 6, 7], "scalabl": [0, 6, 7], "output_path": [0, 6, 7, 9], "email": [0, 6, 7, 9], "user_nam": [0, 6, 7, 9], "input_data": [0, 6, 7, 9], "input_activity_csv_column": [0, 6, 7], "input_task_csv_column": [0, 6, 7], "initi": [0, 6, 7, 8, 9, 10], "templat": [0, 6, 7], "input_initial_templ": [0, 6, 7], "retrain": [0, 4, 5, 9], "input_retrain_templ": [0, 6, 7], "input_slurm_templ": [0, 6, 7], "quorum": [0, 6, 7, 9], "n_core": [0, 6, 7, 9], "dry": [0, 6, 7], "v": [0, 6, 7], "req": [0, 6, 7], "slurm_req_cor": [0, 6, 7, 9], "slurm_req_mem": [0, 6, 7, 9], "slurm_req_partit": [0, 6, 7, 9], "al": [0, 3, 6, 7, 8, 9], "pool": [0, 6, 7], "slurm_al_pool": [0, 6, 7, 9], "slurm_al_smiles_csv_column": [0, 6, 7], "prefix": [0, 6, 7, 11], "slurm_job_prefix": [0, 6, 7, 9], "failur": [0, 6, 7, 9], "increment": [0, 6, 7], "slurm_failure_cores_incr": [0, 6, 7], "slurm_failure_mem_incr": [0, 6, 7], "min": [0, 1, 6, 7, 8, 10, 13], "slurm_failure_mins_incr": [0, 6, 7], "max": [0, 6, 7, 8, 13], "retri": [0, 6, 7], "slurm_failure_max_retri": [0, 6, 7], "slurm_failure_max_mem": [0, 6, 7], "slurm_failure_max_cpu": [0, 6, 7], "previou": [0, 6, 7, 11], "tempor": [0, 4, 6, 7, 9, 11, 13], "verbos": [0, 6, 7], "notif": [0, 6, 7], "prid": [0, 6], "multipl": [0, 3, 6, 7, 9, 13, 14], "wildcard": [0, 6, 7], "express": [0, 6, 7], "would": [0, 3, 6, 7, 8, 9, 11], "one_taskid": [0, 6, 7], "c": [0, 1, 3, 6, 7, 8, 9, 10, 12], "vvv": [0, 6, 7], "test_auto1": 0, "220": [0, 6, 7], "testaml": [0, 6, 7], "testpartit": [0, 7], "inform": [0, 1, 3, 9, 10, 11], "regard": 0, "add": [0, 6, 7, 8, 9, 11], "optunaz": [0, 1, 3, 6, 7, 8, 14, 15], "py": [0, 1, 6, 7, 8, 10], "like": [0, 1, 3, 6, 7, 8, 9, 10], "so": [0, 6, 7, 8, 10], "dataclass": [0, 11], "class": [0, 1, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "yournewdescriptor": 0, "rdkitdescriptor": [0, 9], "descript": [0, 9, 10], "goe": 0, "apischema": [0, 6, 7, 9], "type_nam": 0, "yournewdescriptorparam": 0, "pass": [0, 1, 3, 6, 7, 9, 10, 13], "exampleofaparamet": 0, "annot": [0, 6, 7, 9], "int": [0, 1, 3, 9, 10, 13, 14], "schema": [0, 5, 9, 12], "titl": [0, 1, 3, 6, 7, 8, 9, 10, 11, 13, 14, 15], "field": 0, "default": [0, 1, 8, 9, 10, 13, 14], "liter": [0, 9, 10, 13, 14], "def": [0, 6, 7, 8, 10], "calculate_from_smi": [0, 3, 6, 7, 9], "self": [0, 6, 7, 10], "smi": [0, 3, 9, 11], "str": [0, 1, 3, 6, 7, 9, 10, 11, 12, 13, 14, 15], "insert": [0, 8], "calcul": [0, 3, 6, 7, 9, 13, 14, 15], "fp": [0, 3, 6, 7, 9], "code_to_calculate_fp": 0, "return": [0, 3, 6, 7, 8, 9, 11, 12, 13, 14], "list": [0, 1, 3, 4, 6, 7, 8, 9, 10, 13, 15], "within": [0, 1, 3, 9, 10, 13, 14], "same": [0, 1, 6, 7, 8, 10, 11], "anyunscaleddescriptor": 0, "union": [0, 1, 3, 9, 10], "avalon": [0, 4, 9, 10, 12], "pathfp": [0, 4, 6, 7, 9, 12], "amorprotdescriptor": [0, 3, 9, 12], "precomputeddescriptorfromfil": [0, 4, 6, 7, 9, 12], "unscaledmapc": [0, 3, 9, 12], "unscaledphyschemdescriptor": [0, 4, 6, 7, 9, 12], "unscaledjazzydescriptor": [0, 4, 6, 7, 9, 12], "unscaledzscalesdescriptor": [0, 4, 9, 12], "compositecompatibledescriptor": 0, "scaleddescriptor": [0, 4, 9, 12], "mapc": [0, 3, 9, 12], "physchemdescriptor": [0, 4, 9, 12], "jazzydescriptor": [0, 4, 9, 12], "zscalesdescriptor": [0, 3, 9, 12], "now": [0, 6, 7, 8, 10], "consid": [0, 3, 6, 7, 9, 13, 14], "later": [0, 6, 7], "among": [0, 6, 7], "exist": [0, 3, 6, 9, 11], "youraglrotihm": 0, "youralgorithmparam": 0, "youralgorithmparameterint": 0, "metadata": [0, 6, 7, 9, 10, 11, 12], "youralgorithmparameterfloat": 0, "float": [0, 1, 6, 7, 8, 10, 11, 13, 14, 15], "0001": [0, 1, 10], "001": [0, 7], "parameter_int": 0, "parameter_float": 0, "fixed_int": 0, "priori": 0, "fix": [0, 9, 10], "runtim": [0, 3, 9], "optimis": [0, 3, 6, 7, 8, 9, 10, 11], "youralgorithm": 0, "b": [0, 6, 7, 8], "sens": [0, 3, 9], "refer": [0, 3, 6, 7, 9, 11, 12], "anyregressionalgorithm": 0, "regressor": [0, 1, 6, 7, 9, 10, 12], "plsregress": [0, 4, 6, 7, 10, 12], "kneighborsregressor": [0, 4, 6, 7, 10, 12], "prfclassifi": [0, 4, 6, 7, 10, 12], "chempropregressor": [0, 4, 6, 7, 10, 12], "chempropregressorpretrain": [0, 4, 6, 7, 10], "chemprophyperoptregressor": [0, 4, 6, 7, 10, 12], "anyclassificationalgorithm": 0, "adaboostclassifi": [0, 4, 6, 7, 10, 12], "kneighborsclassifi": [0, 4, 6, 7, 10, 12], "logisticregress": [0, 4, 6, 7, 10, 12], "randomforestclassifi": [0, 4, 6, 7, 10, 12], "svc": [0, 4, 6, 7, 10, 12], "chempropclassifi": [0, 4, 6, 7, 10, 12], "chemprophyperoptclassifi": [0, 4, 6, 7, 10, 12], "depend": [0, 1, 6, 7, 8, 10], "classifi": [0, 1, 6, 7, 9, 10, 12], "youralgorithmparamet": 0, "consist": [0, 6, 7], "youralgorihtm": 0, "examplealgorithm": 0, "expect": [0, 6, 7, 8, 11], "4": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "build_from_opt": [0, 5, 9], "elif": 0, "statement": 0, "isinst": 0, "alg": [0, 9, 10], "opt": 0, "suggest_int": 0, "_encode_nam": 0, "encod": [0, 1, 9, 10], "string": [0, 3, 6, 7, 8, 9, 12, 13, 14, 15], "para": 0, "suggest_float": 0, "suggest": [0, 6, 7], "report": [0, 4, 6, 7, 8], "even": [0, 6, 7, 8], "instanti": 0, "8": [0, 6, 7, 8, 10], "sourc": [1, 3, 9, 10, 11, 12, 13, 14, 15], "adaboost": [1, 10], "meta": [1, 6, 7, 9, 10], "begin": [1, 6, 7, 8, 10, 13, 14], "fit": [1, 3, 6, 7, 8, 9, 10, 13], "origin": [1, 3, 6, 7, 8, 9, 10, 13], "addit": [1, 6, 7, 10], "copi": [1, 6, 7, 8, 10, 11], "incorrectli": [1, 10], "instanc": [1, 6, 7, 8, 9, 10], "adjust": [1, 10], "subsequ": [1, 6, 7, 10], "focu": [1, 10], "difficult": [1, 6, 7, 10], "adaboostclassifierparametersnestim": [1, 10], "adaboostclassifierparameterslearningr": [1, 10], "The": [1, 3, 8, 9, 10, 11, 13, 15], "maximum": [1, 3, 6, 7, 8, 9, 10, 13, 14], "boost": [1, 3, 9, 10], "termin": [1, 10], "perfect": [1, 10], "learn": [1, 3, 4, 8, 9, 10, 13, 14], "procedur": [1, 3, 6, 7, 8, 9, 10], "stop": [1, 6, 7, 10], "each": [1, 3, 6, 7, 8, 9, 10, 13], "classifierat": [1, 10], "iter": [1, 6, 7, 10, 13, 14], "A": [1, 3, 8, 9, 10], "higher": [1, 6, 7, 10], "rateincreas": [1, 10], "contribut": [1, 3, 6, 7, 9, 10], "trade": [1, 10], "between": [1, 6, 7, 8, 10, 11], "learning_rateand": [1, 10], "linear": [1, 8, 10], "model": [1, 3, 4, 8, 9, 10, 11, 13, 14, 15], "l1": [1, 10], "prior": [1, 8, 10], "regular": [1, 6, 7, 10], "spars": [1, 10], "coeffici": [1, 10], "tend": [1, 10], "prefer": [1, 10], "solut": [1, 6, 7, 10], "fewer": [1, 10], "zero": [1, 3, 9, 10], "effect": [1, 6, 7, 8, 10, 13], "reduc": [1, 6, 7, 10], "featur": [1, 3, 6, 7, 9, 10], "upon": [1, 6, 7, 10], "lassoparametersalpha": [1, 10], "constant": [1, 10], "multipli": [1, 10], "term": [1, 6, 7, 10], "control": [1, 6, 7, 8, 10, 13], "strength": [1, 3, 9, 10], "neg": [1, 6, 7, 8, 10], "i": [1, 3, 6, 7, 8, 9, 10, 11], "e": [1, 3, 8, 9, 10, 11, 13, 15], "inf": [1, 6, 7, 9, 10], "equival": [1, 10], "ordinari": [1, 10], "least": [1, 6, 7, 10], "squar": [1, 6, 7, 10], "solv": [1, 6, 7, 10], "linearregress": [1, 10], "numer": [1, 7, 8, 10], "reason": [1, 6, 7, 8, 9, 10], "us": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "advis": [1, 6, 7, 8, 10], "implement": [1, 3, 6, 7, 9, 10, 13], "k": [1, 6, 7, 8, 10, 13, 14], "nearest": [1, 6, 7, 10], "neighbor": [1, 6, 7, 10, 13, 14], "vote": [1, 10], "principl": [1, 10], "behind": [1, 6, 7, 10], "method": [1, 3, 8, 9, 10, 12, 13], "find": [1, 6, 7, 9, 10], "predefin": [1, 4, 10, 13, 15], "sampl": [1, 6, 7, 10, 13, 14], "closest": [1, 10], "distanc": [1, 6, 7, 9, 10], "point": [1, 8, 10, 13, 14], "label": [1, 6, 7, 8, 9, 10, 13, 14], "from": [1, 3, 4, 9, 10, 11, 13, 14, 15], "defin": [1, 3, 6, 7, 8, 9, 10, 11, 13], "despit": [1, 6, 7, 10], "simplic": [1, 10], "success": [1, 6, 7, 10], "classif": [1, 4, 8, 9, 10, 12, 13], "problem": [1, 6, 7, 8, 9, 10], "n_neighbor": [1, 10, 12], "kneighborsclassifierparametersn_neighbor": [1, 10], "kneighbor": [1, 10], "queri": [1, 6, 7, 8, 9, 10], "minkowski": [1, 6, 7, 10], "euclidean": [1, 10], "kneighborsregressorparametersn_neighbor": [1, 10], "logist": [1, 10], "rather": [1, 3, 6, 7, 8, 9, 10], "than": [1, 3, 6, 7, 8, 9, 10], "also": [1, 3, 6, 7, 8, 9, 10, 13], "known": [1, 3, 6, 7, 8, 9, 10], "literatur": [1, 10], "logit": [1, 10], "entropi": [1, 8, 10], "maxent": [1, 10], "log": [1, 4, 10, 11, 12, 13, 15], "probabl": [1, 4, 8, 10], "describ": [1, 3, 6, 7, 9, 10, 13], "possibl": [1, 6, 7, 8, 9, 10, 11, 13, 14], "outcom": [1, 10], "singl": [1, 6, 7, 10], "solver": [1, 10, 12], "logisticregressionparametersparameterc": [1, 10], "try": [1, 6, 7, 8, 10], "sag": [1, 10], "saga": [1, 10], "fast": [1, 6, 7, 10], "converg": [1, 6, 7, 10], "guarante": [1, 10], "approxim": [1, 6, 7, 10], "scale": [1, 3, 8, 9, 10, 13, 15], "preprocess": [1, 4, 9, 10, 11, 14, 15], "scaler": [1, 3, 9, 10], "invers": [1, 10], "posit": [1, 3, 6, 7, 9, 10], "support": [1, 6, 7, 9, 10], "vector": [1, 3, 6, 7, 9, 10, 13, 15], "machin": [1, 3, 4, 6, 7, 8, 9, 10], "smaller": [1, 6, 7, 10], "stronger": [1, 10], "decomposit": [1, 10], "partial": [1, 6, 7, 10], "form": [1, 3, 6, 7, 8, 9, 10, 13], "compon": [1, 3, 6, 7, 9, 10], "fundament": [1, 10], "relat": [1, 3, 6, 7, 8, 9, 10], "matric": [1, 10], "thei": [1, 3, 6, 7, 8, 9, 10], "latent": [1, 10], "variabl": [1, 6, 7, 8, 9, 10], "approach": [1, 3, 6, 7, 8, 9, 10], "covari": [1, 4, 9, 10], "space": [1, 8, 10, 13, 14], "multidimension": [1, 10], "varianc": [1, 6, 7, 8, 10], "other": [1, 6, 7, 8, 10, 13], "word": [1, 6, 7, 10], "both": [1, 6, 7, 8, 10], "lower": [1, 6, 7, 10], "dimension": [1, 10], "subspac": [1, 6, 7, 9, 10], "transform": [1, 4, 9, 10, 11], "n_compon": [1, 10, 12], "ncompon": [1, 10], "keep": [1, 6, 7, 8, 10, 13], "n_sampl": [1, 10], "n_featur": [1, 10], "n_target": [1, 10], "forest": [1, 4, 8, 10], "decis": [1, 6, 7, 8, 10, 13, 15], "tree": [1, 6, 7, 10], "variou": [1, 6, 7, 9, 10], "sub": [1, 6, 7, 10], "averag": [1, 3, 6, 7, 8, 9, 10, 13], "improv": [1, 3, 6, 7, 9, 10], "accuraci": [1, 6, 7, 10], "over": [1, 6, 7, 10], "randomforestclassifierparametersmaxdepth": [1, 10], "randomforestclassifierparametersnestim": [1, 6, 7, 10], "depth": [1, 6, 7, 10, 12], "considerwhen": [1, 10], "split": [1, 4, 9, 10, 13, 14, 15], "thenconsid": [1, 10], "sqrt": [1, 6, 7, 8, 10], "log2": [1, 8, 10, 13, 15], "randomforestregressorparametersmaxdepth": [1, 10], "randomforestregressorparametersnestim": [1, 10], "l2": [1, 10], "loss": [1, 3, 6, 7, 9, 10], "norm": [1, 8, 10], "tikhonov": [1, 10], "base": [1, 3, 4, 6, 7, 9, 10, 11, 12, 13, 14, 15], "libsvm": [1, 10], "quadrat": [1, 10], "mai": [1, 3, 6, 7, 8, 9, 10], "impract": [1, 10], "beyond": [1, 10], "ten": [1, 10], "thousand": [1, 10], "svcparametersparameterc": [1, 10], "1e": [1, 10], "gamma": [1, 10, 12], "proport": [1, 6, 7, 10], "strictli": [1, 10], "penalti": [1, 10], "kernel": [1, 10], "epsilon": [1, 10], "complex": [1, 6, 7, 10], "hard": [1, 3, 9, 10], "coupl": [1, 10], "10000": [1, 10], "svrparametersparameterc": [1, 10], "svrparametersgamma": [1, 10], "maxdepth": [1, 10], "nestim": [1, 10], "learningr": [1, 10], "xgboost": [1, 10, 12], "gradient": [1, 10], "stand": [1, 10], "extrem": [1, 6, 7, 10], "paper": [1, 3, 6, 7, 9, 10], "greedi": [1, 10], "friedman": [1, 10], "learner": [1, 10], "round": [1, 6, 7, 8, 10], "prf": [1, 4, 8, 10], "probabilist": [1, 4, 10], "seen": [1, 6, 7, 8, 10], "hybrid": [1, 6, 7, 10], "similar": [1, 3, 6, 7, 8, 9, 10, 13, 14], "take": [1, 3, 6, 7, 8, 9, 10, 13], "real": [1, 6, 7, 8, 10, 13, 14], "represent": [1, 3, 4, 9, 10], "ptr": [1, 4, 6, 7, 10, 13], "howev": [1, 3, 6, 7, 8, 9, 10], "belong": [1, 3, 6, 7, 8, 9, 10], "inact": [1, 6, 7, 8, 10, 13, 15], "use_py_gini": [1, 10, 12], "use_py_leaf": [1, 10, 12], "prfclassifierparametersmaxdepth": [1, 10], "prfclassifierparametersnestim": [1, 10], "min_py_sum_leaf": [1, 10, 12], "prfclassifierparametersminpysumleaf": [1, 10], "gini": [1, 10], "true": [1, 3, 6, 7, 8, 9, 10, 13, 14], "leav": [1, 10], "leaf": [1, 10], "allow": [1, 3, 6, 7, 8, 9, 10], "prune": [1, 6, 7, 10], "propag": [1, 10], "small": [1, 8, 9, 10], "thu": [1, 6, 7, 10], "pth": [1, 10], "scheme": [1, 10], "noisi": [1, 10], "deep": [1, 6, 7, 10], "properti": [1, 3, 6, 7, 8, 9, 10, 11], "network": [1, 3, 6, 7, 9, 10], "neural": [1, 6, 7, 9, 10], "d": [1, 3, 6, 7, 9, 10, 11], "mpnn": [1, 10], "graph": [1, 3, 6, 7, 9, 10], "feed": [1, 10], "ffnn": [1, 10], "multi": [1, 3, 9, 10], "layer": [1, 3, 6, 7, 9, 10], "perceptron": [1, 10], "wa": [1, 3, 6, 7, 9, 10, 11], "present": [1, 6, 7, 8, 10, 11], "analyz": [1, 6, 7, 10], "optuna": [1, 4, 6, 7, 9, 10, 11, 12], "optims": [1, 10], "hyperopt": [1, 10], "ensemble_s": [1, 6, 7, 10, 12], "epoch": [1, 6, 7, 10, 12], "aggreg": [1, 6, 7, 8, 10, 12, 13, 14], "aggregation_norm": [1, 6, 7, 10, 12], "chempropparametersaggregation_norm": [1, 10], "200": [1, 6, 7, 9, 10], "q": [1, 3, 6, 7, 9, 10, 12], "batch_siz": [1, 6, 7, 10, 12], "chempropparametersbatch_s": [1, 10], "chempropparametersdepth": [1, 10], "6": [1, 6, 7, 8, 10], "dropout": [1, 10, 12], "chempropparametersdropout": [1, 10], "04": [1, 6, 7, 10], "features_gener": [1, 6, 7, 10, 12], "ffn_hidden_s": [1, 6, 7, 10, 12], "chempropparametersffn_hidden_s": [1, 10], "300": [1, 6, 7, 10], "2400": [1, 10], "ffn_num_lay": [1, 6, 7, 10, 12], "chempropparametersffn_num_lay": [1, 10], "final_lr_ratio_exp": [1, 6, 7, 10, 12], "chempropparametersfinal_lr_ratio_exp": [1, 10], "hidden_s": [1, 6, 7, 10, 12], "chempropparametershidden_s": [1, 10], "init_lr_ratio_exp": [1, 6, 7, 10, 12], "chempropparametersinit_lr_ratio_exp": [1, 10], "max_lr_exp": [1, 6, 7, 10, 12], "chempropparametersmax_lr_exp": [1, 10], "warmup_epochs_ratio": [1, 6, 7, 10, 12], "chempropparameterswarmup_epochs_ratio": [1, 10], "ensembl": [1, 10, 12], "initialis": [1, 6, 7, 9, 10], "size": [1, 3, 6, 7, 8, 9, 10], "run": [1, 3, 4, 8, 9, 10, 11], "increas": [1, 6, 7, 8, 9, 10, 13, 14], "400": [1, 6, 7, 10], "sum": [1, 6, 7, 10], "atom": [1, 3, 6, 7, 9, 10, 13, 14], "divid": [1, 6, 7, 10], "up": [1, 3, 4, 6, 9, 10, 11], "batch": [1, 10, 13], "step": [1, 8, 9, 10], "visibl": [1, 10], "randomli": [1, 6, 7, 8, 10], "some": [1, 3, 6, 7, 8, 9, 10], "element": [1, 10, 13, 14], "tensor": [1, 10], "p": [1, 3, 9, 10], "bernoulli": [1, 10], "channel": [1, 10], "independ": [1, 8, 10], "everi": [1, 6, 7, 10], "proven": [1, 10], "techniqu": [1, 8, 10], "prevent": [1, 6, 7, 10], "co": [1, 8, 10], "adapt": [1, 3, 9, 10], "neuron": [1, 10], "hidden": [1, 6, 7, 10], "ffn": [1, 6, 7, 10], "exponenti": [1, 8, 10], "rate": [1, 10], "bond": [1, 3, 9, 10], "ratio": [1, 10], "linearli": [1, 10], "init_lr": [1, 10], "max_lr": [1, 10], "afterward": [1, 8, 10], "decreas": [1, 8, 10], "final_lr": [1, 10], "without": [1, 6, 7, 9, 10, 13], "hyperparamet": [1, 4, 6, 7, 9, 10], "side": [1, 3, 9, 10], "nb": [1, 3, 6, 7, 8, 9, 10], "quick": [1, 4, 10], "simpl": [1, 8, 10], "sensibl": [1, 6, 7, 8, 9, 10], "author": [1, 6, 7, 9, 10], "do": [1, 6, 7, 8, 9, 10, 13], "num_it": [1, 6, 7, 10, 12], "search_parameter_level": [1, 6, 7, 10, 12], "dictat": [1, 6, 7, 10], "larger": [1, 3, 6, 7, 8, 9, 10], "pretrin": [1, 10], "pretrain": [1, 6, 7, 9, 10], "carri": [1, 10], "suppli": [1, 3, 6, 7, 8, 9, 10], "previous": [1, 10], "qsartuna": [1, 9, 10], "chempropparametersepoch": [1, 6, 7, 10], "frzn": [1, 10, 12], "pretrained_model": [1, 6, 7, 9, 10, 12], "none": [1, 3, 6, 7, 9, 10, 11, 13, 14, 15], "fine": [1, 10], "tune": [1, 3, 4, 6, 7, 9, 10], "decid": [1, 10], "freez": [1, 10], "transfer": [1, 10], "frozen": [1, 10], "calibr": [1, 4, 9, 10], "isoton": [1, 6, 7, 10], "vennab": [1, 10], "cv": [1, 6, 7, 10], "With": [1, 3, 9, 10], "across": [1, 6, 7, 8, 10, 13], "fals": [1, 3, 6, 7, 8, 9, 10, 13], "obtain": [1, 6, 7, 8, 10], "unbias": [1, 10], "offer": [1, 3, 6, 7, 9, 10], "p0": [1, 6, 7, 10], "vs": [1, 6, 7, 8, 9, 10], "p1": [1, 6, 7, 10], "discord": [1, 6, 7, 10], "type": [1, 3, 6, 7, 8, 9, 10, 13], "calibratedclassifiercvensembl": [1, 10], "calibratedclassifiercvmethod": [1, 10], "n_fold": [1, 6, 7, 10, 12], "whether": [1, 3, 8, 9, 10, 13, 15], "agnost": [1, 6, 7, 10], "interv": [1, 6, 7, 10], "encompass": [1, 10], "aleator": [1, 10], "epistem": [1, 10], "back": [1, 6, 7, 10], "strong": [1, 10], "theoret": [1, 6, 7, 10], "thank": [1, 10], "conform": [1, 10], "mapie_alpha": [1, 6, 7, 10, 12], "05": [1, 6, 7, 8, 10], "01": [1, 6, 7, 10], "99": [1, 6, 7, 10], "see": [3, 6, 7, 8, 9, 10, 13, 14], "gedeck": [3, 9], "et": [3, 8, 9], "qsar": [3, 4, 6, 7, 8, 9], "good": [3, 6, 7, 8, 9], "practic": [3, 9], "fingerprint": [3, 9, 10], "wai": [3, 6, 7, 8, 9], "daylight": [3, 9], "enumer": [3, 6, 7, 9, 10], "custom": [3, 6, 7, 9], "ref": [3, 9, 11], "16": [3, 6, 7, 8, 9], "hash": [3, 6, 7, 9, 10, 11], "style": [3, 6, 7, 8, 9], "implicitli": [3, 9], "largest": [3, 6, 7, 9], "toward": [3, 6, 7, 8, 9], "binari": [3, 6, 7, 9, 10], "extend": [3, 6, 7, 8, 9], "connect": [3, 6, 7, 9], "roger": [3, 9], "circular": [3, 9], "morgan": [3, 9, 10], "algorithm": [3, 4, 8, 9, 10, 11, 12, 13, 14], "invari": [3, 9], "getmorganfingerprintasbitvect": [3, 9], "rdkit": [3, 6, 7, 8, 9, 10], "systemat": [3, 9], "record": [3, 6, 7, 8, 9], "neighborhood": [3, 9, 10], "substructur": [3, 6, 7, 9], "map": [3, 6, 7, 8, 9], "integ": [3, 8, 9, 13, 14], "length": [3, 6, 7, 9], "diamet": [3, 9], "append": [3, 6, 7, 8, 9, 10], "g": [3, 8, 9, 13, 15], "ecfp4": [3, 9], "correspond": [3, 6, 7, 8, 9, 10], "returnrdkit": [3, 6, 7, 9], "bit": [3, 6, 7, 9], "sometim": [3, 6, 7, 8, 9], "bool": [3, 9, 10, 13, 14], "calculate_from_mol": [3, 9], "mol": [3, 6, 7, 8, 9], "numpi": [3, 6, 7, 8, 9, 13, 14], "arrai": [3, 6, 7, 9, 13, 14], "count": [3, 6, 7, 9, 10], "gethashedmorganfingerprint": [3, 9], "appear": [3, 6, 7, 9, 12], "usefeatur": [3, 6, 7, 9, 12], "fcfp": [3, 9], "normal": [3, 6, 7, 8, 9, 10], "ones": [3, 6, 7, 9], "definit": [3, 9, 13], "gobbi": [3, 9], "popping": [3, 9], "biotechnolog": [3, 9], "bioengin": [3, 9], "61": [3, 6, 7, 9], "47": [3, 6, 7, 9], "54": [3, 6, 7, 9], "1998": [3, 6, 7, 9], "lead": [3, 8, 9], "score": [3, 4, 9, 10, 11, 13, 15], "maxpath": [3, 6, 7, 9, 12], "fpsize": [3, 6, 7, 9, 12], "macc": [3, 6, 7, 9], "system": [3, 6, 7, 8, 9], "often": [3, 6, 7, 9], "mdl": [3, 9], "kei": [3, 6, 7, 8, 9, 11, 12], "compani": [3, 9], "keyset": [3, 9], "construct": [3, 9, 12], "optim": [3, 4, 8, 9, 10, 12], "durant": [3, 9], "reoptim": [3, 9], "drug": [3, 9], "discoveri": [3, 9], "166": [3, 6, 7, 9], "2d": [3, 9, 10], "essenti": [3, 8, 9], "answer": [3, 9], "fragment": [3, 9], "question": [3, 9], "explicitli": [3, 6, 7, 8, 9], "matter": [3, 9], "becaus": [3, 6, 7, 8, 9], "address": [3, 9], "specif": [3, 6, 7, 8, 9, 12], "repres": [3, 6, 7, 8, 9], "9": [3, 6, 7, 8, 9], "1049": [3, 9], "distinct": [3, 6, 7, 8, 9, 10], "rdkit_nam": [3, 6, 7, 9, 12], "unscal": [3, 9], "These": [3, 6, 7, 8, 9, 13], "physchem": [3, 6, 7, 9], "caution": [3, 8, 9], "208": [3, 6, 7, 9], "includ": [3, 6, 7, 8, 9], "clogp": [3, 6, 7, 9], "mw": [3, 6, 7, 9], "ring": [3, 8, 9], "rotat": [3, 9], "fraction": [3, 6, 7, 8, 9, 13, 14], "sp3": [3, 9], "kier": [3, 9], "indic": [3, 6, 7, 8, 9, 13, 14], "etc": [3, 6, 7, 8, 9], "tpsa": [3, 6, 7, 9], "slogp": [3, 9], "group": [3, 8, 9, 13, 14], "vsa": [3, 9], "moe": [3, 9], "charg": [3, 9], "www": [3, 9], "org": [3, 6, 7, 9], "doc": [3, 6, 7, 9], "gettingstartedinpython": [3, 9], "html": [3, 6, 7, 8, 9, 10], "whose": [3, 9], "been": [3, 6, 7, 8, 9], "level": [3, 6, 7, 8, 9, 10], "One": [3, 8, 9], "advantag": [3, 9], "interpret": [3, 9], "mean": [3, 6, 7, 8, 9, 10, 13], "physicochem": [3, 9], "intuit": [3, 9], "understood": [3, 9], "option": [3, 4, 8, 9, 10, 12, 13, 14, 15], "jazzy_nam": [3, 6, 7, 9, 12], "jazzy_filt": [3, 6, 7, 9], "jazzi": [3, 9], "hydrat": [3, 9], "energi": [3, 9], "hydrogen": [3, 9], "acceptor": [3, 6, 7, 9], "donor": [3, 6, 7, 9], "found": [3, 6, 7, 9, 11], "doi": [3, 6, 7, 9], "1038": [3, 9], "s41598": [3, 9], "023": [3, 6, 9], "30089": [3, 9], "mmff94": [3, 9], "minimis": [3, 9], "1000da": [3, 9], "compound": [3, 6, 7, 8, 9, 13, 14], "dict": [3, 9, 10, 11, 12], "ndarrai": [3, 9], "z": [3, 9, 13, 15], "peptid": [3, 6, 7, 9, 13, 15], "unfittedsklearnscal": [3, 9], "mol_data": [3, 9], "moldata": [3, 9], "file_path": [3, 9], "smiles_column": [3, 9], "fittedsklearnscal": [3, 9], "alia": [3, 9, 10], "file": [3, 8, 9, 11, 12, 13, 14], "header": [3, 9, 11], "line": [3, 4, 6, 7, 8, 9, 11], "row": [3, 6, 7, 8, 9], "comma": [3, 6, 7, 8, 9], "pre": [3, 8, 9], "inference_paramet": [3, 6, 7, 9], "were": [3, 6, 7, 8, 9], "propos": [3, 9], "sandberg": [3, 9], "proteogen": [3, 9], "amino": [3, 6, 7, 9], "acid": [3, 6, 7, 9], "nmr": [3, 9], "thin": [3, 9], "chromatographi": [3, 9], "tlc": [3, 9], "1021": [3, 6, 7, 9], "jm9700575": [3, 9], "captur": [3, 6, 7, 8, 9], "lipophil": [3, 9], "steric": [3, 9], "bulk": [3, 9], "polariz": [3, 9], "electron": [3, 9], "polar": [3, 9], "electroneg": [3, 9], "heat": [3, 9], "electrophil": [3, 9], "anoth": [3, 6, 7, 9], "through": [3, 6, 7, 9], "_and_": [3, 9], "continu": [3, 6, 7, 9], "learnt": [3, 6, 7, 9], "manner": [3, 6, 7, 9], "intent": [3, 6, 7, 9], "much": [3, 9], "remain": [3, 9, 13], "deriv": [3, 6, 7, 8, 9], "cautiou": [3, 9], "upload": [3, 9], "_all_": [3, 9], "ruder": [3, 9], "io": [3, 7, 9, 10], "index": [3, 6, 7, 8, 9], "auxiliarytask": [3, 9], "aux_weight_pc": [3, 6, 7, 9, 10, 12], "20": [3, 6, 7, 8, 9], "info": [3, 6, 7, 9], "percentag": [3, 9], "wrap": [3, 6, 7, 9], "certain": [3, 6, 7, 8, 9], "rang": [3, 6, 7, 8, 9, 13, 14], "scaleddescriptorparamet": [3, 9], "composit": [3, 6, 7, 9], "concaten": [3, 9], "button": [3, 9], "pleas": [3, 6, 7, 9, 11], "compat": [3, 6, 7, 9], "intro": 4, "background": 4, "json": [4, 6, 7, 9, 10, 12], "command": [4, 6, 7], "interfac": [4, 6, 7, 9, 12, 13], "python": [4, 6, 7, 9, 13], "jupyt": [4, 6, 7], "notebook": [4, 6, 7], "via": [4, 6, 7, 8, 13], "cli": 4, "inspect": [4, 6, 7], "automl": [4, 5], "automat": [4, 6, 7, 8], "ad": [4, 6, 7, 8, 13, 14], "descriptor": [4, 5, 8, 10, 12], "introduct": 4, "translat": [4, 6, 7], "sdf": [4, 6, 7, 9], "deal": [4, 13], "duplic": [4, 9, 10, 13], "dedupl": [4, 6, 7, 9, 11], "experiment": [4, 6, 7, 13, 15], "error": [4, 6, 7], "tutori": 4, "remov": [4, 8, 9, 10, 13, 14], "advanc": [4, 8, 9], "functoinail": 4, "overview": 4, "hpc": 4, "setup": [4, 10], "extract": 4, "walkthough": 4, "pipelin": [4, 6], "date": [4, 6, 9, 11], "calibratedclassifiercvwithva": [4, 6, 7, 10, 12], "mapi": [4, 10, 12], "zscale": [4, 6, 7, 9, 13], "smilesfromfil": [4, 6, 7, 9, 12], "smilesandsideinfofromfil": [4, 6, 7, 9, 12], "compositedescriptor": [4, 6, 7, 9, 12], "stratifi": [4, 6, 7, 13], "scaffoldsplit": [4, 8, 13], "modeldatatransform": [4, 6, 7, 8, 9, 13], "vectorfromcolumn": [4, 6, 7, 9, 13], "keepfirst": [4, 8, 13], "keeplast": [4, 8, 13], "keeprandom": [4, 8, 13], "keepmin": [4, 8, 13], "keepmax": [4, 8, 13], "keepavg": [4, 8, 13], "keepmedian": [4, 6, 7, 8, 13], "keepkeepallnodedupl": 4, "coverag": 4, "subpackag": 5, "submodul": 5, "content": 5, "util": [5, 6, 7, 8, 9, 14, 15], "files_path": [5, 9], "load_json": [5, 9], "builder": 5, "metirc": 5, "model_writ": 5, "visual": [5, 10, 12], "intend": [6, 7, 9], "necessari": [6, 7], "gui": [6, 7], "reinvent": [6, 7], "most": [6, 7, 8], "them": [6, 7, 8, 9, 10], "influenc": [6, 7, 8, 10], "idea": [6, 7, 8], "read": [6, 7, 8, 9], "otherwis": [6, 7, 13], "might": [6, 7, 8, 13], "skip": [6, 7, 8, 9, 11], "astrazeneca": [6, 7], "qptuna_latest": 6, "toi": [6, 7], "chosen": [6, 7], "whole": [6, 7, 8], "less": [6, 7, 8], "minut": [6, 7, 9], "holdout": [6, 7, 8], "readi": [6, 7, 9], "next": [6, 7, 8], "few": [6, 7, 8], "head": [6, 7, 8], "molwt_gt_330": [6, 7], "cc1cc": [6, 7], "nc": [6, 7, 8], "o": [6, 7, 8], "c2cccc": [6, 7], "coc3ccc": [6, 7], "br": [6, 7, 8], "cc3": [6, 7, 8], "c2": [6, 7, 8], "no1": [6, 7], "387": [6, 7], "233": [6, 7], "nc1ccc": [6, 7], "f": [6, 7, 8, 13], "cc1f": [6, 7], "nc1sccc1": [6, 7], "c1nc2ccccc2s1": [6, 7], "4360000000001": [6, 7], "coc": [6, 7], "c1ccccc1nc": [6, 7], "c1cc": [6, 7], "nn1cc1ccccc1": [6, 7], "380": [6, 7], "36000000000007": [6, 7], "ccoc": [6, 7], "sc1nc": [6, 7], "c2ccccc2": [6, 7], "ccc1c": [6, 7], "312": [6, 7], "39400000000006": [6, 7], "ccc": [6, 7, 8], "cc": [6, 7, 8], "c1nn": [6, 7, 8], "cc2ccccc2": [6, 7], "c2ccccc12": [6, 7], "349": [6, 7], "4340000000001": [6, 7], "brc1ccccc1occcoc1cccc2cccnc12": [6, 7], "358": [6, 7], "235": [6, 7], "ccccn1c": [6, 7], "coc2cccc": [6, 7], "oc": [6, 7], "nc2ccccc21": [6, 7], "310": [6, 7], "39700000000005": [6, 7], "ccoc1cccc": [6, 7], "c2sc3nc": [6, 7], "c4ccc": [6, 7], "cc4": [6, 7], "ccc3c2n": [6, 7], "c1": [6, 7, 8], "407": [6, 7], "4700000000001": [6, 7], "coc1ccc": [6, 7], "nc2ccc": [6, 7], "cc2": [6, 7], "c2ccc": [6, 7], "cc1oc": [6, 7], "454": [6, 7], "54800000000023": [6, 7], "sy": [6, 7, 8], "sklearn": [6, 7, 12], "typic": [6, 7, 8], "test_dataset_fil": [6, 7, 9], "random_se": [6, 7, 10], "42": [6, 7, 8, 13, 14], "seed": [6, 7, 8, 9, 13, 14], "reproduc": [6, 7, 13, 15], "basic": [6, 7, 9, 10], "importlib": [6, 7], "reload": [6, 7], "basicconfig": [6, 7], "getlogg": [6, 7], "disabl": [6, 7, 12], "np": [6, 7, 8], "seterr": [6, 7], "ignor": [6, 7], "warn": [6, 7], "filterwarn": [6, 7], "categori": [6, 7], "futurewarn": [6, 7], "runtimewarn": [6, 7], "tqdm": [6, 7], "functool": [6, 7], "partialmethod": [6, 7], "__init__": [6, 7, 10], "flood": [6, 7], "decpreci": [6, 7], "simplefilt": [6, 7], "arg": [6, 7, 9, 10], "kwarg": [6, 7, 10], "stderr": [6, 7], "render": [6, 7, 8], "red": [6, 7], "2024": [6, 7], "08": [6, 7], "23": [6, 7, 8], "51": [6, 7], "03": [6, 7], "367": [6, 7], "memori": [6, 7, 8, 9, 11], "440": [6, 7], "study_name_0": [6, 7], "760": [6, 7], "finish": [6, 7], "3594": [6, 7], "2228073972638": [6, 7], "39": [6, 7, 8], "algorithm_nam": [6, 7, 12], "randomforestregressor_algorithm_hash": [6, 7], "f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "max_features__f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "lt": [6, 7, 8], "randomforestmaxfeatur": [6, 7, 10], "gt": [6, 7, 8], "34": [6, 7, 8], "915": [6, 7], "5029": [6, 7], "734616310275": [6, 7], "svr_algorithm_hash": [6, 7], "ea7ccc7ef4a9329af0d4e39eb6184933": [6, 7], "gamma__ea7ccc7ef4a9329af0d4e39eb6184933": [6, 7], "039054412752107935": [6, 7], "c__ea7ccc7ef4a9329af0d4e39eb6184933": [6, 7], "1242780840717016e": [6, 7], "07": [6, 7], "195": 6, "4242": [6, 7], "092751193529": [6, 7], "341": [6, 7], "3393": [6, 7], "577488426015": [6, 7], "ridge_algorithm_hash": [6, 7], "cfa1990d5153c8812982f034d788d7e": [6, 7], "alpha__cfa1990d5153c8812982f034d788d7e": [6, 7], "06877704223043679": [6, 7], "506": 6, "427": [6, 7], "45250420148204": [6, 7], "lasso_algorithm_hash": [6, 7], "5457f609662e44f04dcc9423066d2f58": [6, 7], "alpha__5457f609662e44f04dcc9423066d2f58": [6, 7], "7896547008552977": [6, 7], "577": [6, 7], "3387": [6, 7], "245629616474": [6, 7], "plsregression_algorithm_hash": [6, 7], "9f2f76e479633c0bf18cf2912fed9eda": [6, 7], "n_components__9f2f76e479633c0bf18cf2912fed9eda": [6, 7], "646": [6, 7], "734620250011": [6, 7], "3661540064603184": [6, 7], "1799882524170321": [6, 7], "711": 6, "7": [6, 7, 8, 10], "9650": [6, 7], "026568221794": [6, 7], "kneighborsregressor_algorithm_hash": [6, 7], "1709d2c39117ae29f6c9debe7241287b": [6, 7], "metric__1709d2c39117ae29f6c9debe7241287b": [6, 7], "kneighborsmetr": [6, 7, 10], "n_neighbors__1709d2c39117ae29f6c9debe7241287b": [6, 7], "weights__1709d2c39117ae29f6c9debe7241287b": [6, 7], "kneighborsweight": [6, 7, 10], "uniform": [6, 7, 10], "727": [6, 7], "5437": [6, 7], "151635569594": [6, 7], "05083825348819038": [6, 7], "858": [6, 7], "2669": [6, 7], "8534551928174": 6, "876": 6, "4341": [6, 7], "586120152291": [6, 7], "7921825998469865": [6, 7], "098": [6, 7], "11": [6, 7, 8], "5514": [6, 7], "404088878843": 6, "210": 6, "12": [6, 7, 8], "5431": [6, 7], "634989239215": [6, 7], "228": 6, "13": [6, 7, 8], "3530": [6, 7], "5496618991288": [6, 7], "245": [6, 7], "14": [6, 7, 8], "3497": [6, 7], "6833185436312": [6, 7], "263": [6, 7], "15": [6, 7, 8], "4382": [6, 7], "16208862162": [6, 7], "279": [6, 7], "734620031822": [6, 7], "002825619931800395": [6, 7], "309885135051862e": [6, 7], "09": [6, 7], "296": [6, 7], "17": [6, 7, 8], "679": [6, 7], "3109044887755": [6, 7], "16827992999009767": [6, 7], "370": [6, 7], "18": [6, 7, 8], "2550": [6, 7], "114129318373": [6, 7], "386": [6, 7], "19": [6, 7, 8], "4847": [6, 7], "085792360169": [6, 7], "735431606118867": [6, 7], "404": 6, "268760278916": [6, 7], "0014840820994557746": [6, 7], "04671166881768783": [6, 7], "518": 6, "21": [6, 7, 8], "4783": [6, 7], "047015479679": 6, "536": 6, "22": [6, 7, 8], "3905": [6, 7], "0064899852296": [6, 7], "604": 6, "4030": [6, 7], "4577379164707": [6, 7], "672": 6, "24": [6, 7, 8], "4681": [6, 7], "602145939593": [6, 7], "690": [6, 7], "25": [6, 7, 8], "4398": [6, 7], "544034028325": [6, 7], "6452011213193165": [6, 7], "756": 6, "26": [6, 7, 8], "4454": [6, 7], "143979828406": 6, "27": [6, 7, 8], "765": 6, "28": [6, 7, 8], "833": 6, "29": [6, 7], "4397": [6, 7], "330360587512": [6, 7], "838": 6, "880": [6, 7], "31": [6, 7], "2602": [6, 7], "7561184287083": [6, 7], "897": 6, "5267": [6, 7], "388279961089": [6, 7], "2015560027548533": [6, 7], "06": [6, 7], "014": [6, 7], "33": [6, 7], "4863": [6, 7], "5817607510535": [6, 7], "032": [6, 7], "388": [6, 7], "96473594016675": [6, 7], "5528259214839937": [6, 7], "076": 6, "35": [6, 7], "5539": [6, 7], "698232987626": [6, 7], "6400992020612235": [6, 7], "107": [6, 7], "36": [6, 7], "5180": [6, 7], "5533034102455": [6, 7], "8968910439566395": [6, 7], "125": 6, "37": [6, 7], "4989": [6, 7], "929984864281": [6, 7], "04458440839692226": [6, 7], "492108041427977": [6, 7], "130": 6, "38": [6, 7, 8], "173": [6, 7], "6528": [6, 7], "215066535042": [6, 7], "16700143339733753": [6, 7], "237": [6, 7], "40": [6, 7, 8], "4168": [6, 7], "7955967552625": 6, "292": [6, 7], "41": [6, 7], "6177": [6, 7], "060727800014": [6, 7], "3963": [6, 7], "9069546583414": [6, 7], "378": [6, 7], "43": [6, 7], "6805334166565": [6, 7], "013186009009851564": [6, 7], "001008958590140135": [6, 7], "421": [6, 7], "44": [6, 7], "9300": [6, 7], "86840721566": [6, 7], "441": 6, "45": [6, 7, 8], "83": [6, 7], "87968210939489": [6, 7], "382674443425525e": [6, 7], "447": 6, "46": [6, 7], "460": [6, 7], "48": [6, 7], "525": 6, "49": [6, 7], "3660": [6, 7], "9359502556003": 6, "550": 6, "688": [6, 7], "5244070398325": [6, 7], "5267860995545326": [6, 7], "572": [6, 7], "6494438072099": [6, 7], "8458809314722497": [6, 7], "597": 6, "52": [6, 7], "691": [6, 7], "1197058420935": [6, 7], "9167866889210807": [6, 7], "622": [6, 7], "53": [6, 7], "3111710449325": [6, 7], "945685900574672": [6, 7], "9665592812149": [6, 7], "8936837761725833": [6, 7], "55": [6, 7], "4682747008223": [6, 7], "5183865279530455": [6, 7], "695": [6, 7], "56": [6, 7], "687": [6, 7], "5230947231512": [6, 7], "3771771681361766": [6, 7], "718": [6, 7], "57": [6, 7], "4503442069594": [6, 7], "3663259819415374": [6, 7], "743": [6, 7], "58": [6, 7], "686": [6, 7], "9553733616618": [6, 7], "2925652230875628": [6, 7], "766": [6, 7], "59": [6, 7], "2038330506566": [6, 7], "3962903248948568": [6, 7], "790": 6, "60": [6, 7], "377": [6, 7], "25988028857313": [6, 7], "45237513161879": [6, 7], "814": [6, 7], "379": [6, 7], "8933285317637": [6, 7], "4741161933311207": [6, 7], "62": [6, 7], "374": [6, 7], "50897467366013": [6, 7], "4290962207409417": [6, 7], "864": [6, 7], "63": [6, 7, 8], "376": [6, 7], "5588572940058": [6, 7], "4464295711264585": [6, 7], "890": 6, "64": [6, 7], "237448916406": [6, 7], "4687500034684213": [6, 7], "914": [6, 7], "65": [6, 7], "375": [6, 7], "7474776359051": [6, 7], "4395650011783436": [6, 7], "941": 6, "66": [6, 7], "362": [6, 7], "2834906299732": [6, 7], "3326755354190032": [6, 7], "966": [6, 7], "67": [6, 7], "357": [6, 7], "3474880122588": [6, 7], "2887212943233457": [6, 7], "993": 6, "68": [6, 7], "354": [6, 7], "279045046449": [6, 7], "2577677164664005": [6, 7], "031": 6, "69": [6, 7], "347": [6, 7], "36894395697703": [6, 7], "1672928587680225": [6, 7], "069": [6, 7], "70": [6, 7], "345": [6, 7], "17697390093394": [6, 7], "1242367255308854": [6, 7], "095": 6, "71": [6, 7], "74610809299037": [6, 7], "1728352983905301": [6, 7], "133": [6, 7], "72": [6, 7], "23464281634324": [6, 7], "1265380781508565": [6, 7], "171": 6, "73": [6, 7], "344": [6, 7], "6848312222365": [6, 7], "0829896313820404": [6, 7], "74": [6, 7, 8], "9111966504334": [6, 7], "1070414661080543": [6, 7], "75": [6, 7], "70116419828565": [6, 7], "0875643695329498": [6, 7], "271": [6, 7], "76": [6, 7], "62647974688133": [6, 7], "0716281620790837": [6, 7], "298": 6, "77": [6, 7], "6759429204596": [6, 7], "0456289319914898": [6, 7], "324": 6, "78": [6, 7], "343": [6, 7], "58131497761616": [6, 7], "0010195360522613": [6, 7], "351": 6, "79": [6, 7], "342": [6, 7], "7290581014813": [6, 7], "9073210715005748": [6, 7], "80": [6, 7, 8], "67866114080107": [6, 7], "9166305667100072": [6, 7], "402": 6, "81": [6, 7], "6440308445311": [6, 7], "9248722692093634": [6, 7], "430": [6, 7], "82": [6, 7], "02085648448934": [6, 7], "8776928646870886": [6, 7], "457": [6, 7], "1662266300702": [6, 7], "867592364677856": [6, 7], "484": [6, 7], "84": [6, 7], "30158716569775": [6, 7], "8599491178327108": [6, 7], "523": 6, "85": [6, 7, 9], "2803074848341": [6, 7], "8396948389352923": [6, 7], "563": 6, "86": [6, 7], "28301101884045": [6, 7], "8396651775801683": [6, 7], "589": [6, 7], "87": [6, 7], "6781906268143": [6, 7], "8356021935129933": [6, 7], "617": 6, "88": [6, 7], "0405418264898": [6, 7], "7430046191126949": [6, 7], "645": [6, 7], "89": [6, 7], "77203208258476": [6, 7], "9015965341429055": [6, 7], "684": 6, "90": [6, 7], "363": [6, 7], "1622720320929": [6, 7], "6746575663752555": [6, 7], "712": 6, "91": [6, 7], "7403796626193": [6, 7], "9057564666836629": [6, 7], "740": 6, "92": [6, 7], "63579667712696": [6, 7], "9332275205203372": [6, 7], "767": [6, 7], "93": [6, 7, 8], "6886425884964": [6, 7], "9433063264508291": [6, 7], "795": [6, 7], "94": [6, 7], "9341048659705": [6, 7], "884739221967487": [6, 7], "823": 6, "95": [6, 7, 8], "63507445779743": [6, 7], "9381000493689634": [6, 7], "851": [6, 7], "96": [6, 7], "06021011302374": [6, 7], "963138023068903": [6, 7], "879": 6, "97": [6, 7], "9990546212019": [6, 7], "9601651093867907": [6, 7], "910": 6, "98": [6, 7], "3821": [6, 7], "2267845437514": [6, 7], "938": 6, "356": [6, 7], "6786067133016": [6, 7], "721603508336166": [6, 7], "seaborn": [6, 7, 8], "sn": [6, 7, 8], "set_them": [6, 7], "darkgrid": [6, 7], "default_reg_scor": [6, 7], "ax": [6, 7, 8], "scatterplot": [6, 7], "trials_datafram": [6, 7], "xlabel": [6, 7, 8], "ylabel": [6, 7, 8], "ojbect": [6, 7], "interest": [6, 7, 8], "neg_mean_squared_error": [6, 7, 10], "highlight": [6, 7], "color": [6, 7, 8], "cv_test": [6, 7], "user_attrs_test_scor": [6, 7], "lambda": [6, 7, 13], "item": [6, 7, 11], "idx": [6, 7, 8], "hue": [6, 7], "palett": [6, 7], "set1": [6, 7], "buildconfig_as_dict": [6, 7], "serial": [6, 7], "response_typ": [6, 7, 8, 9], "deduplication_strategi": [6, 7, 8, 9], "split_strategi": [6, 7, 8, 9], "nosplit": [6, 7, 13], "save_intermediate_fil": [6, 7, 9], "log_transform": [6, 7, 8, 9], "log_transform_bas": [6, 7, 8, 9], "null": [6, 7], "log_transform_neg": [6, 7, 8, 9], "log_transform_unit_convers": [6, 7, 8, 9], "probabilistic_threshold_represent": [6, 7, 8, 9], "probabilistic_threshold_representation_threshold": [6, 7, 8, 9], "probabilistic_threshold_representation_std": [6, 7, 8, 9], "shuffl": [6, 7, 10, 12, 13, 14], "best_trial": [6, 7, 10, 12], "best_valu": [6, 7, 10, 12], "tracking_rest_endpoint": [6, 7, 10], "best_build": [6, 7], "rb": [6, 7], "predict_from_smil": [6, 7, 9], "cc1": [6, 7, 8], "43103985": [6, 7], "177": [6, 7], "99850936": [6, 7], "panda": [6, 7, 8], "pd": [6, 7, 8], "df": [6, 7, 13, 14], "read_csv": [6, 7], "matplotlib": [6, 7, 8], "pyplot": [6, 7, 8], "plt": [6, 7, 8], "scatter": [6, 7], "lim": [6, 7], "diagon": [6, 7], "r2_score": [6, 7], "mean_squared_error": [6, 7], "mean_absolute_error": [6, 7], "y_true": [6, 7, 9, 12], "y_pred": [6, 7, 9, 12], "rmse": [6, 7], "mae": [6, 7], "absolut": [6, 7], "8566354978126369": [6, 7], "204909888075044": [6, 7], "298453946973815": [6, 7], "again": [6, 7], "hopefulli": [6, 7, 8], "littl": [6, 7], "better": [6, 7, 8, 9, 13], "send": [6, 7], "strategi": [6, 7, 9], "current": [6, 7, 9, 11], "observ": [6, 7, 8], "last": [6, 7, 8, 13], "alreadi": [6, 7, 8, 9, 11], "sort": [6, 7, 8, 13, 14], "oldest": [6, 7, 8, 13, 14], "newest": [6, 7, 8, 9, 13, 14], "end": [6, 7, 8, 13, 14], "extern": [6, 7], "tool": [6, 7], "excel": [6, 7], "unballanc": [6, 7], "come": [6, 7, 8], "measur": [6, 7, 8], "fact": [6, 7], "disregard": [6, 7], "stereochemistri": [6, 7, 8, 9], "sever": [6, 7], "median": [6, 7, 8, 13], "factor": [6, 7, 8], "replic": [6, 7, 8], "robust": [6, 7, 8], "outlier": [6, 7, 8], "acorss": [6, 7], "trust": [6, 7], "kept": [6, 7], "splitter": [6, 7, 8, 9, 11], "track_to_mlflow": [6, 7, 10], "my_study_stratified_split": [6, 7], "165": 6, "207": [6, 7], "303": [6, 7], "261": [6, 7], "95269731189177": 6, "586114272804535": 6, "439": [6, 7], "3455": 6, "51800700426": 6, "1856": [6, 7], "4459752935309": [6, 7], "477": 6, "1235": 6, "3128104073717": 6, "5613443439636077": 6, "495": [6, 7], "3949": [6, 7], "4997740833423": [6, 7], "259060787354118": 6, "06151214721649829": 6, "560": [6, 7], "3258": 6, "3324669641333": 6, "580": 6, "281": [6, 7], "6313215642597": 6, "821793264230599": 6, "2756": [6, 7], "046839500092": [6, 7], "615": 6, "2720": [6, 7], "793752592223": [6, 7], "631": 6, "4702695112846": 6, "11028790699101433": 6, "001202131310186554": 6, "710": [6, 7], "2695": [6, 7], "2514836330784": [6, 7], "731": 6, "1688": 6, "7128683041683": 6, "1044548905141272": 6, "746": 6, "2658": 6, "13214897931": 6, "813": [6, 7], "1948": 6, "0314425327626": 6, "831": [6, 7], "1332": 6, "6840893052315": 6, "8033739312636219": 6, "848": [6, 7], "7730407032913": 6, "978415570131035": 6, "380966239365776": 6, "5380266414879525e": 6, "882": [6, 7], "39037036873405": 6, "13170545295199e": 6, "898": [6, 7], "347685324232952": 6, "782238919549724e": 6, "902": 6, "920": [6, 7], "4997657609406": 6, "004091119479264935": 6, "7670039814136804e": 6, "939": [6, 7], "4997709689146": 6, "020406357580717727": 6, "826432657033465e": 6, "956": [6, 7], "3942": 6, "5257596151837": 6, "00017594354214526438": 6, "3221158157501884": 6, "972": [6, 7], "1775": [6, 7], "55204856041": [6, 7], "989": [6, 7], "9426790782418": 6, "28574770987033293": 6, "006": [6, 7], "1254": 6, "9841129079468": 6, "0742769549097546": 6, "073": [6, 7], "090": 6, "1249": 6, "5519579928275": 6, "26166764283582": 6, "122": [6, 7], "4997740490603": 6, "1551243322855379": 6, "869530660905885e": 6, "141": 6, "613671789797623": 6, "18743805815241568": 6, "160": 6, "4997740057183": 6, "0006647090582038176": 6, "720240531591189e": 6, "188": [6, 7], "236": [6, 7], "75701162742902": 6, "15225101226627": 6, "2726": [6, 7], "0476769808097": [6, 7], "225": [6, 7], "98897579737036": 6, "3434026346873007e": 6, "3596": 6, "741420193717": 6, "311": 6, "1242": 6, "8479265462504": 6, "3806781553300398": 6, "148057819462277": 6, "1220747475846438e": 6, "410": [6, 7], "2906": 6, "3484169581293": 6, "474": [6, 7], "2182": 6, "2854817163393": 6, "494": 6, "1682": 6, "7555601297397": 6, "7692026965764096": 6, "527": 6, "1885": 6, "3761105075926": 6, "8499325582942474": 6, "7934477837753": 6, "26437658363366806": 6, "399729524954495": 6, "4996545768313": 6, "03999295021459913": 6, "487454158254508e": 6, "648": [6, 7], "2279": 6, "772434063323": 6, "668": 6, "1686": 6, "497519225056": 6, "9798152426640634": 6, "700": [6, 7], "1734": 6, "418175645478": 6, "1638039970995402": 6, "720": [6, 7, 9], "2641": [6, 7], "7637473751115": [6, 7], "726": [6, 7], "732": 6, "751": 6, "4997740833387": 6, "6381698921109232": 6, "0041111342254524e": 6, "774": [6, 7], "8133725349282": 6, "9498873960159637": 6, "797": [6, 7], "7735399551454": 6, "9780612881075026": 6, "822": 6, "8160071680375": 6, "9480302946593064": 6, "843": 6, "75592491031455": 6, "9905788379110985": 6, "866": [6, 7], "7455012578744": 6, "998003047330558": 6, "891": 6, "265": [6, 7], "5420569489236": 6, "731766992009085": 6, "925": 6, "268": [6, 7], "5837896907764": 6, "8088769537936915": 6, "961": [6, 7], "270": [6, 7], "2819638853734": 6, "8381998920032558": 6, "986": 6, "5370756433875": 6, "8423274630826914": 6, "009": [6, 7], "6648549453774": 6, "8105870658571404": 6, "034": 6, "267": [6, 7], "33331573420924": 6, "7812473578529109": 6, "058": 6, "54266068640237": 6, "7865813805833881": 6, "084": [6, 7], "264": [6, 7], "7374685857255": 6, "7033718535925544": 6, "108": [6, 7], "259": 6, "06013832754854": 6, "530230339296878": 6, "134": [6, 7], "254": 6, "45098385749847": 6, "4449038663990794": 6, "252": [6, 7], "46933447499055": 6, "4118163766482357": 6, "211": [6, 7], "400610865412": 6, "3751234485145145": 6, "248": [6, 7], "55142126098917": 6, "3782312158054713": 6, "285": [6, 7], "249": [6, 7], "939720762774": 6, "3654947227249123": 6, "51859203038146": 6, "3389300472278876": 6, "247": [6, 7], "97854622218964": 6, "3291551817821483": 6, "82875013698148": 6, "344470263084507": 6, "437": 6, "89404238932664": 6, "2945916241697062": 6, "475": 6, "88444574036467": 6, "294423585518049": 6, "512": [6, 7], "242": [6, 7], "7250858383981": 6, "2374026497690556": 6, "241": [6, 7], "38995410978927": 6, "2216216823389983": 6, "588": [6, 7], "75773569374167": 6, "1685257395531474": 6, "627": [6, 7], "238": [6, 7], "9591618086847": 6, "1871718734668695": 6, "667": 6, "16615158396067": 6, "1749827907502346": 6, "705": [6, 7], "87253431766433": 6, "1541307320952652": 6, "744": [6, 7], "234": [6, 7], "54432497574712": 6, "1118826871769896": 6, "783": [6, 7], "500370208023": 6, "1109739335876776": 6, "820": 6, "227": [6, 7], "05479722761888": 6, "9557242358902104": 6, "859": [6, 7], "226": 6, "75744778941316": 6, "9492111894491083": 6, "900": [6, 7], "23291544469544": 6, "9371731029417466": 6, "940": [6, 7], "8608948363877": 6, "9283493142218042": 6, "981": [6, 7], "223": [6, 7], "79470023518647": 6, "8924342905874942": 6, "021": [6, 7, 8], "04998656317707": 6, "914666812200899": 6, "061": 6, "3255192874075": 6, "8835546302939554": 6, "099": [6, 7], "224": [6, 7], "5251215421697": 6, "9055752025758994": 6, "140": [6, 7], "49998736816636": 6, "9051359167587669": 6, "180": [6, 7], "40892455090952": 6, "9035104089361927": 6, "1896344823456": 6, "9170686489009984": 6, "217": 6, "03166841852928": 6, "6196471760805207": 6, "289": [6, 7], "15921264908027": 6, "6137087588616705": 6, "330": [6, 8], "216": [6, 7], "30437532378687": 6, "6380025600331409": 6, "372": [6, 7], "215": [6, 7], "71630507323695": 6, "663588879747517": 6, "411": [6, 7], "1690838497103": 6, "641298655189503": 6, "450": 6, "79332895242592": 6, "654362351183699": 6, "491": [6, 7], "737398967865": 6, "6605844367915987": 6, "By": [6, 7, 8], "roc_auc": [6, 7, 10], "stabl": [6, 7, 9], "model_evalu": [6, 7], "amongst": [6, 7], "regression_scor": [6, 7], "classification_scor": [6, 7], "explained_vari": [6, 7, 10], "max_error": [6, 7, 10], "neg_mean_absolute_error": [6, 7, 10], "neg_median_absolute_error": [6, 7, 10], "average_precis": [6, 7, 10], "balanced_accuraci": [6, 7, 10], "f1": [6, 7, 10], "f1_macro": [6, 7, 10], "f1_micro": [6, 7, 10], "f1_weight": [6, 7, 10], "jaccard": [6, 7, 10], "jaccard_macro": [6, 7, 10], "jaccard_micro": [6, 7, 10], "jaccard_weight": [6, 7, 10], "neg_brier_scor": [6, 7, 10], "precis": [6, 7, 8, 10], "precision_macro": [6, 7, 10], "precision_micro": [6, 7, 10], "precision_weight": [6, 7, 10], "recal": [6, 7, 10], "recall_macro": [6, 7, 10], "recall_micro": [6, 7, 10], "recall_weight": [6, 7, 10], "auc_pr_cal": [6, 7, 9, 10], "bedroc": [6, 7, 9, 10], "concordance_index": [6, 7, 9, 10], "my_study_r2": [6, 7], "590": 6, "01117186866515977": [6, 7], "657": [6, 7], "08689402230378156": [6, 7], "12553701248394863": [6, 7], "141096648805748": [6, 7], "4893466963980463e": [6, 7], "922": 6, "3039309544203818": [6, 7], "936": 6, "20182749628697164": [6, 7], "957": [6, 7], "8187194367176578": [6, 7], "979": [6, 7], "4647239019719945": [6, 7], "6574750183038587": [6, 7], "8614818478547979": [6, 7], "3974313630683448": [6, 7], "086": [6, 7], "12769795082909816": 6, "127": [6, 7], "8639946428338224": [6, 7], "2391884918766034": [6, 7], "157": [6, 7], "12553701248377633": [6, 7], "00044396482429275296": [6, 7], "3831436879125245e": [6, 7], "186": [6, 7], "12553700871203702": [6, 7], "00028965395242758657": [6, 7], "99928292425642e": [6, 7], "202": [6, 7], "2935582042429075": [6, 7], "219": [6, 7], "18476333152695587": [6, 7], "8190707459213998": [6, 7], "4060379177903557": [6, 7], "301": [6, 7], "12206148974315863": [6, 7], "318": [6, 7], "3105263811279067": [6, 7], "344271094811757": [6, 7], "336": [6, 7], "3562469062424869": [6, 7], "670604991178476": [6, 7], "401": [6, 7], "045959695906983344": [6, 7], "432": 6, "8583939656024446": [6, 7], "5158832554303112": [6, 7], "448": 6, "3062574078515544": [6, 7], "479": 6, "11657354998283716": [6, 7], "0009327650919528738": [6, 7], "062479210472502": [6, 7], "483": 6, "502": 6, "8498478905829554": [6, 7], "1366172066709432": [6, 7], "602": [6, 7], "13519830637607919": [6, 7], "92901911959232": [6, 7], "999026012594694": [6, 7], "621": [6, 7], "8198078293055633": [6, 7], "5888977841391714": [6, 7], "640": 6, "8201573964824842": [6, 7], "19435298754153707": [6, 7], "706": [6, 7], "04595969590698312": 6, "736": [6, 7], "6285506249643193": [6, 7], "35441495011256785": [6, 7], "803": [6, 7], "11934070343348317": [6, 7], "4374125584543907": [6, 7], "2457809516380005": [6, 7], "852": 6, "3625576518621392": [6, 7], "6459129458824919": [6, 7], "871": [6, 7], "36175556871883746": [6, 7], "8179058888285398": [6, 7], "896": 6, "8202473217121523": [6, 7], "0920052840435055": [6, 7], "913": [6, 7], "3672927879319306": [6, 7], "8677032984759461": [6, 7], "918": 6, "40076792599874356": [6, 7], "2865764368847064": [6, 7], "996": 6, "26560316846701765": [6, 7], "064": [6, 7], "41215254857081174": [6, 7], "221": [6, 7], "004614143721600701": 6, "240": 6, "27282533524183633": [6, 7], "322": 6, "10220127407364972": 6, "30323404130582854": [6, 7], "3044553805553568": [6, 7], "6437201185807124": [6, 7], "382": 6, "41502276709562": [6, 7], "10978379088847677": [6, 7], "36160209098547913": [6, 7], "022707289534838138": [6, 7], "423": 6, "2916101445983833": [6, 7], "kljk345": [6, 7], "pypoetri": [6, 7], "virtualenv": [6, 7], "_qsktrft": 6, "py3": [6, 7], "lib": [6, 7], "python3": [6, 7], "site": [6, 7], "linear_model": [6, 7], "_coordinate_desc": [6, 7], "678": [6, 7], "convergencewarn": [6, 7], "did": [6, 7], "regularis": [6, 7], "dualiti": [6, 7], "gap": [6, 7], "936e": [6, 7], "02": [6, 7], "toler": [6, 7], "782e": [6, 7], "cd_fast": [6, 7], "enet_coordinate_desc": [6, 7], "434e": [6, 7], "977e": [6, 7], "496": 6, "8609413020928532": [6, 7], "04987590926279814": [6, 7], "794e": [6, 7], "830e": [6, 7], "906e": [6, 7], "578e": [6, 7], "8610289662757457": [6, 7], "019211413400468974": [6, 7], "754e": [6, 7], "843e": [6, 7], "507e": [6, 7], "8610070549049179": [6, 7], "018492644772509947": [6, 7], "840e": [6, 7], "924e": [6, 7], "513e": [6, 7], "754": [6, 7], "8569771623635769": [6, 7], "008783442408928633": [6, 7], "243e": [6, 7], "014e": [6, 7], "825": 6, "8624781673814641": [6, 7], "05782221001517797": [6, 7], "113e": [6, 7], "935e": [6, 7], "122e": [6, 7], "8618589507037001": [6, 7], "02487072255316275": [6, 7], "960": [6, 7], "864754359721037": [6, 7], "2079910754941946": [6, 7], "998": [6, 7], "8622236413326235": [6, 7], "333215560931422": [6, 7], "861832165638517": [6, 7], "3628098560209365": [6, 7], "072": 6, "8620108533993581": [6, 7], "34240779695521706": [6, 7], "120": [6, 7], "8638540565650902": [6, 7], "26493714991266293": [6, 7], "8629799500771645": [6, 7], "30596394512914815": [6, 7], "8621408609583922": [6, 7], "33648829357762355": [6, 7], "8638132124078156": [6, 7], "2679814646317183": [6, 7], "319": [6, 7], "863983758876634": [6, 7], "24062119162159595": [6, 7], "8627356047945115": [6, 7], "3141728910335158": [6, 7], "8639203054085788": [6, 7], "23391390640786494": [6, 7], "8570103863991635": [6, 7], "6124885145996103": [6, 7], "532": 6, "8647961976727571": [6, 7], "2059976546070975": [6, 7], "591": 6, "8648312544921793": [6, 7], "20266060662750784": [6, 7], "653": [6, 7], "8648431452862716": [6, 7], "20027647978240445": [6, 7], "715": 6, "8648491459660418": [6, 7], "1968919999787333": [6, 7], "778": 6, "8650873115156988": [6, 7], "174598921162764": [6, 7], "855": 6, "8650350577921149": [6, 7], "16468002989641095": [6, 7], "928": 6, "8649412283687147": [6, 7], "1606717091615047": [6, 7], "986e": [6, 7], "015": [6, 7], "8649537211609554": [6, 7], "14694925097689848": [6, 7], "8649734575435447": [6, 7], "147612713300643": [6, 7], "446e": [6, 7], "175": [6, 7], "8648761002838515": [6, 7], "14440434705706803": [6, 7], "398e": [6, 7], "251": [6, 7], "8639826593122782": [6, 7], "1265357179513065": [6, 7], "690e": [6, 7], "328": [6, 7], "864435565531768": [6, 7], "1374245525868926": [6, 7], "366": [6, 7], "8590221951825531": [6, 7], "49890830155012533": [6, 7], "8649098880804443": [6, 7], "1573428812070292": [6, 7], "405e": [6, 7], "520": 6, "864536410656637": [6, 7], "13886104722511608": [6, 7], "561": [6, 7], "8597401050431873": [6, 7], "47746341180045787": [6, 7], "600": 6, "8537465461603838": [6, 7], "050e": [6, 7], "8642643827090003": [6, 7], "13446778921611002": [6, 7], "175e": [6, 7], "8641621818665252": [6, 7], "1286796719653316": [6, 7], "854": [6, 7], "864182755916388": [6, 7], "13303218726548235": [6, 7], "1255357440899417": [6, 7], "021711452917433944": [6, 7], "559714273835951e": [6, 7], "937": [6, 7], "8604596648091501": [6, 7], "43644874418279245": [6, 7], "463e": [6, 7], "8635689909135862": [6, 7], "10940922083495383": [6, 7], "078": 6, "8648544336551733": [6, 7], "1912756875742137": [6, 7], "142": 6, "8648496595672595": [6, 7], "19628449928540487": [6, 7], "170": [6, 7], "8452625121122099": [6, 7], "4324661283995224": [6, 7], "198": [6, 7], "8378670635846416": [6, 7], "839206620815206": [6, 7], "002e": [6, 7], "082e": [6, 7], "286": 6, "8649365368153895": [6, 7], "07270781179126021": [6, 7], "373": 6, "8875676754699953": [6, 7], "0006995169897945908": [6, 7], "618e": [6, 7], "234e": [6, 7], "586e": [6, 7], "465": [6, 7], "8730555131061773": [6, 7], "0018186269840273495": [6, 7], "509": [6, 7], "12553508835019533": [6, 7], "04867556317570456": [6, 7], "0011658455138452": [6, 7], "177e": [6, 7], "284e": [6, 7], "016e": [6, 7], "599": [6, 7], "8586292788613132": [6, 7], "005078762921098462": [6, 7], "anyalgorithm": [6, 7], "__args__": [6, 7], "consider": [6, 7, 8], "modif": [6, 7, 11, 13], "establish": [6, 7], "rf": [6, 7], "account": [6, 7, 8, 9], "though": [6, 7], "treat": [6, 7, 8], "pdf": [6, 7, 10], "denot": [6, 7, 13, 14], "determinist": [6, 7, 8], "quantiti": [6, 7], "tradit": [6, 7, 8], "discret": [6, 7], "discretis": [6, 7, 13, 15], "bioactiv": [6, 7, 8], "integr": [6, 7], "afford": [6, 7, 8], "liklihood": [6, 7], "membership": [6, 7, 8], "iopscienc": [6, 7], "iop": [6, 7], "articl": [6, 7, 8], "3847": [6, 7], "1538": [6, 7], "3881": [6, 7], "aaf101": [6, 7], "pxc50": [6, 7, 8], "p24863": [6, 7], "enabl": [6, 7, 8], "alwai": [6, 7, 8, 9], "724": 6, "0811707042483984": 6, "prfclassifier_algorithm_hash": [6, 7], "efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "max_depth__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "n_estimators__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "max_features__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "prfclassifiermaxfeatur": [6, 7, 10], "min_py_sum_leaf__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "use_py_gini__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "use_py_leafs__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "07385123845467624": 6, "08693605025593726": 6, "782": [6, 7], "07306390786920249": 6, "07213945175504542": 6, "055757209329220986": 6, "039": 6, "06330901806749258": 6, "811": 6, "07619841217081819": 6, "061815145745506755": 6, "091": 6, "07429343450473058": 6, "06446287784137206": 6, "574": 6, "06120344765133655": 6, "745": 6, "0686143607166384": 6, "199": 6, "05295650394252901": 6, "best_built": [6, 7], "demonstr": [6, 7, 8], "purpos": [6, 7, 8], "transduct": [6, 7], "example_smil": [6, 7], "get_set": [6, 7, 8, 9], "outsid": [6, 7, 8, 9], "likelihood": [6, 7], "problemat": [6, 7], "except": [6, 7, 9, 11, 13], "valueerror": [6, 7], "As": [6, 7, 8], "raw": [6, 7, 8, 9, 13], "551": [6, 7], "595": [6, 7], "w": [6, 7, 9], "fail": [6, 7, 9], "traceback": [6, 7], "recent": [6, 7], "_optim": [6, 7], "196": [6, 7], "_run_trial": [6, 7], "value_or_valu": [6, 7], "func": [6, 7], "pycharmproject": [6, 7], "optuna_az": [6, 8], "128": [6, 7], "__call__": [6, 7], "_validate_algo": [6, 7], "rais": [6, 7, 9, 11, 13], "598": 6, "summaris": [6, 7], "handl": [6, 7], "convent": [6, 7, 8, 11], "classic": [6, 7], "relev": [6, 7], "cutoff": [6, 7, 8, 13], "ouput": [6, 7], "reflect": [6, 7, 8], "abov": [6, 7, 8], "arguabl": [6, 7], "mpo": [6, 7], "pub": [6, 7], "ac": [6, 7], "full": [6, 7, 10], "jcim": [6, 7], "9b00237": [6, 7], "slide": [6, 7], "googl": [6, 7], "14pbd9ltxzfpsjhyxykflxnk8q80lhvnjimg8a3wqcrm": [6, 7], "edit": [6, 7], "calcault": [6, 7], "smilesbaseddescriptor": [6, 7], "architectur": [6, 7, 8], "quickli": [6, 7], "650": [6, 7], "root": [6, 7, 10, 11], "enqueu": [6, 7, 9], "manual": [6, 7], "activation__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "relu": [6, 7, 10], "aggregation__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "aggregation_norm__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "batch_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "depth__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "dropout__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "features_generator__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "ffn_hidden_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "ffn_num_layers__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "final_lr_ratio_exp__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "hidden_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "init_lr_ratio_exp__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "max_lr_exp__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "warmup_epochs_ratio__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "chempropregressor_algorithm_hash": [6, 7], "668a7428ff5cdb271b01c0925e8fea45": [6, 7], "416": 6, "6833": [6, 7], "034983241957": [6, 7], "chempropactiv": [6, 7, 10], "chempropaggreg": [6, 7, 10], "ensemble_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "epochs__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "chempropfeatures_gener": [6, 7, 10], "531": [6, 7], "6341": 6, "72494883772": 6, "115": [6, 7], "500": [6, 7], "1500": 6, "safe": [6, 7], "nan": [6, 7, 9, 13, 14], "prompt": [6, 7], "due": [6, 7, 8, 9, 11], "deactiv": [6, 7], "own": [6, 7], "still": [6, 7], "commun": [6, 7], "facilit": [6, 7, 8, 10], "preset": [6, 7], "enqu": [6, 7], "bayesian": [6, 7], "split_chemprop": [6, 7, 10], "flag": [6, 7, 8, 13, 14], "n_chemprop_tri": [6, 7, 10], "desir": [6, 7], "undirect": [6, 7], "shown": [6, 7, 8], "aspect": [6, 7, 9], "princip": [6, 7, 8], "expand": [6, 7, 9], "differnt": [6, 7], "rememb": [6, 7], "unless": [6, 7], "alter": [6, 7, 10], "characterist": [6, 7, 8], "too": [6, 7, 10], "limit": [6, 7, 8, 10], "vice": [6, 7, 10], "versa": [6, 7, 10], "extens": [6, 7, 10], "trail": [6, 7, 10], "applic": [6, 7, 8, 10], "chanc": [6, 7], "caruana": [6, 7], "particular": [6, 7], "achiev": [6, 7, 8], "st": [6, 7], "figur": [6, 7, 8], "signal": [6, 7], "aka": [6, 7], "could": [6, 7, 8], "share": [6, 7, 13, 14], "until": [6, 7, 10], "longer": [6, 7, 11], "mt": [6, 7], "onc": [6, 7, 8, 13], "knowledg": [6, 7], "order": [6, 7, 8, 10, 13], "earlier": [6, 7, 8], "accompi": [6, 7], "train_side_info": [6, 7], "clog": [6, 7], "surfac": [6, 7], "area": [6, 7, 8], "psa": [6, 7], "293": [6, 7], "22475": [6, 7], "8088": [6, 7], "883": [6, 7], "32297": [6, 7], "6237": [6, 7], "835": [6, 7], "287": [6, 7], "33334": [6, 7], "2804": [6, 7], "314": [6, 7], "26075": [6, 7], "2533": [6, 7], "498": [6, 7], "278": [6, 7], "18917": [6, 7], "5102": [6, 7], "694": [6, 7], "246": [6, 7], "12575": [6, 7], "7244": [6, 7], "255": [6, 7], "14831": [6, 7], "4338": [6, 7], "895": [6, 7], "302": [6, 7], "26838": [6, 7], "2041": [6, 7], "057": [6, 7], "22298": [6, 7], "match": [6, 7], "train_side_info_cl": [6, 7], "clogp_gt2": [6, 7], "clogs_gt": [6, 7], "acceptors_gt5": [6, 7], "donors_gt0": [6, 7], "area_gt250": [6, 7], "psa_lt0": [6, 7], "832": 6, "809": [6, 7], "5817": [6, 7], "944294219682": 6, "chemprophyperoptregressor_algorithm_hash": [6, 7], "db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "ensemble_size__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "epochs__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "features_generator__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "num_iters__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "search_parameter_level__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "chempropsearch_parameter_level": [6, 7, 10], "aux_weight_pc__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "841": 6, "5796": [6, 7], "344216469237": 6, "443": 6, "5795": [6, 7], "086276167766": 6, "468": [6, 7], "5820": [6, 7], "228288292862": 6, "012": [6, 7], "5852": [6, 7], "160071204277": 6, "inlfuenc": [6, 7], "henc": [6, 7, 8], "percent": [6, 7], "product": [6, 7], "user_attrs_trial_ran": [6, 7], "drop": [6, 7, 8, 9], "erron": [6, 7], "__": [6, 7], "params_aux_weight_pc": [6, 7], "conclud": [6, 7, 8], "produc": [6, 7], "overrid": [6, 7, 10], "situat": [6, 7, 8], "along": [6, 7], "potenti": [6, 7, 8], "compris": [6, 7, 8], "incompat": [6, 7, 11], "whilst": [6, 7, 8], "desciptor": [6, 7], "grei": [6, 7, 8], "tial": [6, 7], "what": [6, 7], "unpromis": [6, 7], "why": [6, 7, 8], "poor": [6, 7], "sampler": [6, 7], "incompta": [6, 7], "repeatedli": [6, 7], "hyerparamet": [6, 7], "ident": [6, 7, 11], "368": 6, "9525489095524835": [6, 7], "aux_weight_pc__cfa1990d5153c8812982f034d788d7e": [6, 7], "4824": [6, 7], "686269039228": [6, 7], "7731425652872588": [6, 7], "555": [6, 7], "4409": [6, 7], "946844928445": [6, 7], "791002332112292": [6, 7], "874": [6, 7], "329624779366306": [6, 7], "00015024763718638216": [6, 7], "917": [6, 7], "4396": [6, 7], "722635068717": [6, 7], "081": [6, 7], "309": [6, 7], "320": 6, "consult": [6, 7], "incompitbl": [6, 7], "algo": [6, 7, 10], "occur": [6, 7, 9], "assign": [6, 7, 8], "doe": [6, 7, 8, 9, 10, 11, 13], "params_algorithm_nam": [6, 7], "move_legend": [6, 7], "upper": [6, 7, 8], "bbox_to_anchor": [6, 7, 8], "never": [6, 7], "successfulli": [6, 7], "absenc": [6, 7], "8th": [6, 7], "miss": [6, 7, 9, 13, 14], "associ": [6, 7, 8], "asid": [6, 7], "mitig": [6, 7], "overal": [6, 7, 8], "serv": [6, 7, 12], "tl": [6, 7], "wider": [6, 7], "787": 6, "788": [6, 7], "activation__e0d3a442222d4b38f3aa1434851320db": [6, 7], "aggregation__e0d3a442222d4b38f3aa1434851320db": [6, 7], "aggregation_norm__e0d3a442222d4b38f3aa1434851320db": [6, 7], "batch_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "depth__e0d3a442222d4b38f3aa1434851320db": [6, 7], "dropout__e0d3a442222d4b38f3aa1434851320db": [6, 7], "features_generator__e0d3a442222d4b38f3aa1434851320db": [6, 7], "ffn_hidden_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "ffn_num_layers__e0d3a442222d4b38f3aa1434851320db": [6, 7], "final_lr_ratio_exp__e0d3a442222d4b38f3aa1434851320db": [6, 7], "hidden_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "init_lr_ratio_exp__e0d3a442222d4b38f3aa1434851320db": [6, 7], "max_lr_exp__e0d3a442222d4b38f3aa1434851320db": [6, 7], "warmup_epochs_ratio__e0d3a442222d4b38f3aa1434851320db": [6, 7], "e0d3a442222d4b38f3aa1434851320db": [6, 7], "4937": [6, 7], "540075659691": [6, 7], "ensemble_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "epochs__e0d3a442222d4b38f3aa1434851320db": [6, 7], "953": 6, "462": [6, 7], "5114": [6, 7], "7131239123555": [6, 7], "chempropregressorpretrained_algorithm_hash": [6, 7], "dfc518a76317f23d95e5aa5a3eac77f0": [6, 7], "frzn__dfc518a76317f23d95e5aa5a3eac77f0": [6, 7], "chempropfrzn": [6, 7, 10], "epochs__dfc518a76317f23d95e5aa5a3eac77f0": [6, 7], "cover": [6, 7], "global": [6, 7], "fair": [6, 7], "tl_studi": [6, 7], "loc": [6, 7, 8], "params_epoch": [6, 7], "fillna": [6, 7], "astyp": [6, 7, 8], "agg": [6, 7], "join": [6, 7, 8], "params_chempropregressor_algorithm_hash": [6, 7], "isna": [6, 7], "570": [6, 7], "452": [6, 7], "5891": [6, 7], "7552821093905": [6, 7], "994": [6, 7], "105": [6, 7], "5846": [6, 7], "8674879655655": [6, 7], "1600": [6, 7], "861": [6, 7], "5890": [6, 7], "94653501547": [6, 7], "77dfc8230317e08504ed5e643243fbc2": [6, 7], "frzn__77dfc8230317e08504ed5e643243fbc2": [6, 7], "epochs__77dfc8230317e08504ed5e643243fbc2": [6, 7], "283": 6, "881210303758": [6, 7], "right": [6, 7, 8], "ncol": [6, 7], "world": [6, 7, 8, 13, 14], "penultim": [6, 7, 10], "chemprop_model": [6, 7], "heatmap": [6, 7], "predictor": [6, 7, 9], "chemprop_fingerprint": [6, 7], "fingerprint_typ": [6, 7], "mpn": [6, 7], "cbar_kw": [6, 7], "semi": [6, 7], "supervis": [6, 7], "altern": [6, 7], "last_ffn": [6, 7], "howeev": [6, 7], "respect": [6, 7, 8], "kind": [6, 7, 8, 13], "confid": [6, 7], "calibratedclassifiercv": [6, 7], "understand": [6, 7], "predict_proba": [6, 7, 9], "gave": [6, 7], "close": [6, 7, 8], "actual": [6, 7, 8], "topic": [6, 7], "sigmoid": [6, 7, 10], "review": [6, 7], "those": [6, 7, 8, 9], "calibration_curv": [6, 7], "collect": [6, 7], "defaultdict": [6, 7], "precision_scor": [6, 7], "recall_scor": [6, 7], "f1_score": [6, 7], "brier_score_loss": [6, 7], "log_loss": [6, 7], "roc_auc_scor": [6, 7], "n_job": [6, 7, 10, 12], "calibrated_rf": [6, 7], "calibrated_model": [6, 7], "701": [6, 7], "703": 6, "775": [6, 7], "8353535353535354": [6, 7], "calibratedclassifiercvwithva_algorithm_hash": [6, 7], "e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "n_folds__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "max_depth__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "n_estimators__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "max_features__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "uncalibr": [6, 7], "uncalibrated_rf": [6, 7], "uncalibrated_model": [6, 7], "306": 6, "352": 6, "719": [6, 7], "8185858585858585": [6, 7], "randomforestclassifier_algorithm_hash": [6, 7], "167e1e88dd2a80133e317c78f009bdc9": [6, 7], "max_depth__167e1e88dd2a80133e317c78f009bdc9": [6, 7], "n_estimators__167e1e88dd2a80133e317c78f009bdc9": [6, 7], "max_features__167e1e88dd2a80133e317c78f009bdc9": [6, 7], "conserv": [6, 7], "1000": [6, 7, 8], "random_st": [6, 7, 13, 14], "123": [6, 7], "calibrated_predict": [6, 7], "uncalibrated_predict": [6, 7], "cal_df": [6, 7], "datafram": [6, 7, 8, 9, 12, 13], "boxplot": [6, 7], "melt": [6, 7], "set_ylabel": [6, 7, 8], "behaviour": [6, 7, 8], "curv": [6, 7, 8], "reliabl": [6, 7], "diagram": [6, 7], "against": [6, 7], "figsiz": [6, 7, 8], "ax1": [6, 7], "subplot2grid": [6, 7], "rowspan": [6, 7], "ax2": [6, 7], "perfectli": [6, 7, 8], "pred": [6, 7], "fraction_of_posit": [6, 7], "mean_predicted_valu": [6, 7], "n_bin": [6, 7], "brier": [6, 7], "2f": [6, 7], "hist": [6, 7], "histtyp": [6, 7], "lw": [6, 7], "set_ylim": [6, 7], "legend": [6, 7, 8], "set_titl": [6, 7], "set_xlabel": [6, 7, 8], "center": [6, 7, 8], "tight_layout": [6, 7, 8], "compos": [6, 7], "refin": [6, 7], "notic": [6, 7], "significantli": [6, 7], "cell": [6, 7], "accur": [6, 7], "alloc": [6, 7, 9], "y_prob": [6, 7], "ye": [6, 7], "score_nam": [6, 7], "__name__": [6, 7], "replac": [6, 7, 11], "capit": [6, 7], "score_df": [6, 7], "set_index": [6, 7], "decim": [6, 7], "roc": [6, 7], "auc": [6, 7, 9], "184705": [6, 7], "547129": [6, 7], "830565": [6, 7], "744048": [6, 7], "784929": [6, 7], "716536": [6, 7], "175297": [6, 7], "529474": [6, 7], "811209": [6, 7], "818452": [6, 7], "814815": [6, 7], "714104": [6, 7], "va": [6, 7], "multipoint": [6, 7], "0c00476": [6, 7], "margin": [6, 7, 8], "bounari": [6, 7], "384": [6, 7], "469": [6, 7], "8213131313131313": [6, 7], "79765fbec1586f3c917ff30de274fdb4": [6, 7], "n_folds__79765fbec1586f3c917ff30de274fdb4": [6, 7], "max_depth__79765fbec1586f3c917ff30de274fdb4": [6, 7], "n_estimators__79765fbec1586f3c917ff30de274fdb4": [6, 7], "max_features__79765fbec1586f3c917ff30de274fdb4": [6, 7], "uncert": [6, 7, 9], "chem": [6, 7, 8, 9], "allchem": [6, 7], "pandastool": [6, 7, 8], "rdconfig": [6, 7], "datastruct": [6, 7], "train_df": [6, 7], "addmoleculecolumntofram": [6, 7], "includefingerprint": [6, 7], "getmorganfingerprint": [6, 7], "nn": [6, 7], "bulktanimotosimilar": [6, 7], "va_pr": [6, 7], "va_uncert": [6, 7], "dtm": [6, 7], "trelli": [6, 7], "fig": [6, 7, 8], "subplot": [6, 7, 8], "sharei": [6, 7], "regplot": [6, 7], "referenc": [6, 7], "boundari": [6, 7, 8, 13, 15], "neither": [6, 7], "nor": [6, 7], "dissimilar": [6, 7], "cp_pred_ensembl": [6, 7], "cp_uncert_ensembl": [6, 7], "886": 6, "933": [6, 7], "activation__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "aggregation__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "batch_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "depth__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "dropout__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "features_generator__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "hidden_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "chempropclassifier_algorithm_hash": [6, 7], "fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "137": [6, 7], "65625": [6, 7], "ensemble_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "epochs__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "midpoint": [6, 7], "mont": [6, 7], "carlo": [6, 7], "virtual": [6, 7, 9], "931": 6, "activation__c73885c5d5a4182168b8b002d321965a": [6, 7], "aggregation__c73885c5d5a4182168b8b002d321965a": [6, 7], "aggregation_norm__c73885c5d5a4182168b8b002d321965a": [6, 7], "batch_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "depth__c73885c5d5a4182168b8b002d321965a": [6, 7], "dropout__c73885c5d5a4182168b8b002d321965a": [6, 7], "features_generator__c73885c5d5a4182168b8b002d321965a": [6, 7], "ffn_hidden_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "ffn_num_layers__c73885c5d5a4182168b8b002d321965a": [6, 7], "final_lr_ratio_exp__c73885c5d5a4182168b8b002d321965a": [6, 7], "hidden_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "init_lr_ratio_exp__c73885c5d5a4182168b8b002d321965a": [6, 7], "max_lr_exp__c73885c5d5a4182168b8b002d321965a": [6, 7], "warmup_epochs_ratio__c73885c5d5a4182168b8b002d321965a": [6, 7], "c73885c5d5a4182168b8b002d321965a": [6, 7], "371": [6, 7], "46875": [6, 7], "ensemble_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "epochs__c73885c5d5a4182168b8b002d321965a": [6, 7], "cp_pred_dropout": [6, 7], "cp_uncert_dropout": [6, 7], "proabil": [6, 7], "va_predict": [6, 7], "correl": [6, 7, 8], "drouput": [6, 7], "uncertatinti": [6, 7], "cp_uncert_delta": [6, 7], "categor": [6, 7, 13], "unit": [6, 7, 8], "parsabl": [6, 7], "cast": [6, 7], "appropri": [6, 7], "befor": [6, 7, 8, 13], "choic": [6, 7, 13], "346": [6, 7], "391": [6, 7], "582": [6, 7], "4259": 6, "713886871285": 6, "mapie_algorithm_hash": [6, 7], "976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "mapie_alpha__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "max_depth__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "n_estimators__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "max_features__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "analysi": [6, 7, 8, 9], "perfom": [6, 7], "post": [6, 7], "mapie_pr": [6, 7], "mapie_unc": [6, 7], "bar": [6, 7], "visualis": [6, 7], "errorbar": [6, 7], "yerr": [6, 7], "ab": [6, 7], "fmt": [6, 7], "black": [6, 7, 8], "ecolor": [6, 7], "grai": [6, 7], "elinewidth": [6, 7], "capsiz": [6, 7], "move": [6, 7, 11], "analys": [6, 7, 8], "width": [6, 7, 8], "alpha_impact": [6, 7], "ma": [6, 7], "unc_df": [6, 7], "unc": [6, 7], "reset_index": [6, 7, 8], "concat": [6, 7], "lineplot": [6, 7], "err_styl": [6, 7], "se": [6, 7], "incorpor": [6, 7], "tradition": [6, 7], "unsupport": [6, 7], "kernelexplain": [6, 7, 9], "shaplei": [6, 7], "explan": [6, 7], "slundberg": [6, 7], "game": [6, 7], "credit": [6, 7], "theori": [6, 7], "publish": [6, 7], "comopsit": [6, 7], "101": [6, 7], "146": 6, "_ridg": [6, 7], "243": [6, 7], "userwarn": [6, 7, 8], "singular": [6, 7], "matrix": [6, 7], "dual": [6, 7], "578": 6, "36553318492385256": 6, "9346053663473015": 6, "dga": [6, 7], "dgp": [6, 7], "dgtot": [6, 7], "sa": [6, 7], "sdc": [6, 7], "sdx": [6, 7], "numhacceptor": [6, 7], "numhdonor": [6, 7], "maxabsestateindex": [6, 7], "maxestateindex": [6, 7], "minabsestateindex": [6, 7], "minestateindex": [6, 7], "qed": [6, 7], "sp": [6, 7], "heavyatommolwt": [6, 7], "exactmolwt": [6, 7], "numvalenceelectron": [6, 7], "numradicalelectron": [6, 7], "maxpartialcharg": [6, 7], "minpartialcharg": [6, 7], "maxabspartialcharg": [6, 7], "minabspartialcharg": [6, 7], "fpdensitymorgan1": [6, 7], "fpdensitymorgan2": [6, 7], "fpdensitymorgan3": [6, 7], "bcut2d_mwhi": [6, 7], "bcut2d_mwlow": [6, 7], "bcut2d_chghi": [6, 7], "bcut2d_chglo": [6, 7], "bcut2d_logphi": [6, 7], "bcut2d_logplow": [6, 7], "bcut2d_mrhi": [6, 7], "bcut2d_mrlow": [6, 7], "avgipc": [6, 7], "balabanj": [6, 7], "bertzct": [6, 7], "chi0": [6, 7], "chi0n": [6, 7], "chi0v": [6, 7], "chi1": [6, 7], "chi1n": [6, 7], "chi1v": [6, 7], "chi2n": [6, 7], "chi2v": [6, 7], "chi3n": [6, 7], "chi3v": [6, 7], "chi4n": [6, 7], "chi4v": [6, 7], "hallkieralpha": [6, 7], "ipc": [6, 7], "kappa1": [6, 7], "kappa2": [6, 7], "kappa3": [6, 7], "labuteasa": [6, 7], "peoe_vsa1": [6, 7], "peoe_vsa10": [6, 7], "peoe_vsa11": [6, 7], "peoe_vsa12": [6, 7], "peoe_vsa13": [6, 7], "peoe_vsa14": [6, 7], "peoe_vsa2": [6, 7], "peoe_vsa3": [6, 7], "peoe_vsa4": [6, 7], "peoe_vsa5": [6, 7], "peoe_vsa6": [6, 7], "peoe_vsa7": [6, 7], "peoe_vsa8": [6, 7], "peoe_vsa9": [6, 7], "smr_vsa1": [6, 7], "smr_vsa10": [6, 7], "smr_vsa2": [6, 7], "smr_vsa3": [6, 7], "smr_vsa4": [6, 7], "smr_vsa5": [6, 7], "smr_vsa6": [6, 7], "smr_vsa7": [6, 7], "smr_vsa8": [6, 7], "smr_vsa9": [6, 7], "slogp_vsa1": [6, 7], "slogp_vsa10": [6, 7], "slogp_vsa11": [6, 7], "slogp_vsa12": [6, 7], "slogp_vsa2": [6, 7], "slogp_vsa3": [6, 7], "slogp_vsa4": [6, 7], "slogp_vsa5": [6, 7], "slogp_vsa6": [6, 7], "slogp_vsa7": [6, 7], "slogp_vsa8": [6, 7], "slogp_vsa9": [6, 7], "estate_vsa1": [6, 7], "estate_vsa10": [6, 7], "estate_vsa11": [6, 7], "estate_vsa2": [6, 7], "estate_vsa3": [6, 7], "estate_vsa4": [6, 7], "estate_vsa5": [6, 7], "estate_vsa6": [6, 7], "estate_vsa7": [6, 7], "estate_vsa8": [6, 7], "estate_vsa9": [6, 7], "vsa_estate1": [6, 7], "vsa_estate10": [6, 7], "vsa_estate2": [6, 7], "vsa_estate3": [6, 7], "vsa_estate4": [6, 7], "vsa_estate5": [6, 7], "vsa_estate6": [6, 7], "vsa_estate7": [6, 7], "vsa_estate8": [6, 7], "vsa_estate9": [6, 7], "fractioncsp3": [6, 7], "heavyatomcount": [6, 7], "nhohcount": [6, 7], "nocount": [6, 7], "numaliphaticcarbocycl": [6, 7], "numaliphaticheterocycl": [6, 7], "numaliphaticr": [6, 7], "numaromaticcarbocycl": [6, 7], "numaromaticheterocycl": [6, 7], "numaromaticr": [6, 7], "numheteroatom": [6, 7], "numrotatablebond": [6, 7], "numsaturatedcarbocycl": [6, 7], "numsaturatedheterocycl": [6, 7], "numsaturatedr": [6, 7], "ringcount": [6, 7], "mollogp": [6, 7], "molmr": [6, 7], "fr_al_coo": [6, 7], "fr_al_oh": [6, 7], "fr_al_oh_notert": [6, 7], "fr_arn": [6, 7], "fr_ar_coo": [6, 7], "fr_ar_n": [6, 7], "fr_ar_nh": [6, 7], "fr_ar_oh": [6, 7], "fr_coo": [6, 7], "fr_coo2": [6, 7], "fr_c_o": [6, 7], "fr_c_o_nocoo": [6, 7], "fr_c_": [6, 7], "fr_hoccn": [6, 7], "fr_imin": [6, 7], "fr_nh0": [6, 7], "fr_nh1": [6, 7], "fr_nh2": [6, 7], "fr_n_o": [6, 7], "fr_ndealkylation1": [6, 7], "fr_ndealkylation2": [6, 7], "fr_nhpyrrol": [6, 7], "fr_sh": [6, 7], "fr_aldehyd": [6, 7], "fr_alkyl_carbam": [6, 7], "fr_alkyl_halid": [6, 7], "fr_allylic_oxid": [6, 7], "fr_amid": [6, 7], "fr_amidin": [6, 7], "fr_anilin": [6, 7], "fr_aryl_methyl": [6, 7], "fr_azid": [6, 7], "fr_azo": [6, 7], "fr_barbitur": [6, 7], "fr_benzen": [6, 7], "fr_benzodiazepin": [6, 7], "fr_bicycl": [6, 7], "fr_diazo": [6, 7], "fr_dihydropyridin": [6, 7], "fr_epoxid": [6, 7], "fr_ester": [6, 7], "fr_ether": [6, 7], "fr_furan": [6, 7], "fr_guanido": [6, 7], "fr_halogen": [6, 7], "fr_hdrzine": [6, 7], "fr_hdrzone": [6, 7], "fr_imidazol": [6, 7], "fr_imid": [6, 7], "fr_isocyan": [6, 7], "fr_isothiocyan": [6, 7], "fr_keton": [6, 7], "fr_ketone_topliss": [6, 7], "fr_lactam": [6, 7], "fr_lacton": [6, 7], "fr_methoxi": [6, 7], "fr_morpholin": [6, 7], "fr_nitril": [6, 7], "fr_nitro": [6, 7], "fr_nitro_arom": [6, 7], "fr_nitro_arom_nonortho": [6, 7], "fr_nitroso": [6, 7], "fr_oxazol": [6, 7], "fr_oxim": [6, 7], "fr_para_hydroxyl": [6, 7], "fr_phenol": [6, 7], "fr_phenol_noorthohbond": [6, 7], "fr_phos_acid": [6, 7], "fr_phos_est": [6, 7], "fr_piperdin": [6, 7], "fr_piperzin": [6, 7], "fr_priamid": [6, 7], "fr_prisulfonamd": [6, 7], "fr_pyridin": [6, 7], "fr_quatn": [6, 7], "fr_sulfid": [6, 7], "fr_sulfonamd": [6, 7], "fr_sulfon": [6, 7], "fr_term_acetylen": [6, 7], "fr_tetrazol": [6, 7], "fr_thiazol": [6, 7], "fr_thiocyan": [6, 7], "fr_thiophen": [6, 7], "fr_unbrch_alkan": [6, 7], "fr_urea": [6, 7], "shap_valu": [6, 7], "2227": [6, 7], "042517e": 6, "2229": [6, 7], "025057e": 6, "2228": [6, 7], "804876e": 6, "2267": [6, 7], "372192e": 6, "00": [6, 7], "2230": [6, 7], "106846e": 6, "352611e": 6, "1375": 6, "1376": 6, "s1": 6, "n1c": [6, 7], "1784": 6, "1785": 6, "995": 6, "1617": 6, "1618": 6, "1570": [6, 7], "contrinubt": [6, 7], "datset": [6, 7], "unscaledphyschemjazzi": [6, 7], "rank": [6, 7, 9], "053": 6, "742": 6, "t": [6, 7, 8, 9, 10], "kekul": [6, 7], "unkekul": [6, 7], "rational": [6, 7], "rationale_scor": [6, 7], "097": [6, 7], "ch3": [6, 7], "ch": [6, 7], "389": [6, 7, 8], "151": [6, 7], "485": [6, 7], "c1c": [6, 7], "c1n": [6, 7], "ch2": [6, 7], "nh2": [6, 7], "565": [6, 7], "nn1cc1c": [6, 7], "c1cccc": [6, 7], "110": [6, 7], "997": [6, 7], "contian": [6, 7], "second": [6, 7], "dummi": [6, 7], "third": [6, 7], "smallest": [6, 7], "made": [6, 7, 8], "fourth": [6, 7], "irregularli": [6, 7], "xc50": [6, 7, 8], "log10": [6, 7, 8, 13, 15], "6th": [6, 7], "convers": [6, 7, 8, 13, 15], "logbas": [6, 7, 8, 13, 15], "logneg": [6, 7, 8, 13, 15], "negat": [6, 7, 8, 13, 15], "transformed_studi": [6, 7], "transform_exampl": [6, 7], "5959493772536109": 6, "6571993250300608": [6, 7], "426": 6, "1511102853256885": [6, 7], "516": 6, "2487063317112765": [6, 7], "6714912461080983": [6, 7], "2725944467796781": [6, 7], "606": [6, 7], "194926264155893": [6, 7], "7520919188596032": [6, 7], "748": 6, "7803723847416691": [6, 7], "764": [6, 7], "6397753979196248": [6, 7], "781": 6, "151110299986041": [6, 7], "798": 6, "151110111437006": [6, 7], "5410418750776741": [6, 7], "829": [6, 7], "7183231137124538": [6, 7], "845": [6, 7], "2721824844856162": [6, 7], "912": [6, 7], "19009294702225": [6, 7], "929": 6, "945": [6, 7], "5585323973564646": [6, 7], "3169218304262786": [6, 7], "028": 6, "7974925066137679": [6, 7], "045": 6, "218395226466336": [6, 7], "062": [6, 7], "1474226942497083": [6, 7], "066": [6, 7], "0239005731675412": [6, 7], "150": [6, 7], "169": [6, 7], "178901060853144": [6, 7], "187": 6, "27137790098830755": [6, 7], "206": [6, 7], "2710284516876423": [6, 7], "6273152492418945": [6, 7], "1900929470222508": [6, 7], "361": 6, "1907041717628215": [6, 7], "398": [6, 7], "3209075619139279": [6, 7], "403": 6, "2709423025014604": [6, 7], "438": [6, 7], "3133943310851415": [6, 7], "461": [6, 7], "257769959239938": [6, 7], "40359637945134746": 6, "658": 6, "4127882135896648": [6, 7], "663": 6, "734": [6, 7], "9246005133276612": [6, 7], "885": [6, 7], "8908739215746118": 6, "905": [6, 7], "107536316777608": [6, 7], "054360360588395": [6, 7], "964": 6, "5428179904345867": [6, 7], "983": 6, "5696273642213351": [6, 7], "007": [6, 7], "27099769667470536": [6, 7], "1580741708125475": [6, 7], "2709564785634315": [6, 7], "10900413894771653": [6, 7], "056": [6, 7], "2709799905898163": [6, 7], "13705914456987853": [6, 7], "080": [6, 7], "27097230608092054": [6, 7], "12790870116376127": [6, 7], "102": [6, 7], "2709499903064464": [6, 7], "10123180962907431": [6, 7], "2710895886052581": [6, 7], "26565663774320425": [6, 7], "149": 6, "2708711012023424": [6, 7], "005637048678674678": [6, 7], "174": [6, 7], "27092322402109364": [6, 7], "06902647427781451": [6, 7], "2712140349882": [6, 7], "4076704953178294": [6, 7], "27090080367174": [6, 7], "04187106800188596": [6, 7], "27086925247190047": [6, 7], "003371853599610078": [6, 7], "2708933298483799": [6, 7], "032781796328385376": [6, 7], "27087205624489635": [6, 7], "006806773659187283": [6, 7], "2708869511176179": [6, 7], "025009489814943348": [6, 7], "2711465077924297": [6, 7], "3311125627707556": [6, 7], "369": [6, 7], "2708756855936628": [6, 7], "011249102380159387": [6, 7], "395": [6, 7], "27087301924224993": [6, 7], "007985924302396141": [6, 7], "419": [6, 7], "2708685399954944": [6, 7], "00249856291483601": [6, 7], "444": [6, 7], "27121879554836553": [6, 7], "4130244908975993": [6, 7], "470": 6, "2708693196600531": [6, 7], "0034541978803366022": [6, 7], "27110195265802334": [6, 7], "27994943662091765": [6, 7], "2708682582859318": [6, 7], "0021532199144365088": [6, 7], "545": [6, 7], "27087024523986086": [6, 7], "0045884092728113585": [6, 7], "569": 6, "27087351807632193": [6, 7], "008596600952859433": [6, 7], "2710818633795896": [6, 7], "2567049271070902": [6, 7], "620": [6, 7], "27103241786565463": [6, 7], "1990111983307052": [6, 7], "2710350879598171": [6, 7], "20214459724424078": [6, 7], "2708688328221868": [6, 7], "00285750520671645": [6, 7], "697": [6, 7], "27100832234449684": [6, 7], "17064008990759916": [6, 7], "721": [6, 7], "27268613236193845": [6, 7], "8725420109733135": [6, 7], "747": [6, 7], "27119617446689237": [6, 7], "387533542012365": [6, 7], "773": 6, "2708691110831552": [6, 7], "0031985656730512953": [6, 7], "800": [6, 7], "27086852174155146": [6, 7], "002476186542950981": [6, 7], "27135383618835024": [6, 7], "5626643670396761": [6, 7], "2709819654433871": [6, 7], "1394077979875128": [6, 7], "2718548944510965": [6, 7], "0858347526799794": [6, 7], "1508084699212935": [6, 7], "03329943145150872": [6, 7], "00025672309762227527": [6, 7], "27249853374634975": [6, 7], "702026434077893": [6, 7], "27095660957755363": [6, 7], "10916094511173127": [6, 7], "987": [6, 7], "27102160995407715": [6, 7], "18630665884100353": [6, 7], "27095708822582026": [6, 7], "10973377642487026": [6, 7], "041": [6, 7], "27088222008661084": [6, 7], "019235980282946118": [6, 7], "2708703086029017": [6, 7], "004666043957133775": [6, 7], "27095279044622245": [6, 7], "1045877457096882": [6, 7], "2709408288690431": [6, 7], "09023455456986404": [6, 7], "152": [6, 7], "9289218260898663": [6, 7], "8200088368788958": [6, 7], "181": [6, 7], "27086675101898655": [6, 7], "00030502148265565063": [6, 7], "209": 6, "2710491243757999": [6, 7], "21858260742423916": [6, 7], "239": [6, 7], "1491615840508995": [6, 7], "024725853754515203": [6, 7], "2709462479577586": [6, 7], "0967427718847167": [6, 7], "default_studi": [6, 7], "837": [6, 7], "3501": [6, 7], "942111261296": [6, 7], "5451": [6, 7], "207265576796": [6, 7], "1049201007814": [6, 7], "9964": [6, 7], "541364058234": [6, 7], "003": [6, 7], "3543": [6, 7], "953608539901": [6, 7], "6837": [6, 7], "057544630979": [6, 7], "043": [6, 7], "2507": [6, 7], "1794330606067": [6, 7], "21534": [6, 7], "719219668405": [6, 7], "2899": [6, 7], "736555614694": [6, 7], "294e": [6, 7], "760e": [6, 7], "167": 6, "21674": [6, 7], "445000284228": [6, 7], "1049203123567": [6, 7], "1049192609138": [6, 7], "3630": [6, 7], "72768093756": [6, 7], "3431": [6, 7], "942816967268": [6, 7], "6908": [6, 7], "462045154488": [6, 7], "5964": [6, 7], "65935954044": [6, 7], "332": [6, 7], "21070": [6, 7], "107195348774": [6, 7], "348": 6, "4977": [6, 7], "068508997133": [6, 7], "8873": [6, 7], "669262669626": [6, 7], "21387": [6, 7], "63697424318": [6, 7], "9958": [6, 7], "573006910125": [6, 7], "463": [6, 7], "5182695600183": [6, 7], "467": [6, 7], "20684": [6, 7], "56412138056": [6, 7], "3435882510586": [6, 7], "7068": [6, 7], "705383113378": [6, 7], "613": 6, "7150": [6, 7], "482090052133": [6, 7], "680": [6, 7], "698": 6, "203": [6, 7], "93637462922368": [6, 7], "762": [6, 7], "779": [6, 7], "2570": [6, 7], "5111262532305": [6, 7], "21987": [6, 7], "659957192194": [6, 7], "9889": [6, 7], "493204596083": [6, 7], "819": [6, 7], "7172": [6, 7], "208490771303": [6, 7], "856": [6, 7], "9804": [6, 7], "512701665093": [6, 7], "881": [6, 7], "9165": [6, 7], "74081120673": [6, 7], "949": [6, 7], "543": [6, 7], "0280270800017": [6, 7], "161": [6, 7], "1602933782954": [6, 7], "888460860864": [6, 7], "109": 6, "8414": [6, 7], "932694243476": [6, 7], "2270": [6, 7], "540799189148": 6, "10383": [6, 7], "79559309305": [6, 7], "20815": [6, 7], "025469865475": [6, 7], "7560385808573": [6, 7], "244": 6, "5264": [6, 7], "4700789389035": [6, 7], "3668": [6, 7], "255064135424": [6, 7], "290": 6, "156": [6, 7], "12174877890536": [6, 7], "793408178086295": [6, 7], "99902820845678": [6, 7], "316": [6, 7], "371632749506": [6, 7], "88307313087517": [6, 7], "140915461519354": [6, 7], "340": [6, 7], "153": [6, 7], "66773675231477": [6, 7], "177324126813716": [6, 7], "77906017834145": [6, 7], "52056745848623": [6, 7], "4565714180547": [6, 7], "6710444346508": [6, 7], "392": [6, 8], "30976119334312": [6, 7], "62916671166313": [6, 7], "023639423189294": [6, 7], "418": [6, 7], "053696900694": [6, 7], "914617418880486": [6, 7], "31140591484044": [6, 7], "201": [6, 7], "33573874994386": [6, 7], "569769302718845": [6, 7], "5781354926491789": [6, 7], "190": [6, 7], "1384885119049": [6, 7], "87666716965626": [6, 7], "2537791489618": [6, 7], "076949848299": [6, 7], "9559574710535281": [6, 7], "0032830967319653665": [6, 7], "522": 6, "764974036324": [6, 7], "03910427457823": [6, 7], "406811480459925": [6, 7], "546": 6, "164": [6, 7], "4477304958181": [6, 7], "701690847791482": [6, 7], "819274780536123": [6, 7], "573": [6, 7], "87939164358104": [6, 7], "32187661108304": [6, 7], "660320437878754": [6, 7], "601": [6, 7], "01705178481896": [6, 7], "61397716361812": [6, 7], "603665957830847": [6, 7], "629": [6, 7], "155": [6, 7], "73257312230092": [6, 7], "759645965959294": [6, 7], "503212714246787": [6, 7], "656": [6, 7], "154": [6, 7], "46848394144124": [6, 7], "8546740801317": [6, 7], "35327336610912": [6, 7], "683": 6, "20421802817864": [6, 7], "57596974747163": [6, 7], "84756262407801": [6, 7], "709": 6, "51233215278089": [6, 7], "3564642040401464": [6, 7], "5034542273159819": [6, 7], "68667089892196": [6, 7], "034895878929095": [6, 7], "03653571911285094": [6, 7], "52277054278186": [6, 7], "01961499216484045": [6, 7], "670937191883546": [6, 7], "28722475694815": [6, 7], "012434370509176538": [6, 7], "34222704431493": [6, 7], "816": [6, 7], "87402050281146": [6, 7], "008452015347522093": [6, 7], "914863578437455": [6, 7], "844": 6, "38847505937936": [6, 7], "01573542234868893": [6, 7], "99307522974174": [6, 7], "870": 6, "96336195786391": [6, 7], "009845516063879428": [6, 7], "59422914099683": [6, 7], "19345618324213": [6, 7], "009382525091504246": [6, 7], "35573659237662": [6, 7], "30772721342525": [6, 7], "010579672066291478": [6, 7], "35550323165882": [6, 7], "954": [6, 7], "23970902543148": [6, 7], "013369359066405863": [6, 7], "4744102498801": [6, 7], "984": 6, "34331248758777": [6, 7], "011398351701814368": [6, 7], "54146340620301": [6, 7], "104535853341": [6, 7], "011708779850509646": [6, 7], "682286191624579e": [6, 7], "040": [6, 7], "0653774146952": [6, 7], "009806826677473646": [6, 7], "90274406278985": [6, 7], "64646042813787": [6, 7], "0038598153381434685": [6, 7], "20918134828555": [6, 7], "68420472011734": [6, 7], "0032474576673554513": [6, 7], "35551178979624": [6, 7], "85985201823172": [6, 7], "003187930738019005": [6, 7], "29431603544847": [6, 7], "21583898009355": [6, 7], "003122319313153475": [6, 7], "83526418992966": [6, 7], "185": 6, "34787242859676": [6, 7], "002781955938462633": [6, 7], "76228981520067": [6, 7], "213": [6, 7], "194": [6, 7], "70914272129673": [6, 7], "0023173546614751305": [6, 7], "3000082904498813": [6, 7], "10492031097328": [6, 7], "002606064524407": [6, 7], "7861330234653922e": [6, 7], "1049154281806": [6, 7], "0029210589377408366": [6, 7], "200933937391094e": [6, 7], "10492028002287": [6, 7], "06431564840324226": [6, 7], "2981641934644904e": [6, 7], "56066541774658": [6, 7], "0010848843623839548": [6, 7], "151493073951163": [6, 7], "76337597039308": [6, 7], "004134805589645341": [6, 7], "88115336652716": [6, 7], "58009587759925": [6, 7], "004763418454688096": [6, 7], "02920758025023": [6, 7], "415": [6, 7], "113": [6, 7], "35230417583477": [6, 7], "0009098023238189749": [6, 7], "57100980886017": [6, 7], "445": [6, 7], "30807467406214": [6, 7], "03739791555156691": [6, 7], "12818940557025": [6, 7], "476": 6, "44100655116532": [6, 7], "006380481141720477": [6, 7], "4882351186755": [6, 7], "505": 6, "35181001564942": [6, 7], "0036244007454981787": [6, 7], "608797806921866": [6, 7], "533": 6, "124": [6, 7], "3719027482892": [6, 7], "0014198536004321608": [6, 7], "05588994284273": [6, 7], "562": [6, 7], "28568052794907": [6, 7], "005434972462746285": [6, 7], "215759789700954": [6, 7], "20325": [6, 7], "66479442037": [6, 7], "9696417046589247": [6, 7], "132": [6, 7], "21507621375022": [6, 7], "0004528978867024753": [6, 7], "80386923876023": [6, 7], "655": [6, 7], "85570350846885": [6, 7], "0016948043699497222": [6, 7], "455627755557016": [6, 7], "contrast": [6, 7, 8], "relplot": [6, 7], "col": [6, 7, 8], "facet_kw": [6, 7], "axisgrid": [6, 7, 8], "facetgrid": [6, 7], "0x7ff3a1d3ba30": 6, "noramlis": [6, 7], "unlog": [6, 7], "yield": [6, 7, 8, 13, 14], "mse": [6, 7], "1126": [6, 7], "56968721": [6, 7], "20237903": [6, 7], "revers": [6, 7, 8, 13, 15], "onto": [6, 7], "action": [6, 7], "importantli": [6, 7], "easili": [6, 7, 8], "94824194": [6, 7], "92008694": [6, 7], "instruct": [6, 7], "untransform": [6, 7], "wish": [6, 7], "cut": [6, 7, 8], "10um": [6, 7], "ptr_config_log_transform": [6, 7], "ptr_transformed_studi": [6, 7], "ptr_and_transform_exampl": [6, 7], "002341918451736244": 6, "0024908979029632677": [6, 7], "526": [6, 7], "007901407671048116": [6, 7], "00496231674623194": [6, 7], "585": [6, 7], "0026848278110363512": [6, 7], "0010872728889471893": [6, 7], "624": 6, "008706109201510277": [6, 7], "704": [6, 7], "002999462459688866": 6, "00825680029907454": [6, 7], "007901407993550248": [6, 7], "753": 6, "007901405163828307": [6, 7], "769": [6, 7], "0021653695362066753": [6, 7], "002869169486971014": [6, 7], "804": 6, "0010855652626111146": [6, 7], "867": [6, 7], "005505338042993082": [6, 7], "884": 6, "901": [6, 7], "002236800860454562": [6, 7], "955": [6, 7], "006105985607235417": [6, 7], "971": 6, "004846526544994462": [6, 7], "119": 6, "006964668794465202": [6, 7], "204": 6, "0029994624596888677": [6, 7], "222": [6, 7], "008384326901042542": [6, 7], "001082194093844804": [6, 7], "256": 6, "0010807084256204563": [6, 7], "321": 6, "338": [6, 7], "422": 6, "458": 6, "005247934991526694": [6, 7], "480": [6, 7], "0010803393728928605": [6, 7], "005218354425190125": [6, 7], "503": 6, "521": 6, "004999207507691546": [6, 7], "0015694919308122948": [6, 7], "0019757694194001397": 6, "664": [6, 7], "730": [6, 7], "002341918451736245": [6, 7], "00368328296527152": [6, 7], "003412828259848677": [6, 7], "836": [6, 7], "004412110711416997": [6, 7], "893": [6, 7], "0021743798524909573": [6, 7], "911": [6, 7], "0022761245849848527": [6, 7], "934": 6, "0010805768178458735": [6, 7], "959": 6, "001080400188305814": [6, 7], "982": 6, "0010805009783570441": [6, 7], "0010804680472500541": [6, 7], "030": [6, 7], "0010803723579987025": [6, 7], "001080969596032512": [6, 7], "0010800333715082816": [6, 7], "0010802574700236845": [6, 7], "0010814994986419817": [6, 7], "147": [6, 7], "001080161136846237": [6, 7], "0010800254136811547": [6, 7], "197": [6, 7], "0010801290036870739": [6, 7], "001080037482216557": [6, 7], "0010801015705851358": [6, 7], "0010812122378841013": [6, 7], "295": [6, 7], "0010800531021304936": [6, 7], "00108004162698813": [6, 7], "0010800223466649803": [6, 7], "0010815197263834202": [6, 7], "394": [6, 8], "0010800257029027847": [6, 7], "0010810223438672223": [6, 7], "442": 6, "0010800211339555509": [6, 7], "0010800296871141684": [6, 7], "492": [6, 7], "0010800437739166451": [6, 7], "517": [6, 7], "0010809366267195716": [6, 7], "540": 6, "001080725386603206": [6, 7], "0010807368035830652": [6, 7], "0010800236072155854": [6, 7], "616": 6, "0010806223050773966": [6, 7], "642": [6, 7], "0010876516369772728": [6, 7], "669": 6, "00108142358144501": [6, 7], "0010800248050489667": [6, 7], "001080022268085466": [6, 7], "0010820922958715991": [6, 7], "771": [6, 7], "0010805094397523254": [6, 7], "0010841993753324146": [6, 7], "826": 6, "007899735988203994": [6, 7], "853": 6, "0010868762004637347": [6, 7], "001080400750193767": [6, 7], "907": [6, 7], "0010806791616300314": [6, 7], "0010804028029753213": [6, 7], "962": [6, 7], "0010800812188506515": [6, 7], "0010800299598580359": [6, 7], "017": 6, "0010803843696362083": [6, 7], "047": 6, "001080333048974234": [6, 7], "001080014645182176": [6, 7], "129": [6, 7], "0010807968027851892": [6, 7], "007907028395366658": [6, 7], "0010803563024666294": [6, 7], "3506154": [6, 7], "inlin": [6, 7, 8], "timepoint": [6, 7, 9, 11], "aux_column": [6, 7, 9], "accord": [6, 7, 8, 9], "aux_col_config": [6, 7], "aux_descriptors_dataset": [6, 7], "train_with_conc": [6, 7], "aux1": [6, 7], "aux_col_studi": [6, 7], "covariate_exampl": [6, 7], "aux1_model": [6, 7], "904": 6, "946": 6, "070": 6, "5186": [6, 7], "76766395672": 6, "138": 6, "4679": [6, 7], "740824270968": [6, 7], "4890": [6, 7], "6705099499995": [6, 7], "276": [6, 7], "3803": [6, 7], "9324375833753": [6, 7], "291": [6, 7], "3135": [6, 7], "6497388676926": [6, 7], "2518812859375": [6, 7], "4309": [6, 7], "124112370974": [6, 7], "30159424580074": [6, 7], "4357": [6, 7], "02827013125": 6, "1437929337522": [6, 7], "45281013": [6, 7], "shape": [6, 7, 8, 9], "thrown": [6, 7, 9], "prediciton": [6, 7], "regardless": [6, 7], "utilis": [6, 7, 8], "seper": [6, 7], "vector_covariate_config": [6, 7], "precomputed_descriptor": [6, 7], "train_with_fp": [6, 7], "aux_transform": [6, 7, 9], "vector_covariate_studi": [6, 7], "vector_aux_exampl": [6, 7], "vector_covariate_model": [6, 7], "735": 6, "776": 6, "857": 6, "2200": [6, 7], "6817959410578": [6, 7], "011994365911634164": [6, 7], "95660880078": [6, 7], "029071783512897825": [6, 7], "5798": [6, 7], "564494725643": [6, 7], "022631709120790048": [6, 7], "2198637677605415": [6, 7], "2899178898048": [6, 7], "8916194399474267": [6, 7], "022": [6, 7], "647": [6, 7], "3336440433073": [6, 7], "5914093983615214": [6, 7], "050": [6, 7], "3036472748931": [6, 7], "6201811079699818": [6, 7], "068": 6, "3807": [6, 7], "8035919667395": [6, 7], "914e": [6, 7], "901e": [6, 7], "892e": [6, 7], "5019": [6, 7], "459500770764": [6, 7], "1376436589359351": [6, 7], "4017711284796": [6, 7], "797115414836": [6, 7], "74340620175102": [6, 7], "train_smil": [6, 7, 9], "train_i": [6, 7, 9], "train_aux": [6, 7, 9], "test_smil": [6, 7, 9], "test_i": [6, 7, 9], "test_aux": [6, 7, 9], "legth": [6, 7], "39754917": [6, 7], "06352766": [6, 7], "52031134": [6, 7], "89875316": [6, 7], "5516046": [6, 7], "85042171": [6, 7], "436": [6, 7], "33406203": [6, 7], "504": [6, 7], "91439129": [6, 7], "80585907": [6, 7], "48565041": [6, 7], "protein": [6, 7, 13, 15], "alongsid": [6, 7], "chemic": [6, 7, 8, 13, 14], "sequenc": [6, 7, 13, 15], "former": [6, 7], "wherea": [6, 7], "latter": [6, 7, 8], "interact": [6, 7], "basi": [6, 7, 8, 9], "toxinpred3": [6, 7], "mdlititwasvmvaftfslslvvwgrsgl": [6, 7], "ccsc": [6, 7], "cc1c": [6, 7, 8], "nh": [6, 7, 8], "cc1ccccc1": [6, 7], "ncc": [6, 7], "cccnc": [6, 7], "arrggvlnfgqfglqalecgfvtnr": [6, 7], "cs": [6, 7], "gwcgdpgatcgklrlyccsgacdcytktckdkssa": [6, 7], "n1": [6, 7], "ccc1": [6, 7], "ccccn": [6, 7], "cc1ccc": [6, 7], "ngnllggllrpvlgvvkgltgglgkk": [6, 7], "demponstr": [6, 7], "zscale_covariate_config": [6, 7], "zscale_covariate_studi": [6, 7], "zscale_aux_exampl": [6, 7], "zscale_covariate_model": [6, 7], "425": 6, "385": 6, "8735224395254063": [6, 7], "kneighborsclassifier_algorithm_hash": [6, 7], "e51ca55089f389fc37a736adb2aa0e42": [6, 7], "metric__e51ca55089f389fc37a736adb2aa0e42": [6, 7], "n_neighbors__e51ca55089f389fc37a736adb2aa0e42": [6, 7], "weights__e51ca55089f389fc37a736adb2aa0e42": [6, 7], "unlik": [6, 7], "31176471": [6, 7], "08058824": [6, 7], "27176471": [6, 7], "56470588": [6, 7], "62529412": [6, 7], "99521739": [6, 7], "59826087": [6, 7], "34695652": [6, 7], "03086957": [6, 7], "13391304": [6, 7], "08083333": [6, 7], "6125": [6, 7], "82916667": [6, 7], "05083333": [6, 7], "56083333": [6, 7], "93357143": [6, 7], "02785714": [6, 7], "04214286": [6, 7], "30461538": [6, 7], "55307692": [6, 7], "31307692": [6, 7], "11076923": [6, 7], "00846154": [6, 7], "1232": [6, 7], "3364": [6, 7], "2328": [6, 7], "1368": [6, 7], "2304": [6, 7], "7060": [6, 7], "7062": [6, 7], "x_": [6, 7], "vmin": [6, 7], "vmax": [6, 7], "cmap": [6, 7], "spectral": [6, 7], "248bit": [6, 7], "128bit": [6, 7], "minimz": [6, 7], "generaliz": [6, 7], "minimize_std_dev": [6, 7], "minimise_std_dev": [6, 7, 10], "std": [6, 7, 8, 13, 15], "dev": [6, 7, 8], "example_multi": [6, 7], "parameter_analysi": [6, 7], "set_metric_nam": [6, 7], "4008740644240856": [6, 7], "9876203329634794": 6, "673": 6, "3561484909673425": [6, 7], "9875061220991905": [6, 7], "725": 6, "7856521165563053": [6, 7], "21863029956806662": [6, 7], "9125905675311808": [6, 7], "7861693342190089": [6, 7], "850": [6, 7], "5238765412750027": [6, 7], "2789424384877304": [6, 7], "873": [6, 7], "5348363849100434": [6, 7], "5741725628917808": [6, 7], "894": 6, "0072511048320134": [6, 7], "2786318125997387": [6, 7], "9625764609276656": [6, 7], "27575381401822424": [6, 7], "973": [6, 7], "1114006274062536": [6, 7], "7647766019001522": [6, 7], "990": [6, 8], "7801680863916906": [6, 7], "2725738454485389": [6, 7], "785652116470164": [6, 7], "21863029955530786": [6, 7], "060": 6, "785651973436432": [6, 7], "21863032832257323": [6, 7], "075": [6, 7], "6101359993004856": [6, 7], "3011280543457062": [6, 7], "092": 6, "5361950698070447": [6, 7], "23560786523195643": [6, 7], "5356113574175657": [6, 7], "5769721187181905": [6, 7], "5434303669217287": 6, "5147474123466615": 6, "191": [6, 7], "5194661889628072": [6, 7], "40146744515282495": [6, 7], "659749443628722": 6, "6659085938841998": 6, "1068495306229729": [6, 7], "24457822094737378": [6, 7], "305": 6, "8604898820838102": [6, 7], "7086875504668667": [6, 7], "5919869916997383": [6, 7], "2367498627927979": [6, 7], "327": [6, 7], "2497762395862362": [6, 7], "10124660026536195": [6, 7], "399": 6, "study_name_1": [6, 7], "0621601907738047": [6, 7], "2749020946925899": [6, 7], "xxx": [6, 7], "values_neg_mean_squared_error": [6, 7], "values_standard": [6, 7], "twinx": [6, 7], "r": [6, 7, 9], "floor": [6, 7], "ceil": [6, 7], "align": [6, 7], "set_ytick": [6, 7], "linspac": [6, 7], "set_xtick": [6, 7], "text": [6, 7, 8, 9, 13], "pareto": [6, 7], "front": [6, 7], "plot_pareto_front": [6, 7], "plot_param_import": [6, 7], "dictionari": [6, 7, 11], "ordereddict": [6, 7], "descend": [6, 7], "algortihm": [6, 7], "impact": [6, 7, 9], "durat": [6, 7], "total_second": [6, 7], "target_nam": [6, 7], "relationship": [6, 7], "plot_parallel_coordin": [6, 7, 9, 10, 12], "param": [6, 7, 8, 10, 11], "taken": [6, 7, 8], "precomputed_config": [6, 7], "precomputed_studi": [6, 7], "precomputed_exampl": [6, 7], "precomputed_model": [6, 7], "3014": [6, 7], "274803630188": [6, 7], "481": 6, "471088599086": [6, 7], "03592375122963953": [6, 7], "519": 6, "3029": [6, 7], "113810544919": [6, 7], "8153295905650357": [6, 7], "618": 6, "4358": [6, 7], "575772003129": [6, 7], "unseen": [6, 7], "caus": [6, 7], "new_molecul": [6, 7], "tempfil": [6, 7], "temp": [6, 7, 8], "store": [6, 7, 8, 9, 12], "temporari": [6, 7, 11], "1st": [6, 7], "example_fp": [6, 7], "namedtemporaryfil": [6, 7], "temp_fil": [6, 7], "len": [6, 7, 8], "to_csv": [6, 7], "65709987": [6, 7], "64327077": [6, 7], "clean": [6, 7], "stage": [6, 7, 8], "workflow": [6, 7], "slurm": [6, 7, 9, 11], "leverag": [6, 7], "dynam": [6, 7, 9], "gpu": [6, 7], "customiz": [6, 7], "tailor": [6, 7], "customis": [6, 7], "export": [6, 7], "aid": [6, 7], "monitor": [6, 7], "pseudo": [6, 7, 9], "prospect": [6, 7, 9], "resubmiss": [6, 7, 11], "resubmit": [6, 7, 9], "modifi": [6, 7, 9], "enhanc": [6, 7], "parallel": [6, 7, 9], "simultan": [6, 7], "simul": [6, 7], "submit": [6, 7, 11], "verifi": [6, 7], "unittest": [6, 7], "mock": [6, 7], "patch": [6, 7, 8], "aml_arg": [6, 7], "prog": [6, 7], "argv": [6, 7], "systemexit": [6, 7], "functionila": [6, 7], "signific": [6, 7, 8], "thorough": [6, 7], "warehous": [6, 7], "databas": [6, 7], "flat": [6, 7], "compress": [6, 7], "natur": [6, 7, 8], "uniqu": [6, 7, 8], "106": 6, "ls": [6, 7], "lrth": [6, 7], "rw": [6, 7], "staff": [6, 7], "2k": [6, 7], "aug": [6, 7], "12k": [6, 7], "438b": [6, 7], "written": [6, 7], "undergon": [6, 7], "updat": [6, 7, 8], "trigger": [6, 7], "bash": [6, 7], "orchestr": [6, 7], "easi": [6, 7], "request": [6, 7], "exce": [6, 7], "50g": [6, 7], "retain": [6, 7, 9], "futur": [6, 7, 9], "example_automl": [6, 7], "workbook": [6, 7], "automl_exampl": [6, 7], "vv": [6, 7], "debug": [6, 7], "namespac": 6, "dry_run": [6, 9], "dgx": 6, "save_previous_model": [6, 9], "24_01_01": [6, 7], "042": [6, 7], "first_run": [6, 9], "processed_timepoint": [6, 7, 9], "044": 6, "checkskip": [6, 9], "tid1": [6, 7], "checkislock": [6, 9], "lockfil": 6, "lock": [6, 7, 9, 11], "taskcod": [6, 9], "046": [6, 7], "checkrunningslurmjob": [6, 9], "usr": [6, 7], "squeue": 6, "resubmitanyfailedjob": [6, 7, 9], "ran": 6, "submitjob": [6, 9], "054": 6, "ongo": 6, "took": 6, "024824142": 6, "055": [6, 7], "pid": 6, "posix": 6, "pidfil": 6, "0x7ff3f48a5cc0": 6, "scene": [6, 7], "sed": [6, 7], "togeth": [6, 7], "correctli": [6, 7, 9], "ingest": [6, 7], "meet": [6, 7], "quourum": [6, 7], "happen": [6, 7], "statu": [6, 7], "past": [6, 7, 11], "cron": [6, 7], "513": 6, "0x7ff3f48a5c00": 6, "enter": 6, "515": [6, 7], "524": [6, 7], "529": [6, 7], "534": 6, "535": [6, 7], "019070148": 6, "retir": [6, 7], "acut": [6, 7], "attempt": [6, 7], "insuffici": [6, 7, 9, 13], "emul": [6, 7, 8, 13, 14], "sucess": [6, 7], "shutil": [6, 7], "os": [6, 7, 8], "drd2_reg": [6, 7], "549": 6, "0x7ff3f48a5e40": 6, "552": 6, "556": [6, 7], "557": 6, "558": [6, 7], "576": 6, "processretrain": [6, 9], "fist": 6, "setprocessedtimepoint": [6, 9], "581": [6, 7], "getretrainingdata": [6, 9], "24_02_01": [6, 7], "586": [6, 7], "587": [6, 7], "592": [6, 7], "processtrain": [6, 9], "60g": [6, 7], "No": [6, 10, 11, 13], "writedataset": [6, 9], "wrote": 6, "608": 6, "writeslurm": [6, 9], "611": 6, "writejson": [6, 9], "612": [6, 7], "setjoblock": [6, 9], "lock_fil": 6, "614": 6, "062794924": 6, "proce": [6, 7], "datapoint": [6, 7, 8, 9, 11, 13, 14], "pseodu": [6, 7], "9zyw8gtc": 7, "tqdmwarn": 7, "iprogress": 7, "ipywidget": 7, "readthedoc": [7, 10], "en": [7, 10], "user_instal": 7, "autonotebook": 7, "notebook_tqdm": 7, "713": 7, "794": 7, "810": 7, "827": 7, "892": 7, "853455192818": 7, "048": 7, "112": 7, "404088878841": 7, "284": 7, "339": 7, "047015479678": 7, "459": 7, "559": 7, "143979828407": 7, "660": 7, "799": 7, "924": 7, "795596755263": 7, "193": 7, "212": 7, "297": 7, "9359502556013": 7, "482": 7, "507": 7, "530": 7, "553": 7, "637": 7, "661": 7, "785": 7, "899": 7, "999": 7, "037": 7, "288": 7, "355": 7, "420": 7, "514": 7, "596": 7, "635": 7, "676": 7, "821": 7, "963": 7, "262": 7, "joblib": [7, 9], "joblibcollisionwarn": 7, "collis": 7, "public_qptuna": 7, "_cached_cal": 7, "shelv": 7, "408": [7, 8], "3999": 7, "9364276424735": 7, "11270803112210707": 7, "81076443656638": 7, "3215970512413": 7, "4503197998963022": 7, "412900098594": 7, "0005181574946923789": 7, "025601513670726564": 7, "4941115157144": 7, "04539011914094239": 7, "0004375261377371938": 7, "758": 7, "2116": 7, "9335959003747": 7, "2124": 7, "9660426577593": 7, "1286": 7, "0769369193436": 7, "8784876169901574": 7, "839": 7, "1276": 7, "7802172741008": 7, "9512603410202876": 7, "2795207825823": 7, "9555128319114616": 7, "926": 7, "8121584310656": 7, "08008391330553266": 7, "942": 7, "277": 7, "22285881334636": 7, "950404670920864": 7, "340295864211": 7, "03834458564679112": 7, "0012347340743566007": 7, "025": 7, "3286": 7, "3458857183705": 7, "1671": 7, "978884132793": 7, "1617522685589332": 7, "466e": 7, "820e": 7, "2291": 7, "4431541048393": 7, "11135166203819158": 7, "218": 7, "3551": 7, "4754762175066": 7, "1703": 7, "5472682894215": 7, "9386828094838913": 7, "253": 7, "1595": 7, "6713281001928": 7, "1334174010640954": 7, "317": 7, "3057": 7, "0737441471406": 7, "335": 7, "358207737329": 7, "8045138424869749": 7, "406": 7, "3163": 7, "129883232068": 7, "745e": 7, "824e": 7, "473": 7, "00091009328474": 7, "03221878838522718": 7, "1306": 7, "5184610043127": 7, "7499005468308115": 7, "510": 7, "1262": 7, "6469892776183": 7, "0985974843950514": 7, "575": 7, "3059": 7, "470983832716": 7, "274": 7, "7005065089059": 7, "9093347536574419": 7, "3054": 7, "7066202193814": 7, "665": 7, "1325": 7, "4979657271272": 7, "5409105715354152": 7, "670": 7, "1814": 7, "6019641143478": 7, "3331": 7, "867542200907": 7, "2240": 7, "669934747297": 7, "828": 7, "8972970077489": 7, "6774731649874095": 7, "846": 7, "1879": 7, "2457309916924": 7, "8772717895282218": 7, "927": 7, "8197755321637": 7, "5177471708941157": 7, "499774083188": 7, "3690814560784887": 7, "012140477955952245": 7, "978": 7, "280": 7, "17463144475477": 7, "7022855415761313": 7, "69499953504345": 7, "7868425071077856": 7, "2174": 7, "0174962828364": 7, "2478696042156301": 7, "2733": 7, "5772576431627": 7, "275": 7, "9100107045787": 7, "9291713852865917": 7, "273": 7, "0829803041618": 7, "8837007827687249": 7, "144": 7, "49436461257073": 7, "9898473627215156": 7, "8855537592183": 7, "9765992415502778": 7, "30111488501615": 7, "9842537157445685": 7, "266": 7, "9084083294047": 7, "7700364511238211": 7, "08546968046016": 7, "7174555152957753": 7, "87394849447105": 7, "6657778446979243": 7, "57037115440716": 7, "6549600121936776": 7, "73632857486865": 7, "6012341182929566": 7, "8912182200218": 7, "610338208270851": 7, "8551585556689": 7, "608205745163954": 7, "2138932313906": 7, "5903994630391254": 7, "2415991435093": 7, "5908543043200158": 7, "258": 7, "9523786752699": 7, "5278661577890018": 7, "53897978343346": 7, "3779758893668723": 7, "508": [7, 9], "47213290450173": 7, "1905703564298876e": 7, "06884768780446": 7, "3682097961495725": 7, "583": 7, "39234737037964": 7, "336648765853807": 7, "619": 7, "49357359736462": 7, "3384792184834002": 7, "654": 7, "98988892704782": 7, "3472988458237292": 7, "4318590800788": 7, "3203044400907151": 7, "729": 7, "60939991827328": 7, "2896152552004716": 7, "57908944967576": 7, "3400204345244455": 7, "3328308520906": 7, "3355893292668126": 7, "89284193590962": 7, "2399635656610752": 7, "877": 7, "38938750703497": 7, "19357886055335": 7, "4997740789586": 7, "00020513916607513548": 7, "4326248941768776e": 7, "947": 7, "72495253431336": 7, "2374010908702786": 7, "16509356166648": 7, "1589849176145737": 7, "019": 7, "07682320089074": 7, "140733480213489": 7, "38922657607546": 7, "1460326309523254": 7, "096": 7, "48603723419197": 7, "1106769242312984": 7, "135": 7, "2330323343841": 7, "105401956026003": 7, "97865576673902": 7, "1000318093457389": 7, "232": 7, "01471657314468": 7, "0553438336940761": 7, "82080194631138": 7, "9715618816799196": 7, "49039871573063": 7, "9049680809556248": 7, "75568720888796": 7, "8917112780641941": 7, "52818001153125": 7, "8874420080681129": 7, "76711515271572": 7, "3506098555413268e": 7, "449": 7, "98946208159907": 7, "8769574977693346": 7, "490": 7, "9478946070053": 7, "8952523217347376": 7, "01732338929523": 7, "8965185664534796": 7, "567": 7, "7486972968999": 7, "8509681340315446": 7, "19689822636008": 7, "8810095036429842": 7, "26432510046484": 7, "8621657970877505": 7, "55052102161756": 7, "8680843345290663": 7, "56366099802298": 7, "7442205305129062": 7, "0644622341688": 7, "7150915543843963": 7, "796": 7, "093": 7, "12769795082909807": 7, "390": [7, 8], "446": 7, "464": 7, "750": 7, "916": 7, "117": 7, "136": 7, "159": 7, "178": 7, "183": 7, "337": 7, "00461414372160085": 7, "511": 7, "10220127407364965": 7, "579": 7, "089": 7, "148": 7, "903": 7, "977": 7, "272": 7, "628": 7, "126": 7, "365": 7, "393": 7, "860": 7, "08048357913360568": 7, "499": 7, "07632537970908462": 7, "08984764740598594": 7, "06847327885133497": 7, "07559783310619407": 7, "05514462099560352": 7, "061375603485350996": 7, "921": 7, "07939472167407403": 7, "0684392715056296": 7, "489": 7, "07494614575719116": 7, "07133468298392816": 7, "061875032318225075": 7, "07572085582137136": 7, "054237426197199234": 7, "299": 7, "331": 7, "6743": 7, "225992071741": 7, "584": 7, "944009132488": 7, "34392897437": 7, "086720713623": 7, "424": 7, "228032558769": 7, "456": 7, "16017644995": 7, "544": 7, "815": 7, "027": 7, "487": 7, "497": 7, "722": 7, "326": 7, "992": 7, "808": 7, "189": 7, "118": 7, "231": 7, "4253": 7, "872561867463": 7, "433": 7, "36708973607664297": 7, "006253064467624636": 7, "043440e": 7, "025864e": 7, "805554e": 7, "367604e": 7, "104342e": 7, "1496": 7, "052067e": 7, "1497": 7, "015542e": 7, "2234": 7, "387391e": 7, "862": 7, "140929e": 7, "863": 7, "083": 7, "143": 7, "472": 7, "595949377253611": 7, "943": 7, "033": 7, "172": 7, "325": 7, "417": 7, "488": [7, 9], "554": 7, "571": 7, "605": 7, "609": 7, "626": 7, "780": 7, "817": 7, "985": 7, "026": 7, "067": 7, "40359637945134724": 7, "214": 7, "5959493772536111": 7, "308": 7, "8908739215746114": 7, "413": 7, "493": 7, "537": 7, "651": 7, "674": 7, "791": 7, "840": 7, "887": 7, "065": 7, "162": 7, "313": 7, "364": 7, "675": 7, "702": 7, "333": 7, "353": 7, "548": 7, "932": 7, "988": 7, "111": 7, "304": 7, "396": [7, 8], "5407991891466": 7, "636": 7, "738": 7, "888": 7, "967": 7, "049": 7, "074": 7, "205": 7, "260": 7, "315": 7, "428": 7, "685": 7, "714": 7, "772": 7, "830": 7, "0x7fa8b811a5c0": 7, "594": 7, "633": 7, "935": 7, "013": 7, "063": 7, "114": 7, "409": 7, "528": 7, "547": 7, "639": 7, "662": 7, "717": 7, "001975769419400139": 7, "930": 7, "087": 7, "414": 7, "630": 7, "805": 7, "082": 7, "323": 7, "767663956718": 7, "028270131251": 7, "869": 7, "948": 7, "681": 7, "9876203329634793": 7, "543430366921729": 7, "514747412346662": 7, "610": 7, "6597494436287219": 7, "6659085938841999": 7, "644": 7, "682": 7, "643": 7, "752": 7, "919": 7, "qptuna": [7, 11], "usernam": 7, "hous": 7, "103": 7, "104": 7, "tb": 7, "assess": [7, 8], "frequent": 7, "slurm_update_models_parallel": 7, "qsartuna_automl": 7, "j": [7, 9], "12g": 7, "your_path": 7, "update_it": 7, "hourli": 7, "common": 8, "proper": 8, "process": [8, 9, 11], "functionail": 8, "configur": [8, 9, 10, 11, 12], "draw": 8, "ipythonconsol": 8, "ipython": 8, "displai": 8, "listdir": 8, "isfil": 8, "walk": 8, "handi": 8, "med": 8, "titles": 8, "fontsiz": 8, "labels": 8, "xtick": 8, "ytick": 8, "rcparam": 8, "v0_8": 8, "whitegrid": 8, "set_styl": 8, "white": 8, "boolean": 8, "nomin": 8, "convert": [8, 9, 13], "conduct": 8, "primarydf": 8, "loadsdf": 8, "inchi": 8, "skeletonspher": 8, "nm": 8, "id": 8, "romol": 8, "ic50": 8, "\u00b5m": 8, "c1ccc2c": 8, "co2": 8, "004320939": 8, "1s": 8, "c8h7no2": 8, "c10": 8, "qrcgftxrxymjo": 8, "uhfffaoysa": 8, "86075": 8, "kinas": 8, "p38": 8, "rdchem": 8, "0x7f9ca0112340": 8, "c1ccc": 8, "ccc2ccccc2occ3ccc": 8, "882397308": 8, "c22h20o3": 8, "c23": 8, "ytdaoqyeyfcini": 8, "89637": 8, "kd": 8, "retinoid": 8, "receptor": 8, "0x7f9c808beff0": 8, "130299026": 8, "0x7f9c808bf060": 8, "48148606": 8, "c9h7no": 8, "c11": 8, "lisfmebwquvkpj": 8, "n93": 8, "n82": 8, "n65": 8, "n36": 8, "n33": 8, "ki": 8, "nki": 8, "carbon": 8, "anhydras": 8, "xii": 8, "ncarbon": 8, "0x7f9c808bf0d0": 8, "nc1ccccn1": 8, "c7h8n2o": 8, "h2": 8, "5h": 8, "qrokotbwfzitjz": 8, "86233": 8, "nicotin": 8, "phosphoribosyltransferas": 8, "0x7f9c808bf140": 8, "renam": 8, "conveni": [8, 9, 10, 13], "rest": 8, "moltosmil": 8, "isomericsmil": 8, "c1coc2ccccc2n1": 8, "004321": 8, "coc2ccccc2ccc2ccccc2": 8, "882397": 8, "130299": 8, "c1ccc2ccccc2": 8, "481486": 8, "stick": 8, "engin": 8, "assum": [8, 13, 14], "slightli": 8, "pose": 8, "wise": 8, "outlin": 8, "occurr": 8, "preserv": 8, "vari": 8, "recommend": 8, "abil": 8, "being": 8, "version": [8, 9, 10], "df_po": 8, "dedup": [8, 13], "df_rnd": 8, "df_max": 8, "df_avg": 8, "df_med": 8, "deduplidc": 8, "397": 8, "indici": 8, "coc1cc2ncnc": 8, "nc3ccc": 8, "scc4ccccc4": 8, "cl": 8, "c3": 8, "c2cc1oc": 8, "282579": 8, "912929": 8, "cc1cccc": 8, "nc2ncnc3ccc": 8, "c4ccccc4": 8, "cc23": 8, "n2cc": 8, "cc2c": 8, "nc2cccc": 8, "n2": 8, "065502": 8, "958607": 8, "oc2cccc": 8, "cn1nc": 8, "c2cnc": 8, "c3ccc": 8, "nc1c1": 8, "oc1nc": 8, "oc2cc": 8, "c3ccccc3": 8, "c3cccc": 8, "cn": 8, "936291": 8, "359": 8, "minim": [8, 10], "densiti": 8, "dpi": 8, "kdeplot": 8, "fill": 8, "orang": 8, "ndigit": 8, "blue": 8, "keepaverag": 8, "deeppink": 8, "hold": [8, 9], "aim": 8, "simpli": 8, "sai": 8, "veri": 8, "intern": [8, 11], "resembl": 8, "easiest": 8, "especi": 8, "reli": 8, "stochast": 8, "train_ran": 8, "test_ran": 8, "time_column": 8, "old": [8, 9], "accru": 8, "entri": [8, 13, 14], "timestamp": 8, "top": 8, "df_med_tempor": 8, "fake": 8, "nccccccoc1ccc2c": 8, "n1cc": 8, "684240": 8, "1037": 8, "481464": 8, "1036": 8, "c1cn": 8, "n2c": 8, "nc3cccc": 8, "n3": 8, "cc3cc3": 8, "732625": 8, "1035": 8, "568332": 8, "1034": 8, "790259": 8, "1033": 8, "train_tempor": 8, "test_tempor": 8, "highli": 8, "skew": 8, "fd": [8, 13, 14], "histogram": [8, 13, 14], "determin": [8, 13, 14], "balanc": 8, "fd_merg": [8, 13, 14], "train_str": 8, "test_str": 8, "realist": 8, "deplopi": 8, "hop": 8, "opportun": 8, "seri": 8, "push": 8, "domain": 8, "realibl": 8, "challeng": 8, "scaf_split": 8, "train_sca": 8, "test_sca": 8, "ground": 8, "df_val": 8, "roughli": [8, 10], "evid": 8, "pronounc": 8, "dodgerblu": 8, "middl": 8, "saffold": 8, "discuss": 8, "propreti": 8, "endpoint": 8, "routin": 8, "linearis": 8, "variat": 8, "gaussian": 8, "realiti": 8, "nearli": 8, "exhibit": 8, "superior": 8, "wide": 8, "xc50_data": 8, "keepallnodedupl": [8, 13], "pxc50_data": 8, "zip": 8, "jointplot": 8, "suptitl": 8, "plot_margin": 8, "rugplot": 8, "crimson": 8, "height": 8, "clip_on": 8, "jointgrid": 8, "0x7f9ca05ade10": 8, "heteroscedast": 8, "homoscedast": 8, "transorm": 8, "0x7f9c458f85e0": 8, "logartihm": 8, "power": [8, 13, 15], "um": 8, "dataset_transform": 8, "THe": 8, "0x7f9ca05aeb30": 8, "had": 8, "reverse_transform": [8, 13], "0x7f9c926f8970": 8, "mervin": 8, "framework": [8, 9], "somewher": 8, "unavoid": 8, "ideal": 8, "deviat": [8, 13, 15], "\u03c3": 8, "heterogen": 8, "versu": 8, "assimil": 8, "hypothesi": 8, "degre": 8, "p_": 8, "activityt": 8, "cumul": 8, "cdf": 8, "eq": 8, "equal": [8, 10], "delta": 8, "vec": 8, "frac": 8, "erf": 8, "overrightarrow": 8, "sigma": 8, "concret": 8, "arbitrari": 8, "unknown": [8, 11], "therefor": [8, 9], "schemat": 8, "lookup": 8, "tabl": 8, "sd": 8, "scenario": [8, 13, 14], "philosoph": 8, "delimit": [8, 13, 15], "operand": 8, "censor": 8, "far": 8, "granular": 8, "therebi": 8, "combin": [8, 9], "becom": 8, "jcheminf": 8, "biomedcentr": 8, "1186": 8, "s13321": 8, "00539": 8, "sec12": 8, "pxc50_threshold": 8, "pxc50_std": 8, "exmapl": 8, "ptr_data": 8, "gather": 8, "certainti": 8, "lower_reproduc": 8, "upper_reproduc": 8, "dataload": 8, "somewhat": 8, "invert": 8, "bell": 8, "kde": 8, "behav": 8, "mpatch": 8, "line2d": 8, "ax_joint": 8, "axhlin": 8, "linestyl": 8, "ax_marg_i": 8, "ax_marg_x": 8, "axvlin": 8, "region": 8, "uncert_color": 8, "purpl": 8, "uncert_region": 8, "rectangl": 8, "add_patch": 8, "box": 8, "nthreshold": 8, "nptr": 8, "nregion": 8, "fancybox": 8, "borderaxespad": 8, "leg": 8, "get_legend": 8, "legend_handl": 8, "set_alpha": 8, "set_color": 8, "tight": 8, "layout": 8, "subplots_adjust": 8, "set_size_inch": 8, "var": 8, "1v": 8, "9y_z128d7gvcp8mf8q0pz3ch0000gq": 8, "ipykernel_33301": 8, "3093832163": 8, "cannot": 8, "enough": [8, 9], "accommod": 8, "decor": 8, "dash": 8, "shade": 8, "histrogram": 8, "clip": 8, "aforement": 8, "ptrtransform": [8, 13, 15], "ptr_transform": 8, "histplot": 8, "stat": 8, "scipi": 8, "resp_col": [8, 9], "pearsonr": 8, "std_df": 8, "groupbi": 8, "mdn_df": 8, "std_vs_median": 8, "suffix": 8, "_std": 8, "_median": 8, "dropna": 8, "activity_std": 8, "activity_median": 8, "088539": 8, "674782": 8, "265123": 8, "138620": 8, "157605": 8, "stdev": 8, "stat_func": 8, "plot_joint": 8, "zorder": 8, "0x7f9be19abaf0": 8, "assumpt": 8, "fulfil": 8, "ptr_train_ran": 8, "ptr_test_ran": 8, "ptr_train_str": 8, "ptr_test_str": 8, "ptr_train_tempor": 8, "ptr_test_tempor": 8, "ptr_train_sca": 8, "ptr_test_sca": 8, "warn_singular": 8, "xlim": 8, "peak": 8, "extem": 8, "dsitribut": 8, "awai": 8, "bias": 8, "enum": [9, 10, 11, 13], "building_configuration_enum": [9, 11], "configuration_enum": [9, 11], "interface_enum": [9, 11], "model_runner_enum": [9, 11], "objective_enum": [9, 11], "optimization_configuration_enum": [9, 11], "prediction_configuration_enum": [9, 11], "return_values_enum": [9, 11], "visualization_enum": [9, 11], "modelautoml": 9, "smiles_col": [9, 11, 13, 14], "activity_col": 9, "task_col": 9, "timestr": 9, "20240828": 9, "171643": 9, "modeldispatch": 9, "pend": 9, "last_timepoint": 9, "getallretrainingdata": 9, "wilcard": 9, "datetim": 9, "unprocess": 9, "bucket": 9, "nonewretrainingdata": [9, 11], "setretrainingdata": 9, "initprocessedtimepoint": 9, "cfg": 9, "initial_templ": 9, "retrain_templ": 9, "slurm_templ": 9, "slurm_al_smil": 9, "slurm_partit": 9, "log_conf": 9, "checkifretrainingprocess": 9, "unabl": 9, "static": 9, "calcslurmmem": 9, "len_fil": 9, "setdispatchervari": 9, "overwrit": 9, "_taskcode_df": 9, "attribut": 9, "prev": 9, "processquorum": 9, "_input_df": 9, "istrain": 9, "checksavetemporalmodel": 9, "dotemporalpredict": 9, "new_data": 9, "out_df": 9, "setskippedtimepoint": 9, "elig": 9, "checkslurmstatusandnextprocedur": 9, "cancel": 9, "increasejobtim": 9, "increasejobmem": 9, "max_mem": 9, "increasejobcpu": 9, "max_cpu": 9, "addslurmretri": 9, "getslurmretri": 9, "locked_job": 9, "max_retri": 9, "process_retraining_task": 9, "dispatcher_process": 9, "global_cfg": 9, "validate_arg": 9, "prepare_dispatch": 9, "merge_train_and_test_data": 9, "isvalid": 9, "read_data": 9, "aux_col": 9, "invalid": 9, "pars": [9, 10, 12], "tupl": [9, 13, 14], "ambigu": 9, "smiles_": 9, "y_": [9, 11, 13], "aux_": 9, "factori": [9, 10], "intermediate_training_dataset_fil": 9, "intermediate_test_dataset_fil": 9, "get_merged_set": 9, "check_set": 9, "scalingfittingerror": 9, "descriptor_str": 9, "unfittedsklearnscla": [9, 13], "novalidsmil": 9, "mol_from_smi": 9, "numpy_from_rdkit": 9, "dtype": [9, 13], "moldescriptor": 9, "nameparameterdataclass": [9, 10, 13], "abc": [9, 10, 13], "abstract": [9, 10, 13], "parallel_compute_descriptor": 9, "amorprot": [9, 13], "ecfp6": 9, "seq": 9, "pathlib": 9, "get_fitted_scaler_for_fp": 9, "saved_param": 9, "get_fitted_scal": 9, "minhash": 9, "chiral": 9, "orsi": 9, "map4": 9, "unifi": 9, "percept": 9, "benchmark": 9, "cip": 9, "highest": 9, "disproportion": 9, "affect": [9, 13], "maxradiu": [9, 12], "npermut": [9, 12], "permut": 9, "set_unfitted_scaler_data": 9, "fp_info": 9, "canonicalsmil": 9, "scaffold": [9, 13, 14], "genericscaffold": 9, "validdescriptor": 9, "descriptor_from_config": 9, "return_failed_idx": 9, "score_al": 9, "get_scor": 9, "score_all_smil": 9, "get_train_test_scor": 9, "get_merged_train_scor": 9, "get_ecfp_fpinfo": 9, "get_ecfpcount_fpinfo": 9, "explain_ecfp": 9, "len_feat": 9, "get_fp_info": 9, "exp_df": 9, "fp_idx": 9, "strt_idx": 9, "runshap": 9, "x_pred": 9, "shapexplain": 9, "popul": 9, "explainpr": 9, "shallow": 9, "validate_cls_input": 9, "pi_zero": 9, "pr": 9, "melloddi": 9, "sparsechem": 9, "imbal": 9, "bedroc_scor": [9, 10], "truchon": 9, "bayli": 9, "screen": 9, "bad": 9, "recognit": 9, "2007": 9, "concord": 9, "statist": 9, "qualiti": 9, "harald": 9, "On": 9, "surviv": 9, "bound": 9, "2008": 9, "1209": 9, "1216": 9, "api": 9, "posterior": 9, "mark": 9, "abstractmethod": [9, 10], "predict_uncert": 9, "quantifi": 9, "qsartunamodel": 9, "nonetyp": [9, 10], "sent": 9, "get_metadata": 9, "train_scor": [9, 12], "test_scor": [9, 11, 12], "get_transform": 9, "perform_ptr": 9, "wrap_model": 9, "save_model": 9, "novaliddescriptor": 9, "null_scor": 9, "argserror": 9, "issu": [9, 11, 13], "uncertaintyerror": 9, "auxcovariatemiss": 9, "precomputederror": 9, "validate_uncertainti": 9, "check_precomp_arg": 9, "set_inference_param": 9, "desc": [9, 10], "validate_set_precomput": 9, "validate_aux": 9, "doctitl": 9, "docstr": 9, "type_base_schema": 9, "tp": 9, "wyfo": 9, "json_schema": 9, "patch_schema_gener": 9, "patch_schema_optunaz": 9, "split_optim": 9, "base_chemprop_param": 9, "pop": 9, "run_studi": 9, "storag": [9, 12], "trial_number_offset": [9, 11], "log_scor": 9, "main_scor": 9, "outfnam": 9, "plot_by_configur": 9, "conf": 9, "plot_slic": [9, 10, 12], "folder_path": 9, "file_format": [9, 10, 12], "png": [9, 10], "plot_contour": [9, 10, 12], "plot_histori": [9, 10, 12], "set_build_cach": 10, "preexist": 10, "remove_algo_hash": 10, "buildconfig_from_tri": 10, "encode_nam": 10, "cenam": 10, "suggest_alg_param": 10, "suggest_aux_param": 10, "check_invalid_descriptor_param": 10, "adaboostclassifierparamet": 10, "lassoparamet": 10, "kneighborsclassifierparamet": 10, "kneighborsregressorparamet": 10, "logisticregressionparamet": 10, "plsparamet": 10, "randomforestparamet": 10, "ridgeparamet": 10, "svcparamet": 10, "svrparamet": 10, "xgbregressorparamet": 10, "prfclassifierparamet": 10, "bootstrap": 10, "new_syn_data_frac": 10, "chempropregressorparamet": 10, "chempropclassifierparamet": 10, "chempropregressorpretrainedparamet": 10, "chemprophyperoptclassifierparamet": 10, "chemprophyperoptregressorparamet": 10, "calibratedclassifiercvparamet": 10, "mapieparamet": 10, "regressionscor": 10, "classificationscor": 10, "closer": 10, "greater": 10, "manhattan": 10, "trainarg": 10, "tanh": 10, "leakyrelu": 10, "prelu": 10, "selu": 10, "elu": 10, "morgan_count": 10, "rdkit_2d": 10, "rdkit_2d_norm": 10, "mpnn_first_ffn": 10, "mpnn_last_ffn": 10, "linked_hidden_s": 10, "constrain": 10, "l3": 10, "init_lr_exp": 10, "final_lr_exp": 10, "warmup_epoch": 10, "l4": 10, "l5": 10, "l6": 10, "l7": 10, "l8": 10, "isanyof": 10, "obj": [10, 11], "detect_mode_from_alg": 10, "copy_path_for_scaled_descriptor": 10, "cv_split_strategi": 10, "use_cach": 10, "optuna_storag": 10, "set_cach": 10, "set_algo_hash": 10, "declar": 10, "pydant": 10, "don": 10, "classmethod": 10, "1024": 10, "shorter": 10, "output_fold": [10, 12], "use_xvfb": [10, 12], "imagefileformat": 10, "jpeg": 10, "jpg": 10, "svg": 10, "move_up_directori": 11, "attach_root_path": 11, "attach": 11, "loadjson": 11, "add_ellipsi": 11, "max_length": 11, "shorten_nam": 11, "mlflowcallback": 11, "tracking_uri": 11, "callback": 11, "uri": 11, "server": 11, "set_tracking_uri": 11, "prepare_tag": 11, "tag": 11, "tmp_buildconfig": 11, "noretrainingdataconvent": 11, "nodifferingretrainingdata": 11, "retrainingheadersissu": 11, "retrainingisalreadyprocess": 11, "retrainingislock": 11, "temporalpredspredict": 11, "nopreviousmodel": 11, "prev_model_nam": 11, "samepreviousmodel": 11, "timepointskip": 11, "slurmnolog": 11, "itcod": 11, "slurmtimelimitexceed": 11, "exceed": 11, "slurmmemoryexceed": 11, "slurmjobskip": 11, "slurmparseerror": 11, "create_depend": 11, "remove_schema_properti": 11, "add_boolean_guards_for_schema_properti": 11, "replacekei": 11, "input_": 11, "replacevalu": 11, "addsibl": 11, "delsibl": 11, "sibl": 11, "getref": 11, "context": 11, "recurs": 11, "nest": 11, "copytitl": 11, "oneof": 11, "replaceenum": 11, "singleton": 11, "const": 11, "addtitl": 11, "get_authorization_head": 11, "trackingdata": 11, "trial_numb": [11, 12], "trial_valu": 11, "trial_stat": 11, "all_cv_test_scor": 11, "removeprefix": 11, "round_scor": 11, "internaltrackingcallback": 11, "progress": 11, "buildtrackingdata": 11, "response_column_nam": 11, "test_point": 11, "track_build": 11, "mkdict": 11, "load_df_from_fil": 11, "remove_failed_idx": 11, "failed_idx": 11, "md5_hash": 11, "md5": 11, "buildingconfigurationenum": 12, "configurationenum": 12, "general_hyperparamet": 12, "hyper_paramet": 12, "general_regressor": 12, "general_classifi": 12, "metadata_besttri": 12, "metadata_bestvalu": 12, "general_dis": 12, "general_paramet": 12, "task_optim": 12, "task_build": 12, "data_inputcolumn": 12, "data_responsecolumn": 12, "data_train": 12, "data_test": 12, "descriptors_avalon": 12, "descriptors_avalon_nbit": 12, "descriptors_ecfp": 12, "descriptors_ecfp_radiu": 12, "descriptors_ecfp_nbit": 12, "descriptors_ecfpcount": 12, "descriptors_ecfpcounts_radiu": 12, "descriptors_ecfpcounts_usefeatur": 12, "descriptors_pathfp": 12, "descriptors_pathfp_maxpath": 12, "descriptors_pathfp_fps": 12, "descriptors_maccskei": 12, "descriptors_unsc_physchem": 12, "descriptors_physchem": 12, "descriptors_physchem_rdkitnam": 12, "descriptors_amorprot": 12, "descriptors_unsc_mapc": 12, "descriptors_mapc": 12, "descriptors_mapc_maxradiu": 12, "descriptors_mapc_npermut": 12, "descriptors_unsc_jazzi": 12, "descriptors_jazzi": 12, "descriptors_jazzy_jazzynam": 12, "descriptors_precomput": 12, "descriptors_precomputed_fil": 12, "descriptors_precomputed_input_columnn": 12, "descriptors_precomputed_response_column": 12, "descriptors_unsc_zscal": 12, "descriptors_zscal": 12, "descriptors_smil": 12, "descriptors_smiles_and_si": 12, "descriptors_smiles_and_si_fil": 12, "descriptors_smiles_and_si_input_column": 12, "descriptors_smiles_and_si_aux_weight_pc": 12, "descriptors_sc": 12, "descriptors_scaled_descriptor": 12, "descriptors_scaled_descriptor_paramet": 12, "descriptors_composit": 12, "settings_mod": 12, "settings_mode_regress": 12, "settings_mode_classif": 12, "settings_cross_valid": 12, "settings_direct": 12, "settings_n_tri": 12, "settings_n_job": 12, "settings_shuffl": 12, "algorithms_low": 12, "algorithms_high": 12, "algorithms_q": 12, "algorithms_interface_sklearn": 12, "algorithms_interface_xgboost": 12, "algorithms_rfregressor": 12, "algorithms_rfclassifi": 12, "algorithms_rf_max_featur": 12, "algorithms_rf_max_depth": 12, "algorithms_rf_n_estim": 12, "algorithms_svr": 12, "algorithms_svr_c": 12, "algorithms_svr_gamma": 12, "algorithms_svc": 12, "algorithms_svc_c": 12, "algorithms_svc_gamma": 12, "algorithms_lasso": 12, "algorithms_lasso_alpha": 12, "algorithms_kneighborsclassifi": 12, "algorithms_kneighborsregressor": 12, "algorithms_kneighbors_n_neighbor": 12, "algorithms_kneighbors_metr": 12, "algorithms_kneighbors_weight": 12, "algorithms_ridg": 12, "algorithms_ridge_alpha": 12, "algorithms_plsregress": 12, "algorithms_plsregression_n_compon": 12, "algorithms_logisticregress": 12, "algorithms_logisticregression_solv": 12, "algorithms_logisticregression_c": 12, "algorithms_adaboostclassifi": 12, "algorithms_adaboostclassifier_n_estim": 12, "algorithms_adaboostclassifier_learning_r": 12, "algorithms_xgbregressor": 12, "algorithms_xgbregressor_max_depth": 12, "algorithms_xgbregressor_n_estim": 12, "algorithms_xgbregressor_learning_r": 12, "algorithms_prf": 12, "algorithms_prf_max_featur": 12, "algorithms_prf_max_depth": 12, "algorithms_prf_n_estim": 12, "algorithms_prf_minpysumleaf": 12, "algorithms_prf_use_py_gini": 12, "algorithms_prf_use_py_leaf": 12, "algorithms_chemprop": 12, "basechemprop": 12, "algorithms_chemprop_regressor": 12, "algorithms_chemprop_hyperopt_regressor": 12, "algorithms_chemprop_classifi": 12, "algorithms_chemprop_hyperopt_classifi": 12, "algorithms_chemprop_activ": 12, "algorithms_chemprop_aggreg": 12, "algorithms_chemprop_aggregation_norm": 12, "algorithms_chemprop_batch_s": 12, "algorithms_chemprop_depth": 12, "algorithms_chemprop_dropout": 12, "algorithms_chemprop_epoch": 12, "algorithms_chemprop_ensemble_s": 12, "algorithms_chemprop_features_gener": 12, "algorithms_chemprop_ffn_hidden_s": 12, "algorithms_chemprop_ffn_num_lay": 12, "algorithms_chemprop_frzn": 12, "algorithms_chemprop_final_lr_ratio_exp": 12, "algorithms_chemprop_hidden_s": 12, "algorithms_chemprop_num_it": 12, "algorithms_chemprop_init_lr_ratio_exp": 12, "algorithms_chemprop_max_lr_exp": 12, "algorithms_chemprop_pretrained_model": 12, "algorithms_chemprop_search_parameter_level": 12, "algorithms_chemprop_startup_random_it": 12, "startup_random_it": 12, "algorithms_chemprop_warmup_epochs_ratio": 12, "algorithms_calibratedclassifiercv": 12, "algorithms_calibratedclassifiercv_ensembl": 12, "algorithms_calibratedclassifiercv_estim": 12, "algorithms_calibratedclassifiercv_method": 12, "algorithms_calibratedclassifiercv_n_fold": 12, "algorithms_calibratedclassifiercv_param": 12, "calibrated_param": 12, "algorithms_mapi": 12, "algorithms_mapie_alpha": 12, "interfaceenum": 12, "sklearn_set": 12, "xgboost_set": 12, "chemprop_set": 12, "prf_set": 12, "calibrated_set": 12, "modelrunnerdataframeenum": 12, "modelrunn": 12, "objectiveenum": 12, "attribute_trial_train_scor": 12, "extra_column_besthit": 12, "besthit": 12, "optimizationconfigurationenum": 12, "predictionconfigurationenum": 12, "data_dataset": 12, "sklearnreturnvalueenum": 12, "cross_validate_fit_tim": 12, "fit_tim": 12, "cross_validate_score_tim": 12, "score_tim": 12, "cross_validate_test_scor": 12, "cross_validate_train_scor": 12, "xgboostreturnvalueenum": 12, "visualizationenum": 12, "visualization_regressor": 12, "visualization_classifi": 12, "visualization_use_xvfb": 12, "visualization_output_fold": 12, "visualization_file_format": 12, "visualization_plot": 12, "visualization_plots_histori": 12, "visualization_plots_contour": 12, "visualization_plots_parallel_coordin": 12, "visualization_plots_slic": 12, "optuna_system_attrs_numb": 12, "_number": 12, "optuna_system_attrs_intermediate_valu": 12, "intermediate_valu": 12, "optuna_system_attrs_trial_id": 12, "trial_id": 12, "studyuserattr": 12, "trialuserattr": 12, "trialparam": 12, "algorithm_hash": 12, "mlflowlogparam": 12, "sklearnsplitt": 13, "get_n_split": 13, "cvsplitter": 13, "although": 13, "underli": 13, "get_sklearn_splitt": 13, "n_split": 13, "repeat": [13, 14], "edg": [13, 14], "stratifiedshufflesplit": [13, 14], "revert": [13, 14], "empti": 13, "kfold": 13, "consecut": 13, "fd_bin": 13, "11879": 13, "10297": 13, "adjac": 13, "downstream": 13, "nativ": 13, "histogramstratifiedshufflesplit": 13, "test_fract": 13, "groupingsplitt": 13, "column_nam": [13, 14], "butina_clust": [13, 14], "cluster": [13, 14], "butina": [13, 14], "make_scaffold_gener": [13, 14], "murcko": [13, 14], "hetero": [13, 14], "difficulti": [13, 14], "novel": [13, 14], "datatransformerror": 13, "datatransform": 13, "logarithm": [13, 15], "base_dict": 13, "ufunc": 13, "base_neg": 13, "reverse_dict": 13, "exp": 13, "transform_df": 13, "transform_on": 13, "reverse_transform_df": 13, "reverse_transform_on": 13, "auxtransform": 13, "transfor": 13, "auxiliary_data": 13, "usabl": [13, 15]}, "objects": {"": [[9, 0, 0, "-", "optunaz"]], "optunaz": [[9, 0, 0, "-", "automl"], [9, 0, 0, "-", "builder"], [10, 0, 0, "-", "config"], [9, 0, 0, "-", "datareader"], [9, 0, 0, "-", "descriptors"], [9, 0, 0, "-", "evaluate"], [9, 0, 0, "-", "explainability"], [9, 0, 0, "-", "metircs"], [9, 0, 0, "-", "model_writer"], [9, 0, 0, "-", "objective"], [9, 0, 0, "-", "optbuild"], [9, 0, 0, "-", "predict"], [9, 0, 0, "-", "schemagen"], [9, 0, 0, "-", "three_step_opt_build_merge"], [11, 0, 0, "-", "utils"], [9, 0, 0, "-", "visualizer"]], "optunaz.automl": [[9, 1, 1, "", "ModelAutoML"], [9, 1, 1, "", "ModelDispatcher"], [9, 4, 1, "", "dispatcher_process"], [9, 4, 1, "", "main"], [9, 4, 1, "", "meta"], [9, 4, 1, "", "prepare_dispatcher"], [9, 4, 1, "", "process_retraining_task"], [9, 4, 1, "", "validate_args"]], "optunaz.automl.ModelAutoML": [[9, 2, 1, "", "first_run"], [9, 3, 1, "", "getAllRetrainingData"], [9, 3, 1, "", "getRetrainingData"], [9, 3, 1, "", "initProcessedTimepoints"], [9, 2, 1, "", "last_timepoint"], [9, 2, 1, "", "processed_timepoints"], [9, 3, 1, "", "setProcessedTimepoints"], [9, 3, 1, "", "setRetrainingData"]], "optunaz.automl.ModelDispatcher": [[9, 3, 1, "", "addSlurmRetry"], [9, 3, 1, "", "calcSlurmMem"], [9, 3, 1, "", "checkIfRetrainingProcessed"], [9, 3, 1, "", "checkRunningSlurmJobs"], [9, 3, 1, "", "checkSaveTemporalModel"], [9, 3, 1, "", "checkSkipped"], [9, 3, 1, "", "checkSlurmStatusAndNextProcedure"], [9, 3, 1, "", "checkisLocked"], [9, 3, 1, "", "doTemporalPredictions"], [9, 3, 1, "", "getSlurmRetry"], [9, 3, 1, "", "increaseJobCpu"], [9, 3, 1, "", "increaseJobMem"], [9, 3, 1, "", "increaseJobTime"], [9, 3, 1, "", "isTrained"], [9, 2, 1, "", "pretrained_model"], [9, 3, 1, "", "processQuorum"], [9, 3, 1, "", "processRetraining"], [9, 3, 1, "", "processTrain"], [9, 3, 1, "", "resubmitAnyFailedJobs"], [9, 3, 1, "", "setDispatcherVariables"], [9, 3, 1, "", "setJobLocked"], [9, 3, 1, "", "setSkippedTimepoint"], [9, 3, 1, "", "submitJob"], [9, 3, 1, "", "writeDataset"], [9, 3, 1, "", "writeJson"], [9, 3, 1, "", "writeSlurm"]], "optunaz.builder": [[9, 4, 1, "", "build"]], "optunaz.config": [[10, 1, 1, "", "Algorithm"], [10, 1, 1, "", "ModelMode"], [10, 1, 1, "", "NameParameterDataclass"], [10, 1, 1, "", "OptimizationDirection"], [10, 1, 1, "", "Task"], [10, 1, 1, "", "Visualization"], [10, 0, 0, "-", "build_from_opt"], [10, 0, 0, "-", "buildconfig"], [10, 0, 0, "-", "optconfig"]], "optunaz.config.ModelMode": [[10, 5, 1, "", "CLASSIFICATION"], [10, 5, 1, "", "REGRESSION"]], "optunaz.config.NameParameterDataclass": [[10, 3, 1, "", "new"]], "optunaz.config.OptimizationDirection": [[10, 5, 1, "", "MAXIMIZATION"], [10, 5, 1, "", "MINIMIZATION"]], "optunaz.config.Task": [[10, 5, 1, "", "BUILDING"], [10, 5, 1, "", "OPTIMIZATION"], [10, 5, 1, "", "PREDICTION"]], "optunaz.config.Visualization": [[10, 1, 1, "", "ImageFileFormat"], [10, 1, 1, "", "Plots"], [10, 5, 1, "", "file_format"], [10, 5, 1, "", "output_folder"], [10, 5, 1, "", "plots"], [10, 5, 1, "", "use_xvfb"]], "optunaz.config.Visualization.ImageFileFormat": [[10, 5, 1, "", "JPEG"], [10, 5, 1, "", "JPG"], [10, 5, 1, "", "PDF"], [10, 5, 1, "", "PNG"], [10, 5, 1, "", "SVG"]], "optunaz.config.Visualization.Plots": [[10, 5, 1, "", "plot_contour"], [10, 5, 1, "", "plot_history"], [10, 5, 1, "", "plot_parallel_coordinate"], [10, 5, 1, "", "plot_slice"]], "optunaz.config.build_from_opt": [[10, 4, 1, "", "buildconfig_from_trial"], [10, 4, 1, "", "check_invalid_descriptor_param"], [10, 4, 1, "", "encode_name"], [10, 4, 1, "", "remove_algo_hash"], [10, 4, 1, "", "set_build_cache"], [10, 4, 1, "", "suggest_alg_params"], [10, 4, 1, "", "suggest_aux_params"]], "optunaz.config.buildconfig": [[10, 1, 1, "", "AdaBoostClassifier"], [10, 1, 1, "", "Algorithm"], [10, 1, 1, "", "BuildConfig"], [10, 1, 1, "", "CalibratedClassifierCVWithVA"], [10, 1, 1, "", "ChemPropClassifier"], [10, 1, 1, "", "ChemPropHyperoptClassifier"], [10, 1, 1, "", "ChemPropHyperoptRegressor"], [10, 1, 1, "", "ChemPropRegressor"], [10, 1, 1, "", "ChemPropRegressorPretrained"], [10, 1, 1, "", "KNeighborsClassifier"], [10, 1, 1, "", "KNeighborsRegressor"], [10, 1, 1, "", "Lasso"], [10, 1, 1, "", "LogisticRegression"], [10, 1, 1, "", "Mapie"], [10, 1, 1, "", "PLSRegression"], [10, 1, 1, "", "PRFClassifier"], [10, 1, 1, "", "RandomForestClassifier"], [10, 1, 1, "", "RandomForestRegressor"], [10, 1, 1, "", "Ridge"], [10, 1, 1, "", "SVC"], [10, 1, 1, "", "SVR"], [10, 1, 1, "", "XGBRegressor"]], "optunaz.config.buildconfig.AdaBoostClassifier": [[10, 1, 1, "", "AdaBoostClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.AdaBoostClassifier.AdaBoostClassifierParameters": [[10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.buildconfig.Algorithm": [[10, 3, 1, "", "estimator"]], "optunaz.config.buildconfig.BuildConfig": [[10, 1, 1, "", "Metadata"], [10, 1, 1, "", "Settings"], [10, 5, 1, "", "algorithm"], [10, 5, 1, "", "data"], [10, 5, 1, "", "descriptor"], [10, 5, 1, "", "metadata"], [10, 5, 1, "", "settings"], [10, 5, 1, "", "task"]], "optunaz.config.buildconfig.BuildConfig.Metadata": [[10, 5, 1, "", "best_trial"], [10, 5, 1, "", "best_value"], [10, 5, 1, "", "cross_validation"], [10, 5, 1, "", "n_trials"], [10, 5, 1, "", "name"], [10, 5, 1, "", "shuffle"], [10, 5, 1, "", "visualization"]], "optunaz.config.buildconfig.BuildConfig.Settings": [[10, 5, 1, "", "direction"], [10, 5, 1, "", "mode"], [10, 5, 1, "", "n_trials"], [10, 5, 1, "", "scoring"], [10, 5, 1, "", "tracking_rest_endpoint"]], "optunaz.config.buildconfig.CalibratedClassifierCVWithVA": [[10, 1, 1, "", "CalibratedClassifierCVParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.CalibratedClassifierCVWithVA.CalibratedClassifierCVParameters": [[10, 5, 1, "", "ensemble"], [10, 5, 1, "", "estimator"], [10, 5, 1, "", "method"], [10, 5, 1, "", "n_folds"]], "optunaz.config.buildconfig.ChemPropClassifier": [[10, 1, 1, "", "ChemPropClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropClassifier.ChemPropClassifierParameters": [[10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.buildconfig.ChemPropHyperoptClassifier": [[10, 1, 1, "", "ChemPropHyperoptClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropHyperoptClassifier.ChemPropHyperoptClassifierParameters": [[10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.buildconfig.ChemPropHyperoptRegressor": [[10, 1, 1, "", "ChemPropHyperoptRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropHyperoptRegressor.ChemPropHyperoptRegressorParameters": [[10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.buildconfig.ChemPropRegressor": [[10, 1, 1, "", "ChemPropRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropRegressor.ChemPropRegressorParameters": [[10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.buildconfig.ChemPropRegressorPretrained": [[10, 1, 1, "", "ChemPropRegressorPretrainedParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropRegressorPretrained.ChemPropRegressorPretrainedParameters": [[10, 5, 1, "", "epochs"], [10, 5, 1, "", "frzn"], [10, 5, 1, "", "pretrained_model"]], "optunaz.config.buildconfig.KNeighborsClassifier": [[10, 1, 1, "", "KNeighborsClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.KNeighborsClassifier.KNeighborsClassifierParameters": [[10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.buildconfig.KNeighborsRegressor": [[10, 1, 1, "", "KNeighborsRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.KNeighborsRegressor.KNeighborsRegressorParameters": [[10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.buildconfig.Lasso": [[10, 1, 1, "", "LassoParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.Lasso.LassoParameters": [[10, 5, 1, "", "alpha"]], "optunaz.config.buildconfig.LogisticRegression": [[10, 1, 1, "", "LogisticRegressionParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.LogisticRegression.LogisticRegressionParameters": [[10, 5, 1, "", "C"], [10, 5, 1, "", "solver"]], "optunaz.config.buildconfig.Mapie": [[10, 1, 1, "", "MapieParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.Mapie.MapieParameters": [[10, 5, 1, "", "estimator"], [10, 5, 1, "", "mapie_alpha"]], "optunaz.config.buildconfig.PLSRegression": [[10, 1, 1, "", "PLSParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.PLSRegression.PLSParameters": [[10, 5, 1, "", "n_components"]], "optunaz.config.buildconfig.PRFClassifier": [[10, 1, 1, "", "PRFClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.PRFClassifier.PRFClassifierParameters": [[10, 5, 1, "", "bootstrap"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "min_py_sum_leaf"], [10, 5, 1, "", "n_estimators"], [10, 5, 1, "", "new_syn_data_frac"], [10, 5, 1, "", "use_py_gini"], [10, 5, 1, "", "use_py_leafs"]], "optunaz.config.buildconfig.RandomForestClassifier": [[10, 1, 1, "", "RandomForestParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.RandomForestClassifier.RandomForestParameters": [[10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.buildconfig.RandomForestRegressor": [[10, 1, 1, "", "RandomForestParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.RandomForestRegressor.RandomForestParameters": [[10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.buildconfig.Ridge": [[10, 1, 1, "", "RidgeParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.Ridge.RidgeParameters": [[10, 5, 1, "", "alpha"]], "optunaz.config.buildconfig.SVC": [[10, 1, 1, "", "SVCParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.SVC.SVCParameters": [[10, 5, 1, "", "C"], [10, 5, 1, "", "gamma"]], "optunaz.config.buildconfig.SVR": [[10, 1, 1, "", "SVRParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.SVR.SVRParameters": [[10, 5, 1, "", "C"], [10, 5, 1, "", "gamma"]], "optunaz.config.buildconfig.XGBRegressor": [[10, 1, 1, "", "XGBRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.XGBRegressor.XGBRegressorParameters": [[10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig": [[10, 1, 1, "", "AdaBoostClassifier"], [10, 1, 1, "", "Algorithm"], [10, 1, 1, "", "CalibratedClassifierCVEnsemble"], [10, 1, 1, "", "CalibratedClassifierCVMethod"], [10, 1, 1, "", "CalibratedClassifierCVWithVA"], [10, 1, 1, "", "ChemPropActivation"], [10, 1, 1, "", "ChemPropAggregation"], [10, 1, 1, "", "ChemPropClassifier"], [10, 1, 1, "", "ChemPropFeatures_Generator"], [10, 1, 1, "", "ChemPropFrzn"], [10, 1, 1, "", "ChemPropHyperoptClassifier"], [10, 1, 1, "", "ChemPropHyperoptRegressor"], [10, 1, 1, "", "ChemPropRegressor"], [10, 1, 1, "", "ChemPropRegressorPretrained"], [10, 1, 1, "", "ChemPropSearch_Parameter_Level"], [10, 1, 1, "", "ClassificationScore"], [10, 1, 1, "", "KNeighborsClassifier"], [10, 1, 1, "", "KNeighborsMetric"], [10, 1, 1, "", "KNeighborsRegressor"], [10, 1, 1, "", "KNeighborsWeights"], [10, 1, 1, "", "Lasso"], [10, 1, 1, "", "LogisticRegression"], [10, 1, 1, "", "Mapie"], [10, 1, 1, "", "OptimizationConfig"], [10, 1, 1, "", "PLSRegression"], [10, 1, 1, "", "PRFClassifier"], [10, 1, 1, "", "PRFClassifierMaxFeatures"], [10, 1, 1, "", "RandomForestClassifier"], [10, 1, 1, "", "RandomForestMaxFeatures"], [10, 1, 1, "", "RandomForestRegressor"], [10, 1, 1, "", "RegressionScore"], [10, 1, 1, "", "Ridge"], [10, 1, 1, "", "SVC"], [10, 1, 1, "", "SVR"], [10, 1, 1, "", "XGBRegressor"], [10, 4, 1, "", "copy_path_for_scaled_descriptor"], [10, 4, 1, "", "detect_mode_from_algs"], [10, 4, 1, "", "isanyof"]], "optunaz.config.optconfig.AdaBoostClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.AdaBoostClassifier.Parameters": [[10, 1, 1, "", "AdaBoostClassifierParametersLearningRate"], [10, 1, 1, "", "AdaBoostClassifierParametersNEstimators"], [10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.AdaBoostClassifier.Parameters.AdaBoostClassifierParametersLearningRate": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.AdaBoostClassifier.Parameters.AdaBoostClassifierParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.CalibratedClassifierCVEnsemble": [[10, 5, 1, "", "FALSE"], [10, 5, 1, "", "TRUE"]], "optunaz.config.optconfig.CalibratedClassifierCVMethod": [[10, 5, 1, "", "ISOTONIC"], [10, 5, 1, "", "SIGMOID"], [10, 5, 1, "", "VENNABERS"]], "optunaz.config.optconfig.CalibratedClassifierCVWithVA": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.CalibratedClassifierCVWithVA.Parameters": [[10, 5, 1, "", "ensemble"], [10, 5, 1, "", "estimator"], [10, 5, 1, "", "method"], [10, 5, 1, "", "n_folds"]], "optunaz.config.optconfig.ChemPropActivation": [[10, 5, 1, "", "ELU"], [10, 5, 1, "", "LEAKYRELU"], [10, 5, 1, "", "PRELU"], [10, 5, 1, "", "RELU"], [10, 5, 1, "", "SELU"], [10, 5, 1, "", "TANH"]], "optunaz.config.optconfig.ChemPropAggregation": [[10, 5, 1, "", "MEAN"], [10, 5, 1, "", "NORM"], [10, 5, 1, "", "SUM"]], "optunaz.config.optconfig.ChemPropClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters": [[10, 1, 1, "", "ChemPropParametersAggregation_Norm"], [10, 1, 1, "", "ChemPropParametersBatch_Size"], [10, 1, 1, "", "ChemPropParametersDepth"], [10, 1, 1, "", "ChemPropParametersDropout"], [10, 1, 1, "", "ChemPropParametersFFN_Hidden_Size"], [10, 1, 1, "", "ChemPropParametersFFN_Num_Layers"], [10, 1, 1, "", "ChemPropParametersFinal_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersHidden_Size"], [10, 1, 1, "", "ChemPropParametersInit_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersMax_Lr_Exp"], [10, 1, 1, "", "ChemPropParametersWarmup_Epochs_Ratio"], [10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersAggregation_Norm": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersBatch_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersDropout": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersFFN_Hidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersFFN_Num_Layers": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersFinal_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersHidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersInit_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersMax_Lr_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersWarmup_Epochs_Ratio": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropFeatures_Generator": [[10, 5, 1, "", "MORGAN"], [10, 5, 1, "", "MORGAN_COUNT"], [10, 5, 1, "", "NONE"], [10, 5, 1, "", "RDKIT_2D"], [10, 5, 1, "", "RDKIT_2D_NORMALIZED"]], "optunaz.config.optconfig.ChemPropFrzn": [[10, 5, 1, "", "MPNN"], [10, 5, 1, "", "MPNN_FIRST_FFN"], [10, 5, 1, "", "MPNN_LAST_FFN"], [10, 5, 1, "", "NONE"]], "optunaz.config.optconfig.ChemPropHyperoptClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropHyperoptClassifier.Parameters": [[10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.optconfig.ChemPropHyperoptRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropHyperoptRegressor.Parameters": [[10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.optconfig.ChemPropRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters": [[10, 1, 1, "", "ChemPropParametersAggregation_Norm"], [10, 1, 1, "", "ChemPropParametersBatch_Size"], [10, 1, 1, "", "ChemPropParametersDepth"], [10, 1, 1, "", "ChemPropParametersDropout"], [10, 1, 1, "", "ChemPropParametersFFN_Hidden_Size"], [10, 1, 1, "", "ChemPropParametersFFN_Num_Layers"], [10, 1, 1, "", "ChemPropParametersFinal_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersHidden_Size"], [10, 1, 1, "", "ChemPropParametersInit_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersMax_Lr_Exp"], [10, 1, 1, "", "ChemPropParametersWarmup_Epochs_Ratio"], [10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersAggregation_Norm": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersBatch_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersDropout": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersFFN_Hidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersFFN_Num_Layers": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersFinal_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersHidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersInit_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersMax_Lr_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersWarmup_Epochs_Ratio": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressorPretrained": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropRegressorPretrained.Parameters": [[10, 1, 1, "", "ChemPropParametersEpochs"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "frzn"], [10, 5, 1, "", "pretrained_model"]], "optunaz.config.optconfig.ChemPropRegressorPretrained.Parameters.ChemPropParametersEpochs": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropSearch_Parameter_Level": [[10, 5, 1, "", "AUTO"], [10, 5, 1, "", "L1"], [10, 5, 1, "", "L2"], [10, 5, 1, "", "L3"], [10, 5, 1, "", "L4"], [10, 5, 1, "", "L5"], [10, 5, 1, "", "L6"], [10, 5, 1, "", "L7"], [10, 5, 1, "", "L8"]], "optunaz.config.optconfig.ClassificationScore": [[10, 5, 1, "", "ACCURACY"], [10, 5, 1, "", "AUC_PR_CAL"], [10, 5, 1, "", "AVERAGE_PRECISION"], [10, 5, 1, "", "BALANCED_ACCURACY"], [10, 5, 1, "", "BEDROC"], [10, 5, 1, "", "CONCORDANCE_INDEX"], [10, 5, 1, "", "F1"], [10, 5, 1, "", "F1_MACRO"], [10, 5, 1, "", "F1_MICRO"], [10, 5, 1, "", "F1_WEIGHTED"], [10, 5, 1, "", "JACCARD"], [10, 5, 1, "", "JACCARD_MACRO"], [10, 5, 1, "", "JACCARD_MICRO"], [10, 5, 1, "", "JACCARD_WEIGHTED"], [10, 5, 1, "", "NEG_BRIER_SCORE"], [10, 5, 1, "", "PRECISION"], [10, 5, 1, "", "PRECISION_MACRO"], [10, 5, 1, "", "PRECISION_MICRO"], [10, 5, 1, "", "PRECISION_WEIGHTED"], [10, 5, 1, "", "RECALL"], [10, 5, 1, "", "RECALL_MACRO"], [10, 5, 1, "", "RECALL_MICRO"], [10, 5, 1, "", "RECALL_WEIGHTED"], [10, 5, 1, "", "ROC_AUC"]], "optunaz.config.optconfig.KNeighborsClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.KNeighborsClassifier.Parameters": [[10, 1, 1, "", "KNeighborsClassifierParametersN_Neighbors"], [10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.optconfig.KNeighborsClassifier.Parameters.KNeighborsClassifierParametersN_Neighbors": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.KNeighborsMetric": [[10, 5, 1, "", "EUCLIDEAN"], [10, 5, 1, "", "MANHATTAN"], [10, 5, 1, "", "MINKOWSKI"]], "optunaz.config.optconfig.KNeighborsRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.KNeighborsRegressor.Parameters": [[10, 1, 1, "", "KNeighborsRegressorParametersN_Neighbors"], [10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.optconfig.KNeighborsRegressor.Parameters.KNeighborsRegressorParametersN_Neighbors": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.KNeighborsWeights": [[10, 5, 1, "", "DISTANCE"], [10, 5, 1, "", "UNIFORM"]], "optunaz.config.optconfig.Lasso": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.Lasso.Parameters": [[10, 1, 1, "", "LassoParametersAlpha"], [10, 5, 1, "", "alpha"]], "optunaz.config.optconfig.Lasso.Parameters.LassoParametersAlpha": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.LogisticRegression": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.LogisticRegression.Parameters": [[10, 5, 1, "", "C"], [10, 1, 1, "", "LogisticRegressionParametersParameterC"], [10, 5, 1, "", "solver"]], "optunaz.config.optconfig.LogisticRegression.Parameters.LogisticRegressionParametersParameterC": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.Mapie": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.Mapie.Parameters": [[10, 5, 1, "", "estimator"], [10, 5, 1, "", "mapie_alpha"]], "optunaz.config.optconfig.OptimizationConfig": [[10, 1, 1, "", "Settings"], [10, 5, 1, "", "algorithms"], [10, 5, 1, "", "data"], [10, 5, 1, "", "description"], [10, 5, 1, "", "descriptors"], [10, 5, 1, "", "mode"], [10, 5, 1, "", "name"], [10, 3, 1, "", "set_algo_hashes"], [10, 3, 1, "", "set_cache"], [10, 5, 1, "", "settings"], [10, 5, 1, "", "task"], [10, 5, 1, "", "visualization"]], "optunaz.config.optconfig.OptimizationConfig.Settings": [[10, 5, 1, "", "cross_validation"], [10, 5, 1, "", "cv_split_strategy"], [10, 5, 1, "", "direction"], [10, 5, 1, "", "minimise_std_dev"], [10, 5, 1, "", "mode"], [10, 5, 1, "", "n_chemprop_trials"], [10, 5, 1, "", "n_jobs"], [10, 5, 1, "", "n_startup_trials"], [10, 5, 1, "", "n_trials"], [10, 5, 1, "", "optuna_storage"], [10, 5, 1, "", "random_seed"], [10, 5, 1, "", "scoring"], [10, 5, 1, "", "shuffle"], [10, 5, 1, "", "split_chemprop"], [10, 5, 1, "", "track_to_mlflow"], [10, 5, 1, "", "tracking_rest_endpoint"], [10, 5, 1, "", "use_cache"]], "optunaz.config.optconfig.PLSRegression": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.PLSRegression.Parameters": [[10, 1, 1, "", "NComponents"], [10, 5, 1, "", "n_components"]], "optunaz.config.optconfig.PLSRegression.Parameters.NComponents": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.PRFClassifier.Parameters": [[10, 1, 1, "", "PRFClassifierParametersMaxDepth"], [10, 1, 1, "", "PRFClassifierParametersMinPySumLeaf"], [10, 1, 1, "", "PRFClassifierParametersNEstimators"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "min_py_sum_leaf"], [10, 5, 1, "", "n_estimators"], [10, 5, 1, "", "use_py_gini"], [10, 5, 1, "", "use_py_leafs"]], "optunaz.config.optconfig.PRFClassifier.Parameters.PRFClassifierParametersMaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifier.Parameters.PRFClassifierParametersMinPySumLeaf": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifier.Parameters.PRFClassifierParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifierMaxFeatures": [[10, 5, 1, "", "AUTO"], [10, 5, 1, "", "LOG2"], [10, 5, 1, "", "SQRT"]], "optunaz.config.optconfig.RandomForestClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.RandomForestClassifier.Parameters": [[10, 1, 1, "", "RandomForestClassifierParametersMaxDepth"], [10, 1, 1, "", "RandomForestClassifierParametersNEstimators"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.RandomForestClassifier.Parameters.RandomForestClassifierParametersMaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RandomForestClassifier.Parameters.RandomForestClassifierParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RandomForestMaxFeatures": [[10, 5, 1, "", "AUTO"], [10, 5, 1, "", "LOG2"], [10, 5, 1, "", "SQRT"]], "optunaz.config.optconfig.RandomForestRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.RandomForestRegressor.Parameters": [[10, 1, 1, "", "RandomForestRegressorParametersMaxDepth"], [10, 1, 1, "", "RandomForestRegressorParametersNEstimators"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.RandomForestRegressor.Parameters.RandomForestRegressorParametersMaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RandomForestRegressor.Parameters.RandomForestRegressorParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RegressionScore": [[10, 5, 1, "", "EXPLAINED_VARIANCE"], [10, 5, 1, "", "MAX_ERROR"], [10, 5, 1, "", "NEG_MEAN_ABSOLUTE_ERROR"], [10, 5, 1, "", "NEG_MEAN_SQUARED_ERROR"], [10, 5, 1, "", "NEG_MEDIAN_ABSOLUTE_ERROR"], [10, 5, 1, "", "R2"]], "optunaz.config.optconfig.Ridge": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.Ridge.Parameters": [[10, 1, 1, "", "Alpha"], [10, 5, 1, "", "alpha"]], "optunaz.config.optconfig.Ridge.Parameters.Alpha": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVC": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.SVC.Parameters": [[10, 5, 1, "", "C"], [10, 1, 1, "", "Gamma"], [10, 1, 1, "", "SVCParametersParameterC"], [10, 5, 1, "", "gamma"]], "optunaz.config.optconfig.SVC.Parameters.Gamma": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVC.Parameters.SVCParametersParameterC": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVR": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.SVR.Parameters": [[10, 5, 1, "", "C"], [10, 1, 1, "", "SVRParametersGamma"], [10, 1, 1, "", "SVRParametersParameterC"], [10, 5, 1, "", "gamma"]], "optunaz.config.optconfig.SVR.Parameters.SVRParametersGamma": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVR.Parameters.SVRParametersParameterC": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.XGBRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.XGBRegressor.Parameters": [[10, 1, 1, "", "LearningRate"], [10, 1, 1, "", "MaxDepth"], [10, 1, 1, "", "NEstimators"], [10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.XGBRegressor.Parameters.LearningRate": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.XGBRegressor.Parameters.MaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.XGBRegressor.Parameters.NEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.datareader": [[9, 1, 1, "", "Dataset"], [9, 4, 1, "", "deduplicate"], [9, 4, 1, "", "isvalid"], [9, 4, 1, "", "merge"], [9, 4, 1, "", "read_data"], [9, 4, 1, "", "split"], [9, 4, 1, "", "transform"]], "optunaz.datareader.Dataset": [[9, 5, 1, "", "aux_column"], [9, 5, 1, "", "aux_transform"], [9, 3, 1, "", "check_sets"], [9, 5, 1, "", "deduplication_strategy"], [9, 3, 1, "", "get_merged_sets"], [9, 3, 1, "", "get_sets"], [9, 5, 1, "", "input_column"], [9, 5, 1, "", "intermediate_test_dataset_file"], [9, 5, 1, "", "intermediate_training_dataset_file"], [9, 5, 1, "", "log_transform"], [9, 5, 1, "", "log_transform_base"], [9, 5, 1, "", "log_transform_negative"], [9, 5, 1, "", "log_transform_unit_conversion"], [9, 5, 1, "", "probabilistic_threshold_representation"], [9, 5, 1, "", "probabilistic_threshold_representation_std"], [9, 5, 1, "", "probabilistic_threshold_representation_threshold"], [9, 5, 1, "", "response_column"], [9, 5, 1, "", "response_type"], [9, 5, 1, "", "save_intermediate_files"], [9, 5, 1, "", "split_strategy"], [9, 5, 1, "", "test_dataset_file"], [9, 5, 1, "", "training_dataset_file"]], "optunaz.descriptors": [[9, 1, 1, "", "AmorProtDescriptors"], [9, 1, 1, "", "Avalon"], [9, 1, 1, "", "CanonicalSmiles"], [9, 1, 1, "", "CompositeDescriptor"], [9, 1, 1, "", "ECFP"], [9, 1, 1, "", "ECFP_counts"], [9, 1, 1, "", "FittedSklearnScaler"], [9, 1, 1, "", "GenericScaffold"], [9, 1, 1, "", "JazzyDescriptors"], [9, 1, 1, "", "MACCS_keys"], [9, 1, 1, "", "MAPC"], [9, 1, 1, "", "MolDescriptor"], [9, 6, 1, "", "NoValidSmiles"], [9, 1, 1, "", "PathFP"], [9, 1, 1, "", "PhyschemDescriptors"], [9, 1, 1, "", "PrecomputedDescriptorFromFile"], [9, 1, 1, "", "RdkitDescriptor"], [9, 1, 1, "", "Scaffold"], [9, 1, 1, "", "ScaledDescriptor"], [9, 6, 1, "", "ScalingFittingError"], [9, 1, 1, "", "SmilesAndSideInfoFromFile"], [9, 1, 1, "", "SmilesFromFile"], [9, 1, 1, "", "UnfittedSklearnScaler"], [9, 1, 1, "", "UnscaledJazzyDescriptors"], [9, 1, 1, "", "UnscaledMAPC"], [9, 1, 1, "", "UnscaledPhyschemDescriptors"], [9, 1, 1, "", "UnscaledZScalesDescriptors"], [9, 1, 1, "", "ValidDescriptor"], [9, 1, 1, "", "ZScalesDescriptors"], [9, 4, 1, "", "descriptor_from_config"], [9, 4, 1, "", "mol_from_smi"], [9, 4, 1, "", "numpy_from_rdkit"]], "optunaz.descriptors.AmorProtDescriptors": [[9, 1, 1, "", "AmorProt"], [9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.AmorProtDescriptors.AmorProt": [[9, 3, 1, "", "T"], [9, 3, 1, "", "fingerprint"]], "optunaz.descriptors.Avalon": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.Avalon.Parameters": [[9, 5, 1, "", "nBits"]], "optunaz.descriptors.CanonicalSmiles": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.CompositeDescriptor": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 3, 1, "", "fp_info"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.CompositeDescriptor.Parameters": [[9, 5, 1, "", "descriptors"]], "optunaz.descriptors.ECFP": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ECFP.Parameters": [[9, 5, 1, "", "nBits"], [9, 5, 1, "", "radius"], [9, 5, 1, "", "returnRdkit"]], "optunaz.descriptors.ECFP_counts": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ECFP_counts.Parameters": [[9, 5, 1, "", "nBits"], [9, 5, 1, "", "radius"], [9, 5, 1, "", "useFeatures"]], "optunaz.descriptors.FittedSklearnScaler": [[9, 3, 1, "", "get_fitted_scaler"], [9, 5, 1, "", "name"], [9, 5, 1, "", "saved_params"]], "optunaz.descriptors.GenericScaffold": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.JazzyDescriptors": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.JazzyDescriptors.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "jazzy_filters"], [9, 5, 1, "", "jazzy_names"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.MACCS_keys": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.MAPC": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.MAPC.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "maxRadius"], [9, 5, 1, "", "nPermutations"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.MolDescriptor": [[9, 3, 1, "", "calculate_from_smi"], [9, 3, 1, "", "parallel_compute_descriptor"]], "optunaz.descriptors.PathFP": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.PathFP.Parameters": [[9, 5, 1, "", "fpSize"], [9, 5, 1, "", "maxPath"]], "optunaz.descriptors.PhyschemDescriptors": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.PhyschemDescriptors.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "rdkit_names"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.PrecomputedDescriptorFromFile": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 3, 1, "", "inference_parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.PrecomputedDescriptorFromFile.Parameters": [[9, 5, 1, "", "file"], [9, 5, 1, "", "input_column"], [9, 5, 1, "", "response_column"]], "optunaz.descriptors.RdkitDescriptor": [[9, 3, 1, "", "calculate_from_mol"], [9, 3, 1, "", "calculate_from_smi"]], "optunaz.descriptors.Scaffold": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ScaledDescriptor": [[9, 1, 1, "", "ScaledDescriptorParameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"], [9, 3, 1, "", "set_unfitted_scaler_data"]], "optunaz.descriptors.ScaledDescriptor.ScaledDescriptorParameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.SmilesAndSideInfoFromFile": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.SmilesAndSideInfoFromFile.Parameters": [[9, 1, 1, "", "Aux_Weight_Pc"], [9, 5, 1, "", "aux_weight_pc"], [9, 5, 1, "", "file"], [9, 5, 1, "", "input_column"]], "optunaz.descriptors.SmilesAndSideInfoFromFile.Parameters.Aux_Weight_Pc": [[9, 5, 1, "", "high"], [9, 5, 1, "", "low"], [9, 5, 1, "", "q"]], "optunaz.descriptors.SmilesFromFile": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnfittedSklearnScaler": [[9, 1, 1, "", "MolData"], [9, 3, 1, "", "get_fitted_scaler_for_fp"], [9, 5, 1, "", "mol_data"], [9, 5, 1, "", "name"]], "optunaz.descriptors.UnfittedSklearnScaler.MolData": [[9, 5, 1, "", "file_path"], [9, 5, 1, "", "smiles_column"]], "optunaz.descriptors.UnscaledJazzyDescriptors": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnscaledJazzyDescriptors.Parameters": [[9, 5, 1, "", "jazzy_filters"], [9, 5, 1, "", "jazzy_names"]], "optunaz.descriptors.UnscaledMAPC": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnscaledMAPC.Parameters": [[9, 5, 1, "", "maxRadius"], [9, 5, 1, "", "nPermutations"]], "optunaz.descriptors.UnscaledPhyschemDescriptors": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnscaledPhyschemDescriptors.Parameters": [[9, 5, 1, "", "rdkit_names"]], "optunaz.descriptors.UnscaledZScalesDescriptors": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ValidDescriptor": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ZScalesDescriptors": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ZScalesDescriptors.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "scaler"]], "optunaz.evaluate": [[9, 4, 1, "", "get_merged_train_score"], [9, 4, 1, "", "get_scores"], [9, 4, 1, "", "get_train_test_scores"], [9, 4, 1, "", "score_all"], [9, 4, 1, "", "score_all_smiles"]], "optunaz.explainability": [[9, 4, 1, "", "ExplainPreds"], [9, 4, 1, "", "ShapExplainer"], [9, 4, 1, "", "explain_ECFP"], [9, 4, 1, "", "get_ecfp_fpinfo"], [9, 4, 1, "", "get_ecfpcount_fpinfo"], [9, 4, 1, "", "get_fp_info"], [9, 4, 1, "", "runShap"]], "optunaz.metircs": [[9, 4, 1, "", "auc_pr_cal"], [9, 4, 1, "", "bedroc_score"], [9, 4, 1, "", "concordance_index"], [9, 4, 1, "", "validate_cls_input"]], "optunaz.model_writer": [[9, 1, 1, "", "Predictor"], [9, 1, 1, "", "QSARtunaModel"], [9, 4, 1, "", "get_metadata"], [9, 4, 1, "", "get_transform"], [9, 4, 1, "", "perform_ptr"], [9, 4, 1, "", "save_model"], [9, 4, 1, "", "wrap_model"]], "optunaz.model_writer.Predictor": [[9, 3, 1, "", "explain"], [9, 3, 1, "", "predict"], [9, 3, 1, "", "predict_proba"], [9, 3, 1, "", "predict_uncert"]], "optunaz.model_writer.QSARtunaModel": [[9, 5, 1, "", "aux_transform"], [9, 5, 1, "", "descriptor"], [9, 5, 1, "", "metadata"], [9, 5, 1, "", "mode"], [9, 3, 1, "", "predict_from_smiles"], [9, 5, 1, "", "predictor"], [9, 5, 1, "", "transform"]], "optunaz.objective": [[9, 6, 1, "", "NoValidDescriptors"], [9, 1, 1, "", "Objective"], [9, 4, 1, "", "null_scores"]], "optunaz.objective.Objective": [[9, 5, 1, "", "cache"], [9, 5, 1, "", "optconfig"], [9, 5, 1, "", "train_aux"], [9, 5, 1, "", "train_smiles"], [9, 5, 1, "", "train_y"]], "optunaz.optbuild": [[9, 4, 1, "", "main"]], "optunaz.predict": [[9, 6, 1, "", "ArgsError"], [9, 6, 1, "", "AuxCovariateMissing"], [9, 6, 1, "", "PrecomputedError"], [9, 6, 1, "", "UncertaintyError"], [9, 4, 1, "", "check_precomp_args"], [9, 4, 1, "", "main"], [9, 4, 1, "", "set_inference_params"], [9, 4, 1, "", "validate_args"], [9, 4, 1, "", "validate_aux"], [9, 4, 1, "", "validate_set_precomputed"], [9, 4, 1, "", "validate_uncertainty"]], "optunaz.schemagen": [[9, 4, 1, "", "doctitle"], [9, 4, 1, "", "main"], [9, 4, 1, "", "patch_schema_generic"], [9, 4, 1, "", "patch_schema_optunaz"], [9, 4, 1, "", "type_base_schema"]], "optunaz.three_step_opt_build_merge": [[9, 4, 1, "", "base_chemprop_params"], [9, 4, 1, "", "build_best"], [9, 4, 1, "", "build_merged"], [9, 4, 1, "", "buildconfig_best"], [9, 4, 1, "", "log_scores"], [9, 4, 1, "", "optimize"], [9, 4, 1, "", "run_study"], [9, 4, 1, "", "split_optimize"]], "optunaz.utils": [[12, 0, 0, "-", "enums"], [11, 0, 0, "-", "files_paths"], [11, 4, 1, "", "load_df_from_file"], [11, 0, 0, "-", "load_json"], [11, 4, 1, "", "md5_hash"], [11, 4, 1, "", "mkdict"], [11, 0, 0, "-", "mlflow"], [13, 0, 0, "-", "preprocessing"], [11, 4, 1, "", "remove_failed_idx"], [11, 0, 0, "-", "retraining"], [11, 0, 0, "-", "schema"], [11, 0, 0, "-", "tracking"]], "optunaz.utils.enums": [[12, 1, 1, "", "MlflowLogParams"], [12, 1, 1, "", "StudyUserAttrs"], [12, 1, 1, "", "TrialParams"], [12, 1, 1, "", "TrialUserAttrs"], [12, 0, 0, "-", "building_configuration_enum"], [12, 0, 0, "-", "configuration_enum"], [12, 0, 0, "-", "interface_enum"], [12, 0, 0, "-", "model_runner_enum"], [12, 0, 0, "-", "objective_enum"], [12, 0, 0, "-", "optimization_configuration_enum"], [12, 0, 0, "-", "prediction_configuration_enum"], [12, 0, 0, "-", "return_values_enum"], [12, 0, 0, "-", "visualization_enum"]], "optunaz.utils.enums.MlflowLogParams": [[12, 5, 1, "", "TRIAL_NUMBER"]], "optunaz.utils.enums.StudyUserAttrs": [[12, 5, 1, "", "OPTCONFIG"]], "optunaz.utils.enums.TrialParams": [[12, 5, 1, "", "ALGORITHM_HASH"], [12, 5, 1, "", "ALGORITHM_NAME"], [12, 5, 1, "", "DESCRIPTOR"]], "optunaz.utils.enums.TrialUserAttrs": [[12, 5, 1, "", "TEST_SCORES"], [12, 5, 1, "", "TRAIN_SCORES"]], "optunaz.utils.enums.building_configuration_enum": [[12, 1, 1, "", "BuildingConfigurationEnum"]], "optunaz.utils.enums.building_configuration_enum.BuildingConfigurationEnum": [[12, 5, 1, "", "GENERAL_CLASSIFIER"], [12, 5, 1, "", "GENERAL_HYPERPARAMETERS"], [12, 5, 1, "", "GENERAL_REGRESSOR"], [12, 5, 1, "", "METADATA"], [12, 5, 1, "", "METADATA_BESTTRIAL"], [12, 5, 1, "", "METADATA_BESTVALUE"]], "optunaz.utils.enums.configuration_enum": [[12, 1, 1, "", "ConfigurationEnum"]], "optunaz.utils.enums.configuration_enum.ConfigurationEnum": [[12, 5, 1, "", "ALGORITHMS"], [12, 5, 1, "", "ALGORITHMS_ADABOOSTCLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_ADABOOSTCLASSIFIER_LEARNING_RATE"], [12, 5, 1, "", "ALGORITHMS_ADABOOSTCLASSIFIER_N_ESTIMATORS"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_ENSEMBLE"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_ESTIMATOR"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_METHOD"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_N_FOLDS"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_PARAMS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_ACTIVATION"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_AGGREGATION"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_AGGREGATION_NORM"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_BATCH_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_CLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_DEPTH"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_DROPOUT"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_ENSEMBLE_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_EPOCHS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FEATURES_GENERATOR"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FFN_HIDDEN_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FFN_NUM_LAYERS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FINAL_LR_RATIO_EXP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FRZN"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_HIDDEN_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_HYPEROPT_CLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_HYPEROPT_REGRESSOR"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_INIT_LR_RATIO_EXP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_MAX_LR_EXP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_NUM_ITERS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_PRETRAINED_MODEL"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_REGRESSOR"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_SEARCH_PARAMETER_LEVEL"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_STARTUP_RANDOM_ITERS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_WARMUP_EPOCHS_RATIO"], [12, 5, 1, "", "ALGORITHMS_HIGH"], [12, 5, 1, "", "ALGORITHMS_INTERFACE_SKLEARN"], [12, 5, 1, "", "ALGORITHMS_INTERFACE_XGBOOST"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORSCLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORSREGRESSOR"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORS_METRIC"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORS_N_NEIGHBORS"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORS_WEIGHTS"], [12, 5, 1, "", "ALGORITHMS_LASSO"], [12, 5, 1, "", "ALGORITHMS_LASSO_ALPHA"], [12, 5, 1, "", "ALGORITHMS_LOGISTICREGRESSION"], [12, 5, 1, "", "ALGORITHMS_LOGISTICREGRESSION_C"], [12, 5, 1, "", "ALGORITHMS_LOGISTICREGRESSION_SOLVER"], [12, 5, 1, "", "ALGORITHMS_LOW"], [12, 5, 1, "", "ALGORITHMS_MAPIE"], [12, 5, 1, "", "ALGORITHMS_MAPIE_ALPHA"], [12, 5, 1, "", "ALGORITHMS_PLSREGRESSION"], [12, 5, 1, "", "ALGORITHMS_PLSREGRESSION_N_COMPONENTS"], [12, 5, 1, "", "ALGORITHMS_PRF"], [12, 5, 1, "", "ALGORITHMS_PRF_MAX_DEPTH"], [12, 5, 1, "", "ALGORITHMS_PRF_MAX_FEATURES"], [12, 5, 1, "", "ALGORITHMS_PRF_MINPYSUMLEAF"], [12, 5, 1, "", "ALGORITHMS_PRF_N_ESTIMATORS"], [12, 5, 1, "", "ALGORITHMS_PRF_USE_PY_GINI"], [12, 5, 1, "", "ALGORITHMS_PRF_USE_PY_LEAFS"], [12, 5, 1, "", "ALGORITHMS_Q"], [12, 5, 1, "", "ALGORITHMS_RFCLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_RFREGRESSOR"], [12, 5, 1, "", "ALGORITHMS_RF_MAX_DEPTH"], [12, 5, 1, "", "ALGORITHMS_RF_MAX_FEATURES"], [12, 5, 1, "", "ALGORITHMS_RF_N_ESTIMATORS"], [12, 5, 1, "", "ALGORITHMS_RIDGE"], [12, 5, 1, "", "ALGORITHMS_RIDGE_ALPHA"], [12, 5, 1, "", "ALGORITHMS_SVC"], [12, 5, 1, "", "ALGORITHMS_SVC_C"], [12, 5, 1, "", "ALGORITHMS_SVC_GAMMA"], [12, 5, 1, "", "ALGORITHMS_SVR"], [12, 5, 1, "", "ALGORITHMS_SVR_C"], [12, 5, 1, "", "ALGORITHMS_SVR_GAMMA"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR_LEARNING_RATE"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR_MAX_DEPTH"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR_N_ESTIMATORS"], [12, 5, 1, "", "DATA"], [12, 5, 1, "", "DATA_INPUTCOLUMN"], [12, 5, 1, "", "DATA_RESPONSECOLUMN"], [12, 5, 1, "", "DATA_TEST"], [12, 5, 1, "", "DATA_TRAINING"], [12, 5, 1, "", "DESCRIPTORS"], [12, 5, 1, "", "DESCRIPTORS_AMORPROT"], [12, 5, 1, "", "DESCRIPTORS_AVALON"], [12, 5, 1, "", "DESCRIPTORS_AVALON_NBITS"], [12, 5, 1, "", "DESCRIPTORS_COMPOSITE"], [12, 5, 1, "", "DESCRIPTORS_ECFP"], [12, 5, 1, "", "DESCRIPTORS_ECFPCOUNTS"], [12, 5, 1, "", "DESCRIPTORS_ECFPCOUNTS_RADIUS"], [12, 5, 1, "", "DESCRIPTORS_ECFPCOUNTS_USEFEATURES"], [12, 5, 1, "", "DESCRIPTORS_ECFP_NBITS"], [12, 5, 1, "", "DESCRIPTORS_ECFP_RADIUS"], [12, 5, 1, "", "DESCRIPTORS_JAZZY"], [12, 5, 1, "", "DESCRIPTORS_JAZZY_JAZZYNAMES"], [12, 5, 1, "", "DESCRIPTORS_MACCSKEYS"], [12, 5, 1, "", "DESCRIPTORS_MAPC"], [12, 5, 1, "", "DESCRIPTORS_MAPC_MAXRADIUS"], [12, 5, 1, "", "DESCRIPTORS_MAPC_NPERMUTATIONS"], [12, 5, 1, "", "DESCRIPTORS_PATHFP"], [12, 5, 1, "", "DESCRIPTORS_PATHFP_FPSIZE"], [12, 5, 1, "", "DESCRIPTORS_PATHFP_MAXPATH"], [12, 5, 1, "", "DESCRIPTORS_PHYSCHEM"], [12, 5, 1, "", "DESCRIPTORS_PHYSCHEM_RDKITNAMES"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED_FILE"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED_INPUT_COLUMNN"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED_RESPONSE_COLUMN"], [12, 5, 1, "", "DESCRIPTORS_SCALED"], [12, 5, 1, "", "DESCRIPTORS_SCALED_DESCRIPTOR"], [12, 5, 1, "", "DESCRIPTORS_SCALED_DESCRIPTOR_PARAMETERS"], [12, 5, 1, "", "DESCRIPTORS_SMILES"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI_AUX_WEIGHT_PC"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI_FILE"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI_INPUT_COLUMN"], [12, 5, 1, "", "DESCRIPTORS_UNSC_JAZZY"], [12, 5, 1, "", "DESCRIPTORS_UNSC_MAPC"], [12, 5, 1, "", "DESCRIPTORS_UNSC_PHYSCHEM"], [12, 5, 1, "", "DESCRIPTORS_UNSC_ZSCALES"], [12, 5, 1, "", "DESCRIPTORS_ZSCALES"], [12, 5, 1, "", "GENERAL_DISABLED"], [12, 5, 1, "", "GENERAL_PARAMETERS"], [12, 5, 1, "", "SETTINGS"], [12, 5, 1, "", "SETTINGS_CROSS_VALIDATION"], [12, 5, 1, "", "SETTINGS_DIRECTION"], [12, 5, 1, "", "SETTINGS_MODE"], [12, 5, 1, "", "SETTINGS_MODE_CLASSIFICATION"], [12, 5, 1, "", "SETTINGS_MODE_REGRESSION"], [12, 5, 1, "", "SETTINGS_N_JOBS"], [12, 5, 1, "", "SETTINGS_N_TRIALS"], [12, 5, 1, "", "SETTINGS_SHUFFLE"], [12, 5, 1, "", "TASK"], [12, 5, 1, "", "TASK_BUILDING"], [12, 5, 1, "", "TASK_OPTIMIZATION"]], "optunaz.utils.enums.interface_enum": [[12, 1, 1, "", "InterfaceEnum"]], "optunaz.utils.enums.interface_enum.InterfaceEnum": [[12, 5, 1, "", "CALIBRATED_SET"], [12, 5, 1, "", "CHEMPROP_SET"], [12, 5, 1, "", "PRF_SET"], [12, 5, 1, "", "SKLEARN_SET"], [12, 5, 1, "", "XGBOOST_SET"]], "optunaz.utils.enums.model_runner_enum": [[12, 1, 1, "", "ModelRunnerDataframeEnum"]], "optunaz.utils.enums.model_runner_enum.ModelRunnerDataframeEnum": [[12, 5, 1, "", "SET"], [12, 5, 1, "", "SMILES"], [12, 5, 1, "", "TEST"], [12, 5, 1, "", "TRAIN"], [12, 5, 1, "", "Y_PRED"], [12, 5, 1, "", "Y_TRUE"]], "optunaz.utils.enums.objective_enum": [[12, 1, 1, "", "ObjectiveEnum"]], "optunaz.utils.enums.objective_enum.ObjectiveEnum": [[12, 5, 1, "", "ATTRIBUTE_TRIAL_TRAIN_SCORE"], [12, 5, 1, "", "EXTRA_COLUMN_BESTHIT"]], "optunaz.utils.enums.optimization_configuration_enum": [[12, 1, 1, "", "OptimizationConfigurationEnum"]], "optunaz.utils.enums.prediction_configuration_enum": [[12, 1, 1, "", "PredictionConfigurationEnum"]], "optunaz.utils.enums.prediction_configuration_enum.PredictionConfigurationEnum": [[12, 5, 1, "", "DATA_DATASET"]], "optunaz.utils.enums.return_values_enum": [[12, 1, 1, "", "SklearnReturnValueEnum"], [12, 1, 1, "", "XGBoostReturnValueEnum"]], "optunaz.utils.enums.return_values_enum.SklearnReturnValueEnum": [[12, 5, 1, "", "CROSS_VALIDATE_FIT_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_SCORE_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_TEST_SCORE"], [12, 5, 1, "", "CROSS_VALIDATE_TRAIN_SCORE"]], "optunaz.utils.enums.return_values_enum.XGBoostReturnValueEnum": [[12, 5, 1, "", "CROSS_VALIDATE_FIT_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_SCORE_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_TEST_SCORE"], [12, 5, 1, "", "CROSS_VALIDATE_TRAIN_SCORE"]], "optunaz.utils.enums.visualization_enum": [[12, 1, 1, "", "VisualizationEnum"]], "optunaz.utils.enums.visualization_enum.VisualizationEnum": [[12, 5, 1, "", "OPTUNA_SYSTEM_ATTRS_INTERMEDIATE_VALUES"], [12, 5, 1, "", "OPTUNA_SYSTEM_ATTRS_NUMBER"], [12, 5, 1, "", "OPTUNA_SYSTEM_ATTRS_TRIAL_ID"], [12, 5, 1, "", "VISUALIZATION"], [12, 5, 1, "", "VISUALIZATION_CLASSIFIER"], [12, 5, 1, "", "VISUALIZATION_FILE_FORMAT"], [12, 5, 1, "", "VISUALIZATION_OUTPUT_FOLDER"], [12, 5, 1, "", "VISUALIZATION_PLOTS"], [12, 5, 1, "", "VISUALIZATION_PLOTS_CONTOUR"], [12, 5, 1, "", "VISUALIZATION_PLOTS_HISTORY"], [12, 5, 1, "", "VISUALIZATION_PLOTS_PARALLEL_COORDINATE"], [12, 5, 1, "", "VISUALIZATION_PLOTS_SLICE"], [12, 5, 1, "", "VISUALIZATION_REGRESSOR"], [12, 5, 1, "", "VISUALIZATION_USE_XVFB"]], "optunaz.utils.files_paths": [[11, 4, 1, "", "attach_root_path"], [11, 4, 1, "", "move_up_directory"]], "optunaz.utils.load_json": [[11, 4, 1, "", "loadJSON"]], "optunaz.utils.mlflow": [[11, 1, 1, "", "MLflowCallback"], [11, 4, 1, "", "add_ellipsis"], [11, 4, 1, "", "shorten_names"]], "optunaz.utils.mlflow.MLflowCallback": [[11, 5, 1, "", "optconfig"], [11, 3, 1, "", "prepare_tags"], [11, 3, 1, "", "tmp_buildconfig"], [11, 5, 1, "", "tracking_uri"], [11, 5, 1, "", "trial_number_offset"]], "optunaz.utils.preprocessing": [[13, 0, 0, "-", "deduplicator"], [13, 0, 0, "-", "splitter"], [13, 0, 0, "-", "transform"]], "optunaz.utils.preprocessing.deduplicator": [[13, 1, 1, "", "Deduplicator"], [13, 1, 1, "", "KeepAllNoDeduplication"], [13, 1, 1, "", "KeepAvg"], [13, 1, 1, "", "KeepFirst"], [13, 1, 1, "", "KeepLast"], [13, 1, 1, "", "KeepMax"], [13, 1, 1, "", "KeepMedian"], [13, 1, 1, "", "KeepMin"], [13, 1, 1, "", "KeepRandom"]], "optunaz.utils.preprocessing.deduplicator.Deduplicator": [[13, 3, 1, "", "dedup"]], "optunaz.utils.preprocessing.deduplicator.KeepAllNoDeduplication": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepAvg": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepFirst": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepLast": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepMax": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepMedian": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepMin": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepRandom": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"], [13, 5, 1, "", "seed"]], "optunaz.utils.preprocessing.splitter": [[13, 1, 1, "", "GroupingSplitter"], [13, 1, 1, "", "HistogramStratifiedShuffleSplit"], [13, 1, 1, "", "KFold"], [13, 1, 1, "", "NoSplitting"], [14, 1, 1, "", "Predefined"], [14, 1, 1, "", "Random"], [14, 1, 1, "", "ScaffoldSplit"], [13, 1, 1, "", "SklearnSplitter"], [13, 1, 1, "", "Splitter"], [14, 1, 1, "", "Stratified"], [14, 1, 1, "", "Temporal"], [13, 4, 1, "", "butina_cluster"], [13, 4, 1, "", "fd_bin"], [13, 4, 1, "", "stratify"]], "optunaz.utils.preprocessing.splitter.GroupingSplitter": [[13, 3, 1, "", "groups"]], "optunaz.utils.preprocessing.splitter.HistogramStratifiedShuffleSplit": [[13, 5, 1, "", "bins"], [13, 3, 1, "", "get_n_splits"], [13, 5, 1, "", "n_splits"], [13, 5, 1, "", "random_state"], [13, 3, 1, "", "split"], [13, 5, 1, "", "test_fraction"]], "optunaz.utils.preprocessing.splitter.KFold": [[13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 5, 1, "", "random_state"], [13, 5, 1, "", "shuffle"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.NoSplitting": [[13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Predefined": [[13, 5, 1, "", "column_name"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 3, 1, "", "groups"], [13, 5, 1, "", "name"], [14, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Random": [[13, 5, 1, "", "fraction"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 5, 1, "", "seed"]], "optunaz.utils.preprocessing.splitter.ScaffoldSplit": [[13, 5, 1, "", "bins"], [13, 5, 1, "", "butina_cluster"], [13, 3, 1, "", "get_n_splits"], [13, 3, 1, "", "get_sklearn_splitter"], [14, 3, 1, "", "groups"], [13, 5, 1, "", "make_scaffold_generic"], [13, 5, 1, "", "name"], [13, 5, 1, "", "random_state"], [14, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.SklearnSplitter": [[13, 3, 1, "", "get_n_splits"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Splitter": [[13, 3, 1, "", "get_sklearn_splitter"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Stratified": [[13, 5, 1, "", "bins"], [13, 5, 1, "", "fraction"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 5, 1, "", "seed"]], "optunaz.utils.preprocessing.splitter.Temporal": [[13, 5, 1, "", "fraction"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [14, 3, 1, "", "split"]], "optunaz.utils.preprocessing.transform": [[13, 1, 1, "", "AmorProt"], [13, 1, 1, "", "AuxTransformer"], [13, 1, 1, "", "DataTransform"], [13, 6, 1, "", "DataTransformError"], [13, 1, 1, "", "LogBase"], [13, 1, 1, "", "LogNegative"], [15, 1, 1, "", "ModelDataTransform"], [15, 1, 1, "", "PTRTransform"], [15, 1, 1, "", "VectorFromColumn"], [15, 1, 1, "", "ZScales"]], "optunaz.utils.preprocessing.transform.AmorProt": [[13, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.AuxTransformer": [[13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.DataTransform": [[13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.LogBase": [[13, 5, 1, "", "LOG"], [13, 5, 1, "", "LOG10"], [13, 5, 1, "", "LOG2"]], "optunaz.utils.preprocessing.transform.LogNegative": [[13, 5, 1, "", "FALSE"], [13, 5, 1, "", "TRUE"]], "optunaz.utils.preprocessing.transform.ModelDataTransform": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "base_dict"], [13, 5, 1, "", "base_negation"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 5, 1, "", "reverse_dict"], [13, 3, 1, "", "reverse_transform"], [13, 3, 1, "", "reverse_transform_df"], [13, 3, 1, "", "reverse_transform_one"], [13, 3, 1, "", "transform"], [13, 3, 1, "", "transform_df"], [13, 3, 1, "", "transform_one"]], "optunaz.utils.preprocessing.transform.ModelDataTransform.Parameters": [[13, 5, 1, "", "base"], [13, 5, 1, "", "conversion"], [13, 5, 1, "", "negation"]], "optunaz.utils.preprocessing.transform.PTRTransform": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "reverse_transform"], [13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.PTRTransform.Parameters": [[13, 5, 1, "", "std"], [13, 5, 1, "", "threshold"]], "optunaz.utils.preprocessing.transform.VectorFromColumn": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.VectorFromColumn.Parameters": [[13, 5, 1, "", "delimiter"]], "optunaz.utils.preprocessing.transform.ZScales": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "transform"]], "optunaz.utils.retraining": [[11, 6, 1, "", "NoDifferingRetrainingData"], [11, 6, 1, "", "NoNewRetrainingData"], [11, 6, 1, "", "NoPreviousModel"], [11, 6, 1, "", "NoRetrainingDataConvention"], [11, 6, 1, "", "RetrainingHeadersIssue"], [11, 6, 1, "", "RetrainingIsAlreadyProcessed"], [11, 6, 1, "", "RetrainingIsLocked"], [11, 6, 1, "", "SamePreviousModel"], [11, 6, 1, "", "SlurmJobSkip"], [11, 6, 1, "", "SlurmMemoryExceeded"], [11, 6, 1, "", "SlurmNoLog"], [11, 6, 1, "", "SlurmParseError"], [11, 6, 1, "", "SlurmTimeLimitExceeded"], [11, 6, 1, "", "TemporalPredsPredicted"], [11, 6, 1, "", "TimepointSkipped"]], "optunaz.utils.schema": [[11, 4, 1, "", "add_boolean_guards_for_schema_properties"], [11, 4, 1, "", "addsibling"], [11, 4, 1, "", "addtitles"], [11, 4, 1, "", "copytitle"], [11, 4, 1, "", "create_dependency"], [11, 4, 1, "", "delsibling"], [11, 4, 1, "", "getref"], [11, 4, 1, "", "remove_schema_properties"], [11, 4, 1, "", "replaceenum"], [11, 4, 1, "", "replacekey"], [11, 4, 1, "", "replacevalue"]], "optunaz.utils.tracking": [[11, 1, 1, "", "BuildTrackingData"], [11, 1, 1, "", "Datapoint"], [11, 1, 1, "", "InternalTrackingCallback"], [11, 1, 1, "", "TrackingData"], [11, 4, 1, "", "get_authorization_header"], [11, 4, 1, "", "removeprefix"], [11, 4, 1, "", "round_scores"], [11, 4, 1, "", "track_build"]], "optunaz.utils.tracking.BuildTrackingData": [[11, 5, 1, "", "response_column_name"], [11, 5, 1, "", "test_points"], [11, 5, 1, "", "test_scores"]], "optunaz.utils.tracking.Datapoint": [[11, 5, 1, "", "expected"], [11, 5, 1, "", "predicted"], [11, 5, 1, "", "smiles"]], "optunaz.utils.tracking.InternalTrackingCallback": [[11, 5, 1, "", "optconfig"], [11, 5, 1, "", "trial_number_offset"]], "optunaz.utils.tracking.TrackingData": [[11, 5, 1, "", "all_cv_test_scores"], [11, 5, 1, "", "buildconfig"], [11, 5, 1, "", "scoring"], [11, 5, 1, "", "trial_number"], [11, 5, 1, "", "trial_state"], [11, 5, 1, "", "trial_value"]], "optunaz.visualizer": [[9, 1, 1, "", "Visualizer"]], "optunaz.visualizer.Visualizer": [[9, 3, 1, "", "plot_by_configuration"], [9, 3, 1, "", "plot_contour"], [9, 3, 1, "", "plot_history"], [9, 3, 1, "", "plot_parallel_coordinate"], [9, 3, 1, "", "plot_slice"]]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:property", "3": "py:method", "4": "py:function", "5": "py:attribute", "6": "py:exception"}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "property", "Python property"], "3": ["py", "method", "Python method"], "4": ["py", "function", "Python function"], "5": ["py", "attribute", "Python attribute"], "6": ["py", "exception", "Python exception"]}, "titleterms": {"qsartuna": [0, 4, 7, 8], "\ud80c\udd9b": 0, "qsar": 0, "us": 0, "optim": [0, 6, 7], "hyperparamet": 0, "tune": 0, "formerli": 0, "optuna": 0, "az": 0, "qptuna": [0, 6], "background": [0, 6, 7], "The": [0, 6, 7], "three": [0, 6, 7], "step": [0, 6, 7], "process": [0, 6, 7], "json": 0, "base": [0, 8], "command": 0, "line": 0, "interfac": 0, "configur": [0, 6, 7], "file": [0, 6, 7], "run": [0, 6, 7], "from": [0, 6, 7, 8], "python": 0, "jupyt": 0, "notebook": 0, "via": 0, "cli": [0, 6, 7], "submit": 0, "slurm": 0, "model": [0, 6, 7], "option": [0, 6, 7], "inspect": 0, "automl": [0, 6, 7, 9], "automat": 0, "machin": 0, "learn": [0, 6, 7], "ad": 0, "descriptor": [0, 3, 6, 7, 9], "algorithm": [0, 1, 6, 7], "avail": [1, 2, 3, 14, 15], "adaboostclassifi": 1, "lasso": 1, "kneighborsclassifi": 1, "kneighborsregressor": 1, "logisticregress": 1, "plsregress": 1, "randomforestclassifi": 1, "randomforestregressor": 1, "ridg": 1, "svc": 1, "svr": 1, "xgbregressor": 1, "prfclassifi": 1, "chempropregressor": 1, "chempropclassifi": 1, "chemprophyperoptclassifi": 1, "chemprophyperoptregressor": 1, "chempropregressorpretrain": 1, "calibratedclassifiercvwithva": 1, "mapi": [1, 6, 7], "dedupl": [2, 8, 13], "keepfirst": 2, "keeplast": 2, "keeprandom": 2, "keepmin": 2, "keepmax": 2, "keepavg": 2, "keepmedian": 2, "keepkeepallnodedupl": 2, "avalon": 3, "ecfp": 3, "ecfp_count": 3, "pathfp": 3, "maccs_kei": 3, "unscaledphyschemdescriptor": 3, "unscaledjazzydescriptor": 3, "unscaledzscalesdescriptor": 3, "physchemdescriptor": 3, "jazzydescriptor": 3, "precomputeddescriptorfromfil": 3, "zscale": [3, 15], "smilesfromfil": 3, "smilesandsideinfofromfil": 3, "scaleddescriptor": 3, "compositedescriptor": 3, "welcom": 4, "document": 4, "develop": 4, "optunaz": [5, 9, 10, 11, 12, 13], "tutori": [6, 7], "thi": [6, 7], "prepar": [6, 7], "regress": [6, 7], "exampl": [6, 7], "creat": [6, 7], "visual": [6, 7, 9], "progress": [6, 7], "pick": [6, 7], "best": [6, 7, 8], "trial": [6, 7], "build": [6, 7], "merg": [6, 7], "preprocess": [6, 7, 8, 13], "split": [6, 7, 8], "data": [6, 7, 8], "train": [6, 7], "test": [6, 7], "set": [6, 7], "remov": [6, 7], "duplic": [6, 7, 8], "dataset": [6, 7], "choos": [6, 7], "score": [6, 7], "function": [6, 7], "advanc": [6, 7], "functoinail": [6, 7], "probabilist": [6, 7, 8], "random": [6, 7, 8, 14], "forest": [6, 7], "prf": [6, 7], "interlud": [6, 7, 8], "cautionari": [6, 7], "advic": [6, 7], "y": [6, 7], "respons": [6, 7], "column": [6, 7], "valid": [6, 7], "chemprop": [6, 7], "simpl": [6, 7], "separ": [6, 7], "shallow": [6, 7], "method": [6, 7], "default": [6, 7], "behavior": [6, 7], "turn": [6, 7], "hyperopt": [6, 7], "within": [6, 7, 8], "functionail": [6, 7], "veri": [6, 7], "larg": [6, 7], "comput": [6, 7], "cost": [6, 7], "A": [6, 7], "note": [6, 7], "mpnn": [6, 7], "search": [6, 7], "space": [6, 7], "side": [6, 7], "inform": [6, 7], "multi": [6, 7], "task": [6, 7], "mtl": [6, 7], "combin": [6, 7], "onli": [6, 7], "recommend": [6, 7], "long": [6, 7], "time": [6, 7], "pre": [6, 7], "adapt": [6, 7], "transfer": [6, 7], "fingerprint": [6, 7], "encod": [6, 7], "latent": [6, 7], "represent": [6, 7, 8], "probabl": [6, 7], "calibr": [6, 7], "classif": [6, 7], "uncertainti": [6, 7], "estim": [6, 7], "vennab": [6, 7], "ensembl": [6, 7], "dropout": [6, 7], "explain": [6, 7, 9], "shap": [6, 7], "interpret": [6, 7], "log": [6, 7, 8], "transform": [6, 7, 8, 13, 15], "covari": [6, 7], "one": [6, 7], "e": [6, 7], "g": [6, 7], "dose": [6, 7], "point": [6, 7], "co": [6, 7], "variat": [6, 7], "proteochemometr": [6, 7], "pcm": [6, 7], "more": [6, 7], "vectorfromsmil": [6, 7], "z": [6, 7], "scale": [6, 7], "object": [6, 7, 9], "priorit": [6, 7], "perform": [6, 7, 8], "standard": [6, 7], "deviat": [6, 7], "further": [6, 7], "precomput": [6, 7], "autom": [6, 7], "retrain": [6, 7, 11], "overview": [6, 7], "high": [6, 7], "hpc": [6, 7], "setup": [6, 7], "extract": [6, 7], "walkthough": [6, 7], "an": [6, 7], "pipelin": 7, "schedul": 7, "daemon": 7, "up": 7, "date": 7, "introduct": 8, "translat": 8, "sdf": 8, "csv": 8, "need": 8, "deal": 8, "compar": 8, "differ": 8, "strategi": 8, "tempor": [8, 14], "stratifi": [8, 14], "scaffold": 8, "input": 8, "user": 8, "import": 8, "logarithm": 8, "dataread": [8, 9], "threshold": 8, "ptr": [8, 15], "experiment": 8, "error": 8, "definit": 8, "implement": 8, "conclus": 8, "calcul": 8, "evalu": [8, 9], "reproduc": 8, "practic": 8, "packag": [9, 10, 11, 12, 13], "subpackag": [9, 11], "submodul": [9, 10, 11, 12, 13], "modul": [9, 10, 11, 12, 13], "builder": 9, "metirc": 9, "model_writ": 9, "optbuild": 9, "predict": 9, "schemagen": 9, "three_step_opt_build_merg": 9, "content": [9, 10, 11, 12, 13], "config": 10, "build_from_opt": 10, "buildconfig": 10, "optconfig": 10, "util": [11, 12, 13], "files_path": 11, "load_json": 11, "mlflow": 11, "schema": 11, "track": 11, "enum": 12, "building_configuration_enum": 12, "configuration_enum": 12, "interface_enum": 12, "model_runner_enum": 12, "objective_enum": 12, "optimization_configuration_enum": 12, "prediction_configuration_enum": 12, "return_values_enum": 12, "visualization_enum": 12, "splitter": [13, 14], "predefin": 14, "scaffoldsplit": 14, "modeldatatransform": 15, "vectorfromcolumn": 15}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "nbsphinx": 4, "sphinx.ext.todo": 2, "sphinx.ext.viewcode": 1, "sphinx": 56}}) \ No newline at end of file +Search.setIndex({"docnames": ["README", "algorithms", "deduplicator", "descriptors", "index", "modules", "notebooks/QPTUNA_Tutorial", "notebooks/QSARtuna_Tutorial", "notebooks/preprocess_data", "optunaz", "optunaz.config", "optunaz.utils", "optunaz.utils.enums", "optunaz.utils.preprocessing", "splitters", "transform"], "filenames": ["README.md", "algorithms.rst", "deduplicator.rst", "descriptors.rst", "index.rst", "modules.rst", "notebooks/QPTUNA_Tutorial.ipynb", "notebooks/QSARtuna_Tutorial.ipynb", "notebooks/preprocess_data.ipynb", "optunaz.rst", "optunaz.config.rst", "optunaz.utils.rst", "optunaz.utils.enums.rst", "optunaz.utils.preprocessing.rst", "splitters.rst", "transform.rst"], "titles": ["QSARtuna \ud80c\udd9b: QSAR using Optimization for Hyperparameter Tuning (formerly Optuna AZ and QPTUNA)", "Available algorithms", "Available deduplicators", "Available descriptors", "Welcome to QSARtuna Documentation!", "optunaz", "QPTUNA CLI Tutorial", "QSARtuna CLI Tutorial", "Preprocessing data for QSARtuna", "optunaz package", "optunaz.config package", "optunaz.utils package", "optunaz.utils.enums package", "optunaz.utils.preprocessing package", "Available splitters", "Available transform"], "terms": {"build": [0, 4, 8, 9, 10, 11, 12], "predict": [0, 1, 3, 5, 6, 7, 8, 10, 11, 12], "compchem": 0, "develop": [0, 3, 7, 9], "uncertainti": [0, 1, 4, 8, 9, 10, 13, 15], "quantif": 0, "explain": [0, 1, 4, 5, 10], "mind": 0, "thi": [0, 1, 3, 4, 8, 9, 10, 11, 12, 13, 14], "librari": [0, 6, 7, 8], "search": [0, 1, 3, 9, 10], "best": [0, 1, 9, 10], "ml": [0, 4, 7, 10], "molecular": [0, 1, 3, 4, 6, 7, 8, 9, 10], "given": [0, 1, 3, 6, 7, 8, 9, 10, 11], "data": [0, 1, 3, 4, 9, 10, 11, 12, 13, 14, 15], "itself": [0, 6, 7], "done": [0, 6, 7], "emploi": [0, 3, 6, 7, 8, 9], "latest": [0, 9, 10], "state": [0, 6, 7, 13], "art": [0, 6, 7], "estim": [0, 1, 3, 4, 9, 10, 12], "packag": [0, 1, 3, 5, 6, 7, 8], "further": [0, 10], "document": [0, 6, 7, 8], "github": [0, 6, 7, 9, 13], "page": [0, 6], "here": [0, 3, 6, 7, 8, 9, 10, 13, 14], "public": [0, 1, 3, 4, 6, 7, 9, 10], "avail": [0, 4, 6, 7, 9, 11], "structur": [0, 1, 3, 6, 7, 8, 9, 10], "around": [0, 6, 7, 8], "train": [0, 1, 3, 4, 8, 9, 10, 11, 12, 13, 14], "mani": [0, 1, 6, 7, 10], "differ": [0, 1, 3, 6, 7, 9, 10, 11, 13], "paramet": [0, 1, 3, 6, 7, 8, 9, 10, 12, 13, 14, 15], "onli": [0, 1, 3, 8, 9, 10, 13, 14], "dataset": [0, 1, 8, 9, 10, 12, 13], "usual": [0, 1, 6, 7, 8, 10], "cross": [0, 1, 6, 7, 10, 13], "valid": [0, 1, 3, 8, 9, 10, 12, 13], "pick": 0, "evalu": [0, 4, 5, 6, 7], "its": [0, 1, 6, 7, 10, 12], "perform": [0, 3, 4, 9, 12, 13, 15], "test": [0, 1, 4, 8, 9, 10, 12, 13, 14], "prod": [0, 6, 7], "re": [0, 6, 7, 9], "merg": [0, 8, 9, 13], "ha": [0, 1, 6, 7, 8, 9, 10, 13], "drawback": [0, 6, 7], "left": [0, 6, 7, 8], "result": [0, 1, 3, 6, 7, 8, 9, 10], "big": [0, 6, 7], "benefit": [0, 6, 7], "final": [0, 1, 6, 7, 10], "all": [0, 1, 3, 6, 7, 8, 9, 10, 12, 13], "let": [0, 6, 7, 8], "s": [0, 6, 7, 8], "look": [0, 1, 6, 7, 8, 10], "trivial": 0, "exampl": [0, 3, 8, 9, 10], "weight": [0, 1, 3, 6, 7, 9, 10, 12], "set": [0, 3, 4, 8, 9, 10, 11, 12, 13, 14], "50": [0, 1, 3, 6, 7, 9, 10], "molecul": [0, 1, 3, 6, 7, 8, 9, 10, 13], "we": [0, 3, 6, 7, 8, 9, 10, 13, 14], "start": [0, 4, 6, 7, 8, 9], "format": [0, 3, 6, 7, 8, 9, 11], "It": [0, 1, 3, 6, 7, 8, 9, 10], "contain": [0, 3, 6, 7, 9, 11], "four": 0, "main": [0, 3, 6, 7, 8, 9], "section": [0, 6, 7, 8], "locat": [0, 6, 7], "column": [0, 3, 8, 9, 11, 12, 13, 14, 15], "detail": [0, 3, 6, 7, 8, 9, 10, 11], "about": [0, 6, 7, 8, 9], "which": [0, 1, 3, 6, 7, 8, 9, 10, 13], "below": [0, 3, 6, 7, 8, 9], "task": [0, 3, 8, 9, 10, 11, 12], "training_dataset_fil": [0, 6, 7, 8, 9], "drd2": [0, 6, 7], "subset": [0, 1, 6, 7, 8, 10], "csv": [0, 3, 4, 6, 7, 9], "input_column": [0, 3, 6, 7, 8, 9, 12], "canon": [0, 6, 7, 9, 13], "response_column": [0, 3, 6, 7, 8, 9, 12], "molwt": [0, 6, 7], "mode": [0, 6, 7, 9, 10, 12], "regress": [0, 1, 8, 10, 12, 13], "cross_valid": [0, 6, 7, 10, 12, 13], "5": [0, 1, 3, 6, 7, 8, 9, 10, 13], "direct": [0, 1, 6, 7, 10, 12], "maxim": [0, 1, 6, 7, 10], "n_trial": [0, 6, 7, 9, 10, 12], "100": [0, 1, 3, 6, 7, 8, 9, 10, 11], "n_startup_tri": [0, 6, 7, 9, 10], "30": [0, 1, 6, 7, 10], "name": [0, 1, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "ecfp": [0, 4, 6, 7, 9, 10, 12], "radiu": [0, 3, 6, 7, 9, 12], "3": [0, 1, 3, 4, 6, 7, 8, 9, 10], "nbit": [0, 3, 6, 7, 9, 10, 12], "2048": [0, 3, 6, 7, 9], "maccs_kei": [0, 4, 6, 7, 9, 12], "randomforestregressor": [0, 4, 6, 7, 10, 12], "max_depth": [0, 1, 10, 12], "low": [0, 1, 3, 6, 7, 8, 9, 10, 12], "2": [0, 1, 3, 4, 6, 7, 8, 9, 10, 13, 14], "high": [0, 1, 3, 4, 9, 10, 12], "32": [0, 1, 6, 7, 10], "n_estim": [0, 1, 6, 7, 10, 12], "10": [0, 1, 3, 6, 7, 8, 9, 10, 13], "250": [0, 1, 6, 7, 10], "max_featur": [0, 1, 10, 12], "auto": [0, 1, 6, 7, 9, 10], "ridg": [0, 4, 6, 7, 10, 12], "alpha": [0, 1, 6, 7, 8, 9, 10, 12], "0": [0, 1, 3, 6, 7, 8, 9, 10, 11, 13, 14], "lasso": [0, 4, 6, 7, 10, 12], "xgbregressor": [0, 4, 6, 7, 10, 12], "learning_r": [0, 1, 10, 12], "1": [0, 1, 3, 4, 6, 7, 8, 9, 10, 11, 13, 14], "specifi": [0, 1, 6, 7, 8, 9, 10, 12], "In": [0, 1, 3, 6, 7, 8, 9, 10], "rel": [0, 6, 7], "path": [0, 1, 3, 6, 7, 8, 9, 10, 11], "folder": [0, 6, 7, 8], "ar": [0, 1, 3, 6, 7, 8, 9, 10, 12, 13, 14], "want": [0, 6, 7, 8], "fold": [0, 1, 6, 7, 8, 10, 13, 14], "valu": [0, 1, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "object": [0, 1, 5, 8, 10, 11, 12, 13], "function": [0, 1, 3, 4, 8, 9, 10, 11, 12, 13, 15], "standard": [0, 1, 8, 10, 13, 15], "scikit": [0, 6, 7, 9, 13, 14], "have": [0, 3, 6, 7, 8, 9, 10, 13], "total": [0, 6, 7, 8], "trial": [0, 1, 10, 11, 12], "first": [0, 1, 3, 6, 7, 8, 9, 10, 13], "startup": [0, 6, 7], "should": [0, 1, 3, 6, 7, 8, 9, 10, 11, 13], "random": [0, 1, 4, 10, 13], "explor": [0, 6, 7], "get": [0, 6, 7, 8, 9], "stuck": 0, "earli": [0, 1, 6, 7, 9, 10], "one": [0, 3, 8, 9, 10, 13, 14], "local": [0, 6, 7], "minimum": [0, 1, 3, 9, 10, 13, 14], "two": [0, 1, 6, 7, 8, 10, 13, 14], "free": [0, 3, 9], "pair": [0, 6, 7, 9], "ani": [0, 3, 6, 7, 8, 9, 10, 13], "when": [0, 1, 6, 7, 8, 9, 10, 11, 13, 14], "our": [0, 6, 7, 8], "time": [0, 1, 3, 8, 9, 10, 11], "creat": [0, 8, 9, 11], "conda": [0, 7], "environ": [0, 3, 6, 7, 9], "instal": [0, 6, 7], "modul": [0, 5, 6, 7], "purg": 0, "load": [0, 1, 6, 7, 8, 9, 10], "miniconda3": [0, 7], "my_env_with_qsartuna": [0, 7], "pip": [0, 6, 7], "activ": [0, 1, 6, 7, 8, 9, 10, 12, 13, 15], "just": [0, 6, 7], "case": [0, 1, 6, 7, 8, 9, 10], "check": [0, 6, 7, 9, 12, 13], "output": [0, 1, 6, 7, 8, 9, 10, 13, 15], "m": [0, 6, 7, 9, 11], "http": [0, 3, 6, 7, 8, 9, 10, 13], "com": [0, 6, 7, 8, 9, 13], "molecularai": [0, 7], "releas": [0, 4, 6, 7], "download": [0, 7], "tar": [0, 6, 7], "gz": [0, 6, 7], "Then": [0, 6, 7], "you": [0, 1, 6, 7, 8, 10], "can": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "insid": [0, 9], "your": [0, 6, 7, 8], "three_step_opt_build_merg": [0, 5, 6, 7], "import": [0, 6, 7], "buildconfig_best": [0, 6, 7, 9], "build_best": [0, 6, 7, 9], "build_merg": [0, 6, 7, 9], "config": [0, 1, 5, 6, 7, 9], "modelmod": [0, 6, 7, 9, 10], "optimizationdirect": [0, 6, 7, 10], "optconfig": [0, 1, 5, 6, 7, 9, 11, 12], "optimizationconfig": [0, 6, 7, 9, 10], "svr": [0, 4, 6, 7, 10, 12], "randomforest": 0, "pl": [0, 1, 10], "dataread": [0, 5, 6, 7], "ecfp_count": [0, 4, 6, 7, 9, 12], "prepar": [0, 4, 8, 9], "new": [0, 1, 3, 6, 7, 8, 9, 10, 11], "studi": [0, 3, 6, 7, 9, 10, 11, 12], "study_nam": [0, 6, 7, 9], "my_studi": [0, 6, 7], "make": [0, 1, 6, 7, 8, 9, 10, 13, 14, 15], "buildconfig": [0, 5, 6, 7, 9, 11], "write": [0, 6, 7, 9], "out": [0, 1, 6, 7, 8, 10], "print": [0, 6, 7, 8], "dump": [0, 6, 7], "indent": [0, 6, 7], "save": [0, 6, 7], "target": [0, 1, 6, 7, 8, 10, 13, 15], "pkl": [0, 1, 6, 7, 10], "deploi": 0, "directli": [0, 6, 7, 8], "To": [0, 6, 7, 8], "follow": [0, 3, 6, 7, 8, 9, 10, 11], "syntax": 0, "schemagen": [0, 5], "regression_drd2_50": 0, "outpath": 0, "accept": [0, 6, 7, 8], "argument": [0, 6, 7, 9], "shell": 0, "h": [0, 3, 6, 7, 8, 9], "usag": [0, 6, 7], "best_buildconfig_outpath": 0, "best_model_outpath": 0, "merged_model_outpath": 0, "cach": [0, 3, 6, 7, 9, 10], "optbuild": [0, 5], "hyper": [0, 6, 7, 10], "help": [0, 6, 7], "show": [0, 6, 7, 8], "messag": [0, 1, 6, 7, 10, 11], "exit": [0, 6, 7], "where": [0, 1, 6, 7, 8, 10], "persist": 0, "turn": [0, 10, 13, 14], "off": [0, 1, 6, 7, 8, 10, 13, 14], "gener": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "requir": [0, 3, 6, 7, 8, 9], "input": [0, 1, 3, 4, 6, 7, 9, 10, 11, 13, 14, 15], "either": [0, 3, 8, 9, 10], "sinc": [0, 3, 6, 7, 8, 9, 13], "long": [0, 8], "avoid": [0, 6, 7, 8, 13], "login": 0, "node": 0, "queue": [0, 6, 7], "instead": [0, 1, 3, 6, 7, 8, 9, 10, 13], "script": [0, 6, 7, 9], "give": [0, 6, 7], "sbatch": [0, 6, 7], "bin": [0, 6, 7, 8, 11, 13, 14], "sh": [0, 6, 7, 11], "ntask": 0, "cpu": [0, 6, 7, 9], "per": [0, 1, 8, 9, 10], "mem": [0, 6, 7, 9], "4g": 0, "partit": [0, 6, 7], "core": [0, 6, 7, 8, 10], "illustr": [0, 6, 7, 8], "how": [0, 1, 3, 6, 7, 8, 9, 10], "chose": 0, "chang": [0, 6, 7], "directori": [0, 6, 7, 9, 11], "cd": 0, "project_fold": 0, "project": [0, 1, 10], "dir": [0, 9], "complet": [0, 3, 6, 7, 9], "pickl": [0, 6, 7], "home": 0, "under": [0, 6, 7], "built": [0, 3, 8, 9, 10], "infer": [0, 3, 6, 7, 8, 9], "smile": [0, 3, 6, 7, 8, 9, 11, 12, 13, 14], "note": [0, 1, 3, 4, 8, 9, 10, 12, 13, 14], "varieti": [0, 6, 7], "model_fil": 0, "input_smiles_csv_fil": 0, "input_smiles_csv_column": [0, 6, 7], "aux": [0, 6, 7, 9, 11], "input_aux_column": 0, "precomput": [0, 3, 8, 9], "input_precomputed_fil": 0, "input_precomputed_input_column": 0, "respons": [0, 3, 8, 9], "input_precomputed_response_column": 0, "output_prediction_csv_column": 0, "output_prediction_csv_fil": 0, "uncertainty_quantil": 0, "optunaaz": 0, "auxiliari": [0, 3, 6, 7, 9, 13, 15], "filenam": [0, 6, 7, 9, 11], "identifi": [0, 3, 6, 7, 8, 9], "must": [0, 1, 6, 7, 10], "provid": [0, 1, 3, 6, 7, 8, 9, 10, 13], "shap": [0, 9], "chemprop": [0, 1, 3, 4, 9, 10], "appli": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14, 15], "threshold": [0, 1, 3, 4, 6, 7, 9, 10, 13, 14, 15], "tri": 0, "dure": [0, 1, 3, 6, 7, 8, 9, 10], "mlflow": [0, 5, 9, 12], "track": [0, 3, 5, 6, 7, 9, 10], "ui": 0, "open": [0, 1, 6, 7, 9, 10], "link": 0, "browser": 0, "If": [0, 1, 3, 6, 7, 9, 10, 13, 14], "scp": [0, 6], "forward": [0, 1, 10], "port": 0, "separ": [0, 3, 8, 9], "ssh": 0, "session": 0, "non": [0, 1, 3, 6, 7, 8, 9, 10], "n": [0, 1, 6, 7, 8, 10, 11], "l": 0, "localhost": 0, "5000": 0, "user": [0, 1, 3, 4, 6, 7, 9, 10, 12, 13, 14, 15], "intranet": 0, "net": [0, 6], "execut": 0, "select": [0, 1, 3, 6, 7, 8, 9, 10], "experi": [0, 8, 11], "after": [0, 1, 3, 6, 7, 8, 9, 10, 11], "choos": [0, 4], "compar": [0, 6, 7], "comparison": [0, 6, 7, 8], "call": [0, 1, 3, 6, 7, 9, 10, 13], "well": [0, 6, 7, 8], "metric": [0, 1, 6, 7, 9, 10, 12], "At": 0, "bottom": 0, "plot": [0, 6, 7, 8, 10, 12], "For": [0, 1, 3, 6, 7, 8, 9, 10, 13], "x": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "axi": [0, 6, 7, 8], "_": [0, 6, 7], "number": [0, 1, 3, 6, 7, 8, 9, 10, 11], "y": [0, 1, 8, 9, 10, 11, 13, 14], "cvmean": 0, "r2": [0, 6, 7, 8, 10], "more": [0, 1, 3, 8, 9, 10, 11], "click": 0, "individu": [0, 1, 6, 7, 8, 10], "There": [0, 1, 6, 7, 8, 10], "access": [0, 3, 9], "an": [0, 1, 3, 4, 8, 9, 10, 11, 13, 14], "daemon": [0, 4], "design": [0, 6, 7], "autom": [0, 4, 8], "dispatch": [0, 6, 7, 9], "job": [0, 6, 7, 8, 9, 11], "schedul": [0, 4, 6], "particularli": [0, 6, 7], "scientist": 0, "research": 0, "who": 0, "work": [0, 6, 7, 8], "larg": [0, 1, 8, 10], "need": [0, 4, 9], "distribut": [0, 1, 6, 7, 8, 10], "comput": [0, 1, 3, 4, 8, 9, 10, 13], "resourc": [0, 6, 7, 9], "code": [0, 3, 6, 7, 8, 9, 11], "streamlin": [0, 6, 7], "manag": 0, "submiss": 0, "while": [0, 3, 6, 7, 8, 9, 13], "ensur": [0, 6, 7, 8, 9, 10], "effici": [0, 6, 7], "scalabl": [0, 6, 7], "output_path": [0, 6, 7, 9], "email": [0, 6, 7, 9], "user_nam": [0, 6, 7, 9], "input_data": [0, 6, 7, 9], "input_activity_csv_column": [0, 6, 7], "input_task_csv_column": [0, 6, 7], "initi": [0, 6, 7, 8, 9, 10], "templat": [0, 6, 7], "input_initial_templ": [0, 6, 7], "retrain": [0, 4, 5, 9], "input_retrain_templ": [0, 6, 7], "input_slurm_templ": [0, 6, 7], "quorum": [0, 6, 7, 9], "n_core": [0, 6, 7, 9], "dry": [0, 6, 7], "v": [0, 6, 7], "req": [0, 6, 7], "slurm_req_cor": [0, 6, 7, 9], "slurm_req_mem": [0, 6, 7, 9], "slurm_req_partit": [0, 6, 7, 9], "al": [0, 3, 6, 7, 8, 9], "pool": [0, 6, 7], "slurm_al_pool": [0, 6, 7, 9], "slurm_al_smiles_csv_column": [0, 6, 7], "prefix": [0, 6, 7, 11], "slurm_job_prefix": [0, 6, 7, 9], "failur": [0, 6, 7, 9], "increment": [0, 6, 7], "slurm_failure_cores_incr": [0, 6, 7], "slurm_failure_mem_incr": [0, 6, 7], "min": [0, 1, 6, 7, 8, 10, 13], "slurm_failure_mins_incr": [0, 6, 7], "max": [0, 6, 7, 8, 13], "retri": [0, 6, 7], "slurm_failure_max_retri": [0, 6, 7], "slurm_failure_max_mem": [0, 6, 7], "slurm_failure_max_cpu": [0, 6, 7], "previou": [0, 6, 7, 11], "tempor": [0, 4, 6, 7, 9, 11, 13], "verbos": [0, 6, 7], "notif": [0, 6, 7], "prid": [0, 6], "multipl": [0, 3, 6, 7, 9, 13, 14], "wildcard": [0, 6, 7], "express": [0, 6, 7], "would": [0, 3, 6, 7, 8, 9, 11], "one_taskid": [0, 6, 7], "c": [0, 1, 3, 6, 7, 8, 9, 10, 12], "vvv": [0, 6, 7], "test_auto1": 0, "220": [0, 6, 7], "testaml": [0, 6, 7], "testpartit": [0, 7], "inform": [0, 1, 3, 9, 10, 11], "regard": 0, "add": [0, 6, 7, 8, 9, 11], "optunaz": [0, 1, 3, 6, 7, 8, 14, 15], "py": [0, 1, 6, 7, 8, 10], "like": [0, 1, 3, 6, 7, 8, 9, 10], "so": [0, 6, 7, 8, 10], "dataclass": [0, 11], "class": [0, 1, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "yournewdescriptor": 0, "rdkitdescriptor": [0, 9], "descript": [0, 9, 10], "goe": 0, "apischema": [0, 6, 7, 9], "type_nam": 0, "yournewdescriptorparam": 0, "pass": [0, 1, 3, 6, 7, 9, 10, 13], "exampleofaparamet": 0, "annot": [0, 6, 7, 9], "int": [0, 1, 3, 9, 10, 13, 14], "schema": [0, 5, 9, 12], "titl": [0, 1, 3, 6, 7, 8, 9, 10, 11, 13, 14, 15], "field": 0, "default": [0, 1, 8, 9, 10, 13, 14], "liter": [0, 9, 10, 13, 14], "def": [0, 6, 7, 8, 10], "calculate_from_smi": [0, 3, 6, 7, 9], "self": [0, 6, 7, 10], "smi": [0, 3, 9, 11], "str": [0, 1, 3, 6, 7, 9, 10, 11, 12, 13, 14, 15], "insert": [0, 8], "calcul": [0, 3, 6, 7, 9, 13, 14, 15], "fp": [0, 3, 6, 7, 9], "code_to_calculate_fp": 0, "return": [0, 3, 6, 7, 8, 9, 11, 12, 13, 14], "list": [0, 1, 3, 4, 6, 7, 8, 9, 10, 13, 15], "within": [0, 1, 3, 9, 10, 13, 14], "same": [0, 1, 6, 7, 8, 10, 11], "anyunscaleddescriptor": 0, "union": [0, 1, 3, 9, 10], "avalon": [0, 4, 9, 10, 12], "pathfp": [0, 4, 6, 7, 9, 12], "amorprotdescriptor": [0, 3, 9, 12], "precomputeddescriptorfromfil": [0, 4, 6, 7, 9, 12], "unscaledmapc": [0, 3, 9, 12], "unscaledphyschemdescriptor": [0, 4, 6, 7, 9, 12], "unscaledjazzydescriptor": [0, 4, 6, 7, 9, 12], "unscaledzscalesdescriptor": [0, 4, 9, 12], "compositecompatibledescriptor": 0, "scaleddescriptor": [0, 4, 9, 12], "mapc": [0, 3, 9, 12], "physchemdescriptor": [0, 4, 9, 12], "jazzydescriptor": [0, 4, 9, 12], "zscalesdescriptor": [0, 3, 9, 12], "now": [0, 6, 7, 8, 10], "consid": [0, 3, 6, 7, 9, 13, 14], "later": [0, 6, 7], "among": [0, 6, 7], "exist": [0, 3, 6, 9, 11], "youraglrotihm": 0, "youralgorithmparam": 0, "youralgorithmparameterint": 0, "metadata": [0, 6, 7, 9, 10, 11, 12], "youralgorithmparameterfloat": 0, "float": [0, 1, 6, 7, 8, 10, 11, 13, 14, 15], "0001": [0, 1, 10], "001": [0, 7], "parameter_int": 0, "parameter_float": 0, "fixed_int": 0, "priori": 0, "fix": [0, 9, 10], "runtim": [0, 3, 9], "optimis": [0, 3, 6, 7, 8, 9, 10, 11], "youralgorithm": 0, "b": [0, 6, 7, 8], "sens": [0, 3, 9], "refer": [0, 3, 6, 7, 9, 11, 12], "anyregressionalgorithm": 0, "regressor": [0, 1, 6, 7, 9, 10, 12], "plsregress": [0, 4, 6, 7, 10, 12], "kneighborsregressor": [0, 4, 6, 7, 10, 12], "prfclassifi": [0, 4, 6, 7, 10, 12], "chempropregressor": [0, 4, 6, 7, 10, 12], "chempropregressorpretrain": [0, 4, 6, 7, 10], "chemprophyperoptregressor": [0, 4, 6, 7, 10, 12], "anyclassificationalgorithm": 0, "adaboostclassifi": [0, 4, 6, 7, 10, 12], "kneighborsclassifi": [0, 4, 6, 7, 10, 12], "logisticregress": [0, 4, 6, 7, 10, 12], "randomforestclassifi": [0, 4, 6, 7, 10, 12], "svc": [0, 4, 6, 7, 10, 12], "chempropclassifi": [0, 4, 6, 7, 10, 12], "chemprophyperoptclassifi": [0, 4, 6, 7, 10, 12], "depend": [0, 1, 6, 7, 8, 10], "classifi": [0, 1, 6, 7, 9, 10, 12], "youralgorithmparamet": 0, "consist": [0, 6, 7], "youralgorihtm": 0, "examplealgorithm": 0, "expect": [0, 6, 7, 8, 11], "4": [0, 1, 3, 6, 7, 8, 9, 10, 13, 14], "build_from_opt": [0, 5, 9], "elif": 0, "statement": 0, "isinst": 0, "alg": [0, 9, 10], "opt": 0, "suggest_int": 0, "_encode_nam": 0, "encod": [0, 1, 9, 10], "string": [0, 3, 6, 7, 8, 9, 12, 13, 14, 15], "para": 0, "suggest_float": 0, "suggest": [0, 6, 7], "report": [0, 4, 6, 7, 8], "even": [0, 6, 7, 8], "instanti": 0, "8": [0, 6, 7, 8, 10], "sourc": [1, 3, 9, 10, 11, 12, 13, 14, 15], "adaboost": [1, 10], "meta": [1, 6, 7, 9, 10], "begin": [1, 6, 7, 8, 10, 13, 14], "fit": [1, 3, 6, 7, 8, 9, 10, 13], "origin": [1, 3, 6, 7, 8, 9, 10, 13], "addit": [1, 6, 7, 10], "copi": [1, 6, 7, 8, 10, 11], "incorrectli": [1, 10], "instanc": [1, 6, 7, 8, 9, 10], "adjust": [1, 10], "subsequ": [1, 6, 7, 10], "focu": [1, 10], "difficult": [1, 6, 7, 10], "adaboostclassifierparametersnestim": [1, 10], "adaboostclassifierparameterslearningr": [1, 10], "The": [1, 3, 8, 9, 10, 11, 13, 15], "maximum": [1, 3, 6, 7, 8, 9, 10, 13, 14], "boost": [1, 3, 9, 10], "termin": [1, 10], "perfect": [1, 10], "learn": [1, 3, 4, 8, 9, 10, 13, 14], "procedur": [1, 3, 6, 7, 8, 9, 10], "stop": [1, 6, 7, 10], "each": [1, 3, 6, 7, 8, 9, 10, 13], "classifierat": [1, 10], "iter": [1, 6, 7, 10, 13, 14], "A": [1, 3, 8, 9, 10], "higher": [1, 6, 7, 10], "rateincreas": [1, 10], "contribut": [1, 3, 6, 7, 9, 10], "trade": [1, 10], "between": [1, 6, 7, 8, 10, 11], "learning_rateand": [1, 10], "linear": [1, 8, 10], "model": [1, 3, 4, 8, 9, 10, 11, 13, 14, 15], "l1": [1, 10], "prior": [1, 8, 10], "regular": [1, 6, 7, 10], "spars": [1, 10], "coeffici": [1, 10], "tend": [1, 10], "prefer": [1, 10], "solut": [1, 6, 7, 10], "fewer": [1, 10], "zero": [1, 3, 9, 10], "effect": [1, 6, 7, 8, 10, 13], "reduc": [1, 6, 7, 10], "featur": [1, 3, 6, 7, 9, 10], "upon": [1, 6, 7, 10], "lassoparametersalpha": [1, 10], "constant": [1, 10], "multipli": [1, 10], "term": [1, 6, 7, 10], "control": [1, 6, 7, 8, 10, 13], "strength": [1, 3, 9, 10], "neg": [1, 6, 7, 8, 10], "i": [1, 3, 6, 7, 8, 9, 10, 11], "e": [1, 3, 8, 9, 10, 11, 13, 15], "inf": [1, 6, 7, 9, 10], "equival": [1, 10], "ordinari": [1, 10], "least": [1, 6, 7, 10], "squar": [1, 6, 7, 10], "solv": [1, 6, 7, 10], "linearregress": [1, 10], "numer": [1, 7, 8, 10], "reason": [1, 6, 7, 8, 9, 10], "us": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15], "advis": [1, 6, 7, 8, 10], "implement": [1, 3, 6, 7, 9, 10, 13], "k": [1, 6, 7, 8, 10, 13, 14], "nearest": [1, 6, 7, 10], "neighbor": [1, 6, 7, 10, 13, 14], "vote": [1, 10], "principl": [1, 10], "behind": [1, 6, 7, 10], "method": [1, 3, 8, 9, 10, 12, 13], "find": [1, 6, 7, 9, 10], "predefin": [1, 4, 10, 13, 15], "sampl": [1, 6, 7, 10, 13, 14], "closest": [1, 10], "distanc": [1, 6, 7, 9, 10], "point": [1, 8, 10, 13, 14], "label": [1, 6, 7, 8, 9, 10, 13, 14], "from": [1, 3, 4, 9, 10, 11, 13, 14, 15], "defin": [1, 3, 6, 7, 8, 9, 10, 11, 13], "despit": [1, 6, 7, 10], "simplic": [1, 10], "success": [1, 6, 7, 10], "classif": [1, 4, 8, 9, 10, 12, 13], "problem": [1, 6, 7, 8, 9, 10], "n_neighbor": [1, 10, 12], "kneighborsclassifierparametersn_neighbor": [1, 10], "kneighbor": [1, 10], "queri": [1, 6, 7, 8, 9, 10], "minkowski": [1, 6, 7, 10], "euclidean": [1, 10], "kneighborsregressorparametersn_neighbor": [1, 10], "logist": [1, 10], "rather": [1, 3, 6, 7, 8, 9, 10], "than": [1, 3, 6, 7, 8, 9, 10], "also": [1, 3, 6, 7, 8, 9, 10, 13], "known": [1, 3, 6, 7, 8, 9, 10], "literatur": [1, 10], "logit": [1, 10], "entropi": [1, 8, 10], "maxent": [1, 10], "log": [1, 4, 10, 11, 12, 13, 15], "probabl": [1, 4, 8, 10], "describ": [1, 3, 6, 7, 9, 10, 13], "possibl": [1, 6, 7, 8, 9, 10, 11, 13, 14], "outcom": [1, 10], "singl": [1, 6, 7, 10], "solver": [1, 10, 12], "logisticregressionparametersparameterc": [1, 10], "try": [1, 6, 7, 8, 10], "sag": [1, 10], "saga": [1, 10], "fast": [1, 6, 7, 10], "converg": [1, 6, 7, 10], "guarante": [1, 10], "approxim": [1, 6, 7, 10], "scale": [1, 3, 8, 9, 10, 13, 15], "preprocess": [1, 4, 9, 10, 11, 14, 15], "scaler": [1, 3, 9, 10], "invers": [1, 10], "posit": [1, 3, 6, 7, 9, 10], "support": [1, 6, 7, 9, 10], "vector": [1, 3, 6, 7, 9, 10, 13, 15], "machin": [1, 3, 4, 6, 7, 8, 9, 10], "smaller": [1, 6, 7, 10], "stronger": [1, 10], "decomposit": [1, 10], "partial": [1, 6, 7, 10], "form": [1, 3, 6, 7, 8, 9, 10, 13], "compon": [1, 3, 6, 7, 9, 10], "fundament": [1, 10], "relat": [1, 3, 6, 7, 8, 9, 10], "matric": [1, 10], "thei": [1, 3, 6, 7, 8, 9, 10], "latent": [1, 10], "variabl": [1, 6, 7, 8, 9, 10], "approach": [1, 3, 6, 7, 8, 9, 10], "covari": [1, 4, 9, 10], "space": [1, 8, 10, 13, 14], "multidimension": [1, 10], "varianc": [1, 6, 7, 8, 10], "other": [1, 6, 7, 8, 10, 13], "word": [1, 6, 7, 10], "both": [1, 6, 7, 8, 10], "lower": [1, 6, 7, 10], "dimension": [1, 10], "subspac": [1, 6, 7, 9, 10], "transform": [1, 4, 9, 10, 11], "n_compon": [1, 10, 12], "ncompon": [1, 10], "keep": [1, 6, 7, 8, 10, 13], "n_sampl": [1, 10], "n_featur": [1, 10], "n_target": [1, 10], "forest": [1, 4, 8, 10], "decis": [1, 6, 7, 8, 10, 13, 15], "tree": [1, 6, 7, 10], "variou": [1, 6, 7, 9, 10], "sub": [1, 6, 7, 10], "averag": [1, 3, 6, 7, 8, 9, 10, 13], "improv": [1, 3, 6, 7, 9, 10], "accuraci": [1, 6, 7, 10], "over": [1, 6, 7, 10], "randomforestclassifierparametersmaxdepth": [1, 10], "randomforestclassifierparametersnestim": [1, 6, 7, 10], "depth": [1, 6, 7, 10, 12], "considerwhen": [1, 10], "split": [1, 4, 9, 10, 13, 14, 15], "thenconsid": [1, 10], "sqrt": [1, 6, 7, 8, 10], "log2": [1, 8, 10, 13, 15], "randomforestregressorparametersmaxdepth": [1, 10], "randomforestregressorparametersnestim": [1, 10], "l2": [1, 10], "loss": [1, 3, 6, 7, 9, 10], "norm": [1, 8, 10], "tikhonov": [1, 10], "base": [1, 3, 4, 6, 7, 9, 10, 11, 12, 13, 14, 15], "libsvm": [1, 10], "quadrat": [1, 10], "mai": [1, 3, 6, 7, 8, 9, 10], "impract": [1, 10], "beyond": [1, 10], "ten": [1, 10], "thousand": [1, 10], "svcparametersparameterc": [1, 10], "1e": [1, 10], "gamma": [1, 10, 12], "proport": [1, 6, 7, 10], "strictli": [1, 10], "penalti": [1, 10], "kernel": [1, 10], "epsilon": [1, 10], "complex": [1, 6, 7, 10], "hard": [1, 3, 9, 10], "coupl": [1, 10], "10000": [1, 10], "svrparametersparameterc": [1, 10], "svrparametersgamma": [1, 10], "maxdepth": [1, 10], "nestim": [1, 10], "learningr": [1, 10], "xgboost": [1, 10, 12], "gradient": [1, 10], "stand": [1, 10], "extrem": [1, 6, 7, 10], "paper": [1, 3, 6, 7, 9, 10], "greedi": [1, 10], "friedman": [1, 10], "learner": [1, 10], "round": [1, 6, 7, 8, 10], "prf": [1, 4, 8, 10], "probabilist": [1, 4, 10], "seen": [1, 6, 7, 8, 10], "hybrid": [1, 6, 7, 10], "similar": [1, 3, 6, 7, 8, 9, 10, 13, 14], "take": [1, 3, 6, 7, 8, 9, 10, 13], "real": [1, 6, 7, 8, 10, 13, 14], "represent": [1, 3, 4, 9, 10], "ptr": [1, 4, 6, 7, 10, 13], "howev": [1, 3, 6, 7, 8, 9, 10], "belong": [1, 3, 6, 7, 8, 9, 10], "inact": [1, 6, 7, 8, 10, 13, 15], "use_py_gini": [1, 10, 12], "use_py_leaf": [1, 10, 12], "prfclassifierparametersmaxdepth": [1, 10], "prfclassifierparametersnestim": [1, 10], "min_py_sum_leaf": [1, 10, 12], "prfclassifierparametersminpysumleaf": [1, 10], "gini": [1, 10], "true": [1, 3, 6, 7, 8, 9, 10, 13, 14], "leav": [1, 10], "leaf": [1, 10], "allow": [1, 3, 6, 7, 8, 9, 10], "prune": [1, 6, 7, 10], "propag": [1, 10], "small": [1, 8, 9, 10], "thu": [1, 6, 7, 10], "pth": [1, 10], "scheme": [1, 10], "noisi": [1, 10], "deep": [1, 6, 7, 10], "properti": [1, 3, 6, 7, 8, 9, 10, 11], "network": [1, 3, 6, 7, 9, 10], "neural": [1, 6, 7, 9, 10], "d": [1, 3, 6, 7, 9, 10, 11], "mpnn": [1, 10], "graph": [1, 3, 6, 7, 9, 10], "feed": [1, 10], "ffnn": [1, 10], "multi": [1, 3, 9, 10], "layer": [1, 3, 6, 7, 9, 10], "perceptron": [1, 10], "wa": [1, 3, 6, 7, 9, 10, 11], "present": [1, 6, 7, 8, 10, 11], "analyz": [1, 6, 7, 10], "optuna": [1, 4, 6, 7, 9, 10, 11, 12], "optims": [1, 10], "hyperopt": [1, 10], "ensemble_s": [1, 6, 7, 10, 12], "epoch": [1, 6, 7, 10, 12], "aggreg": [1, 6, 7, 8, 10, 12, 13, 14], "aggregation_norm": [1, 6, 7, 10, 12], "chempropparametersaggregation_norm": [1, 10], "200": [1, 6, 7, 9, 10], "q": [1, 3, 6, 7, 9, 10, 12], "batch_siz": [1, 6, 7, 10, 12], "chempropparametersbatch_s": [1, 10], "chempropparametersdepth": [1, 10], "6": [1, 6, 7, 8, 10], "dropout": [1, 10, 12], "chempropparametersdropout": [1, 10], "04": [1, 6, 7, 10], "features_gener": [1, 6, 7, 10, 12], "ffn_hidden_s": [1, 6, 7, 10, 12], "chempropparametersffn_hidden_s": [1, 10], "300": [1, 6, 7, 10], "2400": [1, 10], "ffn_num_lay": [1, 6, 7, 10, 12], "chempropparametersffn_num_lay": [1, 10], "final_lr_ratio_exp": [1, 6, 7, 10, 12], "chempropparametersfinal_lr_ratio_exp": [1, 10], "hidden_s": [1, 6, 7, 10, 12], "chempropparametershidden_s": [1, 10], "init_lr_ratio_exp": [1, 6, 7, 10, 12], "chempropparametersinit_lr_ratio_exp": [1, 10], "max_lr_exp": [1, 6, 7, 10, 12], "chempropparametersmax_lr_exp": [1, 10], "warmup_epochs_ratio": [1, 6, 7, 10, 12], "chempropparameterswarmup_epochs_ratio": [1, 10], "ensembl": [1, 10, 12], "initialis": [1, 6, 7, 9, 10], "size": [1, 3, 6, 7, 8, 9, 10], "run": [1, 3, 4, 8, 9, 10, 11], "increas": [1, 6, 7, 8, 9, 10, 13, 14], "400": [1, 6, 7, 10], "sum": [1, 6, 7, 10], "atom": [1, 3, 6, 7, 9, 10, 13, 14], "divid": [1, 6, 7, 10], "up": [1, 3, 4, 6, 9, 10, 11], "batch": [1, 10, 13], "step": [1, 8, 9, 10], "visibl": [1, 10], "randomli": [1, 6, 7, 8, 10], "some": [1, 3, 6, 7, 8, 9, 10], "element": [1, 10, 13, 14], "tensor": [1, 10], "p": [1, 3, 9, 10], "bernoulli": [1, 10], "channel": [1, 10], "independ": [1, 8, 10], "everi": [1, 6, 7, 10], "proven": [1, 10], "techniqu": [1, 8, 10], "prevent": [1, 6, 7, 10], "co": [1, 8, 10], "adapt": [1, 3, 9, 10], "neuron": [1, 10], "hidden": [1, 6, 7, 10], "ffn": [1, 6, 7, 10], "exponenti": [1, 8, 10], "rate": [1, 10], "bond": [1, 3, 9, 10], "ratio": [1, 10], "linearli": [1, 10], "init_lr": [1, 10], "max_lr": [1, 10], "afterward": [1, 8, 10], "decreas": [1, 8, 10], "final_lr": [1, 10], "without": [1, 6, 7, 9, 10, 13], "hyperparamet": [1, 4, 6, 7, 9, 10], "side": [1, 3, 9, 10], "nb": [1, 3, 6, 7, 8, 9, 10], "quick": [1, 4, 10], "simpl": [1, 8, 10], "sensibl": [1, 6, 7, 8, 9, 10], "author": [1, 6, 7, 9, 10], "do": [1, 6, 7, 8, 9, 10, 13], "num_it": [1, 6, 7, 10, 12], "search_parameter_level": [1, 6, 7, 10, 12], "dictat": [1, 6, 7, 10], "larger": [1, 3, 6, 7, 8, 9, 10], "pretrin": [1, 10], "pretrain": [1, 6, 7, 9, 10], "carri": [1, 10], "suppli": [1, 3, 6, 7, 8, 9, 10], "previous": [1, 10], "qsartuna": [1, 9, 10], "chempropparametersepoch": [1, 6, 7, 10], "frzn": [1, 10, 12], "pretrained_model": [1, 6, 7, 9, 10, 12], "none": [1, 3, 6, 7, 9, 10, 11, 13, 14, 15], "fine": [1, 10], "tune": [1, 3, 4, 6, 7, 9, 10], "decid": [1, 10], "freez": [1, 10], "transfer": [1, 10], "frozen": [1, 10], "calibr": [1, 4, 9, 10], "isoton": [1, 6, 7, 10], "vennab": [1, 10], "cv": [1, 6, 7, 10], "With": [1, 3, 9, 10], "across": [1, 6, 7, 8, 10, 13], "fals": [1, 3, 6, 7, 8, 9, 10, 13], "obtain": [1, 6, 7, 8, 10], "unbias": [1, 10], "offer": [1, 3, 6, 7, 9, 10], "p0": [1, 6, 7, 10], "vs": [1, 6, 7, 8, 9, 10], "p1": [1, 6, 7, 10], "discord": [1, 6, 7, 10], "type": [1, 3, 6, 7, 8, 9, 10, 13], "calibratedclassifiercvensembl": [1, 10], "calibratedclassifiercvmethod": [1, 10], "n_fold": [1, 6, 7, 10, 12], "whether": [1, 3, 8, 9, 10, 13, 15], "agnost": [1, 6, 7, 10], "interv": [1, 6, 7, 10], "encompass": [1, 10], "aleator": [1, 10], "epistem": [1, 10], "back": [1, 6, 7, 10], "strong": [1, 10], "theoret": [1, 6, 7, 10], "thank": [1, 10], "conform": [1, 10], "mapie_alpha": [1, 6, 7, 10, 12], "05": [1, 6, 7, 8, 10], "01": [1, 6, 7, 10], "99": [1, 6, 7, 10], "see": [3, 6, 7, 8, 9, 10, 13, 14], "gedeck": [3, 9], "et": [3, 8, 9], "qsar": [3, 4, 6, 7, 8, 9], "good": [3, 6, 7, 8, 9], "practic": [3, 9], "fingerprint": [3, 9, 10], "wai": [3, 6, 7, 8, 9], "daylight": [3, 9], "enumer": [3, 6, 7, 9, 10], "custom": [3, 6, 7, 9], "ref": [3, 9, 11], "16": [3, 6, 7, 8, 9], "hash": [3, 6, 7, 9, 10, 11], "style": [3, 6, 7, 8, 9], "implicitli": [3, 9], "largest": [3, 6, 7, 9], "toward": [3, 6, 7, 8, 9], "binari": [3, 6, 7, 9, 10], "extend": [3, 6, 7, 8, 9], "connect": [3, 6, 7, 9], "roger": [3, 9], "circular": [3, 9], "morgan": [3, 9, 10], "algorithm": [3, 4, 8, 9, 10, 11, 12, 13, 14], "invari": [3, 9], "getmorganfingerprintasbitvect": [3, 9], "rdkit": [3, 6, 7, 8, 9, 10], "systemat": [3, 9], "record": [3, 6, 7, 8, 9], "neighborhood": [3, 9, 10], "substructur": [3, 6, 7, 9], "map": [3, 6, 7, 8, 9], "integ": [3, 8, 9, 13, 14], "length": [3, 6, 7, 9], "diamet": [3, 9], "append": [3, 6, 7, 8, 9, 10], "g": [3, 8, 9, 13, 15], "ecfp4": [3, 9], "correspond": [3, 6, 7, 8, 9, 10], "returnrdkit": [3, 6, 7, 9], "bit": [3, 6, 7, 9], "sometim": [3, 6, 7, 8, 9], "bool": [3, 9, 10, 13, 14], "calculate_from_mol": [3, 9], "mol": [3, 6, 7, 8, 9], "numpi": [3, 6, 7, 8, 9, 13, 14], "arrai": [3, 6, 7, 9, 13, 14], "count": [3, 6, 7, 9, 10], "gethashedmorganfingerprint": [3, 9], "appear": [3, 6, 7, 9, 12], "usefeatur": [3, 6, 7, 9, 12], "fcfp": [3, 9], "normal": [3, 6, 7, 8, 9, 10], "ones": [3, 6, 7, 9], "definit": [3, 9, 13], "gobbi": [3, 9], "popping": [3, 9], "biotechnolog": [3, 9], "bioengin": [3, 9], "61": [3, 6, 7, 9], "47": [3, 6, 7, 9], "54": [3, 6, 7, 9], "1998": [3, 6, 7, 9], "lead": [3, 8, 9], "score": [3, 4, 9, 10, 11, 13, 15], "maxpath": [3, 6, 7, 9, 12], "fpsize": [3, 6, 7, 9, 12], "macc": [3, 6, 7, 9], "system": [3, 6, 7, 8, 9], "often": [3, 6, 7, 9], "mdl": [3, 9], "kei": [3, 6, 7, 8, 9, 11, 12], "compani": [3, 9], "keyset": [3, 9], "construct": [3, 9, 12], "optim": [3, 4, 8, 9, 10, 12], "durant": [3, 9], "reoptim": [3, 9], "drug": [3, 9], "discoveri": [3, 9], "166": [3, 6, 7, 9], "2d": [3, 9, 10], "essenti": [3, 8, 9], "answer": [3, 9], "fragment": [3, 9], "question": [3, 9], "explicitli": [3, 6, 7, 8, 9], "matter": [3, 9], "becaus": [3, 6, 7, 8, 9], "address": [3, 9], "specif": [3, 6, 7, 8, 9, 12], "repres": [3, 6, 7, 8, 9], "9": [3, 6, 7, 8, 9], "1049": [3, 9], "distinct": [3, 6, 7, 8, 9, 10], "rdkit_nam": [3, 6, 7, 9, 12], "unscal": [3, 9], "These": [3, 6, 7, 8, 9, 13], "physchem": [3, 6, 7, 9], "caution": [3, 8, 9], "208": [3, 6, 7, 9], "includ": [3, 6, 7, 8, 9], "clogp": [3, 6, 7, 9], "mw": [3, 6, 7, 9], "ring": [3, 8, 9], "rotat": [3, 9], "fraction": [3, 6, 7, 8, 9, 13, 14], "sp3": [3, 9], "kier": [3, 9], "indic": [3, 6, 7, 8, 9, 13, 14], "etc": [3, 6, 7, 8, 9], "tpsa": [3, 6, 7, 9], "slogp": [3, 9], "group": [3, 8, 9, 13, 14], "vsa": [3, 9], "moe": [3, 9], "charg": [3, 9], "www": [3, 9], "org": [3, 6, 7, 9], "doc": [3, 6, 7, 9], "gettingstartedinpython": [3, 9], "html": [3, 6, 7, 8, 9, 10], "whose": [3, 9], "been": [3, 6, 7, 8, 9], "level": [3, 6, 7, 8, 9, 10], "One": [3, 8, 9], "advantag": [3, 9], "interpret": [3, 9], "mean": [3, 6, 7, 8, 9, 10, 13], "physicochem": [3, 9], "intuit": [3, 9], "understood": [3, 9], "option": [3, 4, 8, 9, 10, 12, 13, 14, 15], "jazzy_nam": [3, 6, 7, 9, 12], "jazzy_filt": [3, 6, 7, 9], "jazzi": [3, 9], "hydrat": [3, 9], "energi": [3, 9], "hydrogen": [3, 9], "acceptor": [3, 6, 7, 9], "donor": [3, 6, 7, 9], "found": [3, 6, 7, 9, 11], "doi": [3, 6, 7, 9], "1038": [3, 9], "s41598": [3, 9], "023": [3, 6, 9], "30089": [3, 9], "mmff94": [3, 9], "minimis": [3, 9], "1000da": [3, 9], "compound": [3, 6, 7, 8, 9, 13, 14], "dict": [3, 9, 10, 11, 12], "ndarrai": [3, 9], "z": [3, 9, 13, 15], "peptid": [3, 6, 7, 9, 13, 15], "unfittedsklearnscal": [3, 9], "mol_data": [3, 9], "moldata": [3, 9], "file_path": [3, 9], "smiles_column": [3, 9], "fittedsklearnscal": [3, 9], "alia": [3, 9, 10], "file": [3, 8, 9, 11, 12, 13, 14], "header": [3, 9, 11], "line": [3, 4, 6, 7, 8, 9, 11], "row": [3, 6, 7, 8, 9], "comma": [3, 6, 7, 8, 9], "pre": [3, 8, 9], "inference_paramet": [3, 6, 7, 9], "were": [3, 6, 7, 8, 9], "propos": [3, 9], "sandberg": [3, 9], "proteogen": [3, 9], "amino": [3, 6, 7, 9], "acid": [3, 6, 7, 9], "nmr": [3, 9], "thin": [3, 9], "chromatographi": [3, 9], "tlc": [3, 9], "1021": [3, 6, 7, 9], "jm9700575": [3, 9], "captur": [3, 6, 7, 8, 9], "lipophil": [3, 9], "steric": [3, 9], "bulk": [3, 9], "polariz": [3, 9], "electron": [3, 9], "polar": [3, 9], "electroneg": [3, 9], "heat": [3, 9], "electrophil": [3, 9], "anoth": [3, 6, 7, 9], "through": [3, 6, 7, 9], "_and_": [3, 9], "continu": [3, 6, 7, 9], "learnt": [3, 6, 7, 9], "manner": [3, 6, 7, 9], "intent": [3, 6, 7, 9], "much": [3, 9], "remain": [3, 9, 13], "deriv": [3, 6, 7, 8, 9], "cautiou": [3, 9], "upload": [3, 9], "_all_": [3, 9], "ruder": [3, 9], "io": [3, 7, 9, 10], "index": [3, 6, 7, 8, 9], "auxiliarytask": [3, 9], "aux_weight_pc": [3, 6, 7, 9, 10, 12], "20": [3, 6, 7, 8, 9], "info": [3, 6, 7, 9], "percentag": [3, 9], "wrap": [3, 6, 7, 9], "certain": [3, 6, 7, 8, 9], "rang": [3, 6, 7, 8, 9, 13, 14], "scaleddescriptorparamet": [3, 9], "composit": [3, 6, 7, 9], "concaten": [3, 9], "button": [3, 9], "pleas": [3, 6, 7, 9, 11], "compat": [3, 6, 7, 9], "intro": 4, "background": 4, "json": [4, 6, 7, 9, 10, 12], "command": [4, 6, 7], "interfac": [4, 6, 7, 9, 12, 13], "python": [4, 6, 7, 9, 13], "jupyt": [4, 6, 7], "notebook": [4, 6, 7], "via": [4, 6, 7, 8, 13], "cli": 4, "inspect": [4, 6, 7], "automl": [4, 5], "automat": [4, 6, 7, 8], "ad": [4, 6, 7, 8, 13, 14], "descriptor": [4, 5, 8, 10, 12], "introduct": 4, "translat": [4, 6, 7], "sdf": [4, 6, 7, 9], "deal": [4, 13], "duplic": [4, 9, 10, 13], "dedupl": [4, 6, 7, 9, 11], "experiment": [4, 6, 7, 13, 15], "error": [4, 6, 7], "tutori": 4, "remov": [4, 8, 9, 10, 13, 14], "advanc": [4, 8, 9], "functoinail": 4, "overview": 4, "hpc": 4, "setup": [4, 10], "extract": 4, "walkthough": 4, "pipelin": [4, 6], "date": [4, 6, 9, 11], "calibratedclassifiercvwithva": [4, 6, 7, 10, 12], "mapi": [4, 10, 12], "zscale": [4, 6, 7, 9, 13], "smilesfromfil": [4, 6, 7, 9, 12], "smilesandsideinfofromfil": [4, 6, 7, 9, 12], "compositedescriptor": [4, 6, 7, 9, 12], "stratifi": [4, 6, 7, 13], "scaffoldsplit": [4, 8, 13], "modeldatatransform": [4, 6, 7, 8, 9, 13], "vectorfromcolumn": [4, 6, 7, 9, 13], "keepfirst": [4, 8, 13], "keeplast": [4, 8, 13], "keeprandom": [4, 8, 13], "keepmin": [4, 8, 13], "keepmax": [4, 8, 13], "keepavg": [4, 8, 13], "keepmedian": [4, 6, 7, 8, 13], "keepkeepallnodedupl": 4, "coverag": 4, "subpackag": 5, "submodul": 5, "content": 5, "util": [5, 6, 7, 8, 9, 14, 15], "files_path": [5, 9], "load_json": [5, 9], "builder": 5, "metirc": 5, "model_writ": 5, "visual": [5, 10, 12], "intend": [6, 7, 9], "necessari": [6, 7], "gui": [6, 7], "reinvent": [6, 7], "most": [6, 7, 8], "them": [6, 7, 8, 9, 10], "influenc": [6, 7, 8, 10], "idea": [6, 7, 8], "read": [6, 7, 8, 9], "otherwis": [6, 7, 13], "might": [6, 7, 8, 13], "skip": [6, 7, 8, 9, 11], "astrazeneca": [6, 7], "qptuna_latest": 6, "toi": [6, 7], "chosen": [6, 7], "whole": [6, 7, 8], "less": [6, 7, 8], "minut": [6, 7, 9], "holdout": [6, 7, 8], "readi": [6, 7, 9], "next": [6, 7, 8], "few": [6, 7, 8], "head": [6, 7, 8], "molwt_gt_330": [6, 7], "cc1cc": [6, 7], "nc": [6, 7, 8], "o": [6, 7, 8], "c2cccc": [6, 7], "coc3ccc": [6, 7], "br": [6, 7, 8], "cc3": [6, 7, 8], "c2": [6, 7, 8], "no1": [6, 7], "387": [6, 7], "233": [6, 7], "nc1ccc": [6, 7], "f": [6, 7, 8, 13], "cc1f": [6, 7], "nc1sccc1": [6, 7], "c1nc2ccccc2s1": [6, 7], "4360000000001": [6, 7], "coc": [6, 7], "c1ccccc1nc": [6, 7], "c1cc": [6, 7], "nn1cc1ccccc1": [6, 7], "380": [6, 7], "36000000000007": [6, 7], "ccoc": [6, 7], "sc1nc": [6, 7], "c2ccccc2": [6, 7], "ccc1c": [6, 7], "312": [6, 7], "39400000000006": [6, 7], "ccc": [6, 7, 8], "cc": [6, 7, 8], "c1nn": [6, 7, 8], "cc2ccccc2": [6, 7], "c2ccccc12": [6, 7], "349": [6, 7], "4340000000001": [6, 7], "brc1ccccc1occcoc1cccc2cccnc12": [6, 7], "358": [6, 7], "235": [6, 7], "ccccn1c": [6, 7], "coc2cccc": [6, 7], "oc": [6, 7], "nc2ccccc21": [6, 7], "310": [6, 7], "39700000000005": [6, 7], "ccoc1cccc": [6, 7], "c2sc3nc": [6, 7], "c4ccc": [6, 7], "cc4": [6, 7], "ccc3c2n": [6, 7], "c1": [6, 7, 8], "407": [6, 7], "4700000000001": [6, 7], "coc1ccc": [6, 7], "nc2ccc": [6, 7], "cc2": [6, 7], "c2ccc": [6, 7], "cc1oc": [6, 7], "454": [6, 7], "54800000000023": [6, 7], "sy": [6, 7, 8], "sklearn": [6, 7, 12], "typic": [6, 7, 8], "test_dataset_fil": [6, 7, 9], "random_se": [6, 7, 10], "42": [6, 7, 8, 13, 14], "seed": [6, 7, 8, 9, 13, 14], "reproduc": [6, 7, 13, 15], "basic": [6, 7, 9, 10], "importlib": [6, 7], "reload": [6, 7], "basicconfig": [6, 7], "getlogg": [6, 7], "disabl": [6, 7, 12], "np": [6, 7, 8], "seterr": [6, 7], "ignor": [6, 7], "warn": [6, 7], "filterwarn": [6, 7], "categori": [6, 7], "futurewarn": [6, 7], "runtimewarn": [6, 7], "tqdm": [6, 7], "functool": [6, 7], "partialmethod": [6, 7], "__init__": [6, 7, 10], "flood": [6, 7], "decpreci": [6, 7], "simplefilt": [6, 7], "arg": [6, 7, 9, 10], "kwarg": [6, 7, 10], "stderr": [6, 7], "render": [6, 7, 8], "red": [6, 7], "2024": [6, 7], "08": [6, 7], "23": [6, 7, 8], "51": [6, 7], "03": [6, 7], "367": [6, 7], "memori": [6, 7, 8, 9, 11], "440": [6, 7], "study_name_0": [6, 7], "760": [6, 7], "finish": [6, 7], "3594": [6, 7], "2228073972638": [6, 7], "39": [6, 7, 8], "algorithm_nam": [6, 7, 12], "randomforestregressor_algorithm_hash": [6, 7], "f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "max_features__f1ac01e1bba332215ccbd0c29c9ac3c3": [6, 7], "lt": [6, 7, 8], "randomforestmaxfeatur": [6, 7, 10], "gt": [6, 7, 8], "34": [6, 7, 8], "915": [6, 7], "5029": [6, 7], "734616310275": [6, 7], "svr_algorithm_hash": [6, 7], "ea7ccc7ef4a9329af0d4e39eb6184933": [6, 7], "gamma__ea7ccc7ef4a9329af0d4e39eb6184933": [6, 7], "039054412752107935": [6, 7], "c__ea7ccc7ef4a9329af0d4e39eb6184933": [6, 7], "1242780840717016e": [6, 7], "07": [6, 7], "195": 6, "4242": [6, 7], "092751193529": [6, 7], "341": [6, 7], "3393": [6, 7], "577488426015": [6, 7], "ridge_algorithm_hash": [6, 7], "cfa1990d5153c8812982f034d788d7e": [6, 7], "alpha__cfa1990d5153c8812982f034d788d7e": [6, 7], "06877704223043679": [6, 7], "506": 6, "427": [6, 7], "45250420148204": [6, 7], "lasso_algorithm_hash": [6, 7], "5457f609662e44f04dcc9423066d2f58": [6, 7], "alpha__5457f609662e44f04dcc9423066d2f58": [6, 7], "7896547008552977": [6, 7], "577": [6, 7], "3387": [6, 7], "245629616474": [6, 7], "plsregression_algorithm_hash": [6, 7], "9f2f76e479633c0bf18cf2912fed9eda": [6, 7], "n_components__9f2f76e479633c0bf18cf2912fed9eda": [6, 7], "646": [6, 7], "734620250011": [6, 7], "3661540064603184": [6, 7], "1799882524170321": [6, 7], "711": 6, "7": [6, 7, 8, 10], "9650": [6, 7], "026568221794": [6, 7], "kneighborsregressor_algorithm_hash": [6, 7], "1709d2c39117ae29f6c9debe7241287b": [6, 7], "metric__1709d2c39117ae29f6c9debe7241287b": [6, 7], "kneighborsmetr": [6, 7, 10], "n_neighbors__1709d2c39117ae29f6c9debe7241287b": [6, 7], "weights__1709d2c39117ae29f6c9debe7241287b": [6, 7], "kneighborsweight": [6, 7, 10], "uniform": [6, 7, 10], "727": [6, 7], "5437": [6, 7], "151635569594": [6, 7], "05083825348819038": [6, 7], "858": [6, 7], "2669": [6, 7], "8534551928174": 6, "876": 6, "4341": [6, 7], "586120152291": [6, 7], "7921825998469865": [6, 7], "098": [6, 7], "11": [6, 7, 8], "5514": [6, 7], "404088878843": 6, "210": 6, "12": [6, 7, 8], "5431": [6, 7], "634989239215": [6, 7], "228": 6, "13": [6, 7, 8], "3530": [6, 7], "5496618991288": [6, 7], "245": [6, 7], "14": [6, 7, 8], "3497": [6, 7], "6833185436312": [6, 7], "263": [6, 7], "15": [6, 7, 8], "4382": [6, 7], "16208862162": [6, 7], "279": [6, 7], "734620031822": [6, 7], "002825619931800395": [6, 7], "309885135051862e": [6, 7], "09": [6, 7], "296": [6, 7], "17": [6, 7, 8], "679": [6, 7], "3109044887755": [6, 7], "16827992999009767": [6, 7], "370": [6, 7], "18": [6, 7, 8], "2550": [6, 7], "114129318373": [6, 7], "386": [6, 7], "19": [6, 7, 8], "4847": [6, 7], "085792360169": [6, 7], "735431606118867": [6, 7], "404": 6, "268760278916": [6, 7], "0014840820994557746": [6, 7], "04671166881768783": [6, 7], "518": 6, "21": [6, 7, 8], "4783": [6, 7], "047015479679": 6, "536": 6, "22": [6, 7, 8], "3905": [6, 7], "0064899852296": [6, 7], "604": 6, "4030": [6, 7], "4577379164707": [6, 7], "672": 6, "24": [6, 7, 8], "4681": [6, 7], "602145939593": [6, 7], "690": [6, 7], "25": [6, 7, 8], "4398": [6, 7], "544034028325": [6, 7], "6452011213193165": [6, 7], "756": 6, "26": [6, 7, 8], "4454": [6, 7], "143979828406": 6, "27": [6, 7, 8], "765": 6, "28": [6, 7, 8], "833": 6, "29": [6, 7], "4397": [6, 7], "330360587512": [6, 7], "838": 6, "880": [6, 7], "31": [6, 7], "2602": [6, 7], "7561184287083": [6, 7], "897": 6, "5267": [6, 7], "388279961089": [6, 7], "2015560027548533": [6, 7], "06": [6, 7], "014": [6, 7], "33": [6, 7], "4863": [6, 7], "5817607510535": [6, 7], "032": [6, 7], "388": [6, 7], "96473594016675": [6, 7], "5528259214839937": [6, 7], "076": 6, "35": [6, 7], "5539": [6, 7], "698232987626": [6, 7], "6400992020612235": [6, 7], "107": [6, 7], "36": [6, 7], "5180": [6, 7], "5533034102455": [6, 7], "8968910439566395": [6, 7], "125": 6, "37": [6, 7], "4989": [6, 7], "929984864281": [6, 7], "04458440839692226": [6, 7], "492108041427977": [6, 7], "130": 6, "38": [6, 7, 8], "173": [6, 7], "6528": [6, 7], "215066535042": [6, 7], "16700143339733753": [6, 7], "237": [6, 7], "40": [6, 7, 8], "4168": [6, 7], "7955967552625": 6, "292": [6, 7], "41": [6, 7], "6177": [6, 7], "060727800014": [6, 7], "3963": [6, 7], "9069546583414": [6, 7], "378": [6, 7], "43": [6, 7], "6805334166565": [6, 7], "013186009009851564": [6, 7], "001008958590140135": [6, 7], "421": [6, 7], "44": [6, 7], "9300": [6, 7], "86840721566": [6, 7], "441": 6, "45": [6, 7, 8], "83": [6, 7], "87968210939489": [6, 7], "382674443425525e": [6, 7], "447": 6, "46": [6, 7], "460": [6, 7], "48": [6, 7], "525": 6, "49": [6, 7], "3660": [6, 7], "9359502556003": 6, "550": 6, "688": [6, 7], "5244070398325": [6, 7], "5267860995545326": [6, 7], "572": [6, 7], "6494438072099": [6, 7], "8458809314722497": [6, 7], "597": 6, "52": [6, 7], "691": [6, 7], "1197058420935": [6, 7], "9167866889210807": [6, 7], "622": [6, 7], "53": [6, 7], "3111710449325": [6, 7], "945685900574672": [6, 7], "9665592812149": [6, 7], "8936837761725833": [6, 7], "55": [6, 7], "4682747008223": [6, 7], "5183865279530455": [6, 7], "695": [6, 7], "56": [6, 7], "687": [6, 7], "5230947231512": [6, 7], "3771771681361766": [6, 7], "718": [6, 7], "57": [6, 7], "4503442069594": [6, 7], "3663259819415374": [6, 7], "743": [6, 7], "58": [6, 7], "686": [6, 7], "9553733616618": [6, 7], "2925652230875628": [6, 7], "766": [6, 7], "59": [6, 7], "2038330506566": [6, 7], "3962903248948568": [6, 7], "790": 6, "60": [6, 7], "377": [6, 7], "25988028857313": [6, 7], "45237513161879": [6, 7], "814": [6, 7], "379": [6, 7], "8933285317637": [6, 7], "4741161933311207": [6, 7], "62": [6, 7], "374": [6, 7], "50897467366013": [6, 7], "4290962207409417": [6, 7], "864": [6, 7], "63": [6, 7, 8], "376": [6, 7], "5588572940058": [6, 7], "4464295711264585": [6, 7], "890": 6, "64": [6, 7], "237448916406": [6, 7], "4687500034684213": [6, 7], "914": [6, 7], "65": [6, 7], "375": [6, 7], "7474776359051": [6, 7], "4395650011783436": [6, 7], "941": 6, "66": [6, 7], "362": [6, 7], "2834906299732": [6, 7], "3326755354190032": [6, 7], "966": [6, 7], "67": [6, 7], "357": [6, 7], "3474880122588": [6, 7], "2887212943233457": [6, 7], "993": 6, "68": [6, 7], "354": [6, 7], "279045046449": [6, 7], "2577677164664005": [6, 7], "031": 6, "69": [6, 7], "347": [6, 7], "36894395697703": [6, 7], "1672928587680225": [6, 7], "069": [6, 7], "70": [6, 7], "345": [6, 7], "17697390093394": [6, 7], "1242367255308854": [6, 7], "095": 6, "71": [6, 7], "74610809299037": [6, 7], "1728352983905301": [6, 7], "133": [6, 7], "72": [6, 7], "23464281634324": [6, 7], "1265380781508565": [6, 7], "171": 6, "73": [6, 7], "344": [6, 7], "6848312222365": [6, 7], "0829896313820404": [6, 7], "74": [6, 7, 8], "9111966504334": [6, 7], "1070414661080543": [6, 7], "75": [6, 7], "70116419828565": [6, 7], "0875643695329498": [6, 7], "271": [6, 7], "76": [6, 7], "62647974688133": [6, 7], "0716281620790837": [6, 7], "298": 6, "77": [6, 7], "6759429204596": [6, 7], "0456289319914898": [6, 7], "324": 6, "78": [6, 7], "343": [6, 7], "58131497761616": [6, 7], "0010195360522613": [6, 7], "351": 6, "79": [6, 7], "342": [6, 7], "7290581014813": [6, 7], "9073210715005748": [6, 7], "80": [6, 7, 8], "67866114080107": [6, 7], "9166305667100072": [6, 7], "402": 6, "81": [6, 7], "6440308445311": [6, 7], "9248722692093634": [6, 7], "430": [6, 7], "82": [6, 7], "02085648448934": [6, 7], "8776928646870886": [6, 7], "457": [6, 7], "1662266300702": [6, 7], "867592364677856": [6, 7], "484": [6, 7], "84": [6, 7], "30158716569775": [6, 7], "8599491178327108": [6, 7], "523": 6, "85": [6, 7, 9], "2803074848341": [6, 7], "8396948389352923": [6, 7], "563": 6, "86": [6, 7], "28301101884045": [6, 7], "8396651775801683": [6, 7], "589": [6, 7], "87": [6, 7], "6781906268143": [6, 7], "8356021935129933": [6, 7], "617": 6, "88": [6, 7], "0405418264898": [6, 7], "7430046191126949": [6, 7], "645": [6, 7], "89": [6, 7], "77203208258476": [6, 7], "9015965341429055": [6, 7], "684": 6, "90": [6, 7], "363": [6, 7], "1622720320929": [6, 7], "6746575663752555": [6, 7], "712": 6, "91": [6, 7], "7403796626193": [6, 7], "9057564666836629": [6, 7], "740": 6, "92": [6, 7], "63579667712696": [6, 7], "9332275205203372": [6, 7], "767": [6, 7], "93": [6, 7, 8], "6886425884964": [6, 7], "9433063264508291": [6, 7], "795": [6, 7], "94": [6, 7], "9341048659705": [6, 7], "884739221967487": [6, 7], "823": 6, "95": [6, 7, 8], "63507445779743": [6, 7], "9381000493689634": [6, 7], "851": [6, 7], "96": [6, 7], "06021011302374": [6, 7], "963138023068903": [6, 7], "879": 6, "97": [6, 7], "9990546212019": [6, 7], "9601651093867907": [6, 7], "910": 6, "98": [6, 7], "3821": [6, 7], "2267845437514": [6, 7], "938": 6, "356": [6, 7], "6786067133016": [6, 7], "721603508336166": [6, 7], "seaborn": [6, 7, 8], "sn": [6, 7, 8], "set_them": [6, 7], "darkgrid": [6, 7], "default_reg_scor": [6, 7], "ax": [6, 7, 8], "scatterplot": [6, 7], "trials_datafram": [6, 7], "xlabel": [6, 7, 8], "ylabel": [6, 7, 8], "ojbect": [6, 7], "interest": [6, 7, 8], "neg_mean_squared_error": [6, 7, 10], "highlight": [6, 7], "color": [6, 7, 8], "cv_test": [6, 7], "user_attrs_test_scor": [6, 7], "lambda": [6, 7, 13], "item": [6, 7, 11], "idx": [6, 7, 8], "hue": [6, 7], "palett": [6, 7], "set1": [6, 7], "buildconfig_as_dict": [6, 7], "serial": [6, 7], "response_typ": [6, 7, 8, 9], "deduplication_strategi": [6, 7, 8, 9], "split_strategi": [6, 7, 8, 9], "nosplit": [6, 7, 13], "save_intermediate_fil": [6, 7, 9], "log_transform": [6, 7, 8, 9], "log_transform_bas": [6, 7, 8, 9], "null": [6, 7], "log_transform_neg": [6, 7, 8, 9], "log_transform_unit_convers": [6, 7, 8, 9], "probabilistic_threshold_represent": [6, 7, 8, 9], "probabilistic_threshold_representation_threshold": [6, 7, 8, 9], "probabilistic_threshold_representation_std": [6, 7, 8, 9], "shuffl": [6, 7, 10, 12, 13, 14], "best_trial": [6, 7, 10, 12], "best_valu": [6, 7, 10, 12], "tracking_rest_endpoint": [6, 7, 10], "best_build": [6, 7], "rb": [6, 7], "predict_from_smil": [6, 7, 9], "cc1": [6, 7, 8], "43103985": [6, 7], "177": [6, 7], "99850936": [6, 7], "panda": [6, 7, 8], "pd": [6, 7, 8], "df": [6, 7, 13, 14], "read_csv": [6, 7], "matplotlib": [6, 7, 8], "pyplot": [6, 7, 8], "plt": [6, 7, 8], "scatter": [6, 7], "lim": [6, 7], "diagon": [6, 7], "r2_score": [6, 7], "mean_squared_error": [6, 7], "mean_absolute_error": [6, 7], "y_true": [6, 7, 9, 12], "y_pred": [6, 7, 9, 12], "rmse": [6, 7], "mae": [6, 7], "absolut": [6, 7], "8566354978126369": [6, 7], "204909888075044": [6, 7], "298453946973815": [6, 7], "again": [6, 7], "hopefulli": [6, 7, 8], "littl": [6, 7], "better": [6, 7, 8, 9, 13], "send": [6, 7], "strategi": [6, 7, 9], "current": [6, 7, 9, 11], "observ": [6, 7, 8], "last": [6, 7, 8, 13], "alreadi": [6, 7, 8, 9, 11], "sort": [6, 7, 8, 13, 14], "oldest": [6, 7, 8, 13, 14], "newest": [6, 7, 8, 9, 13, 14], "end": [6, 7, 8, 13, 14], "extern": [6, 7], "tool": [6, 7], "excel": [6, 7], "unballanc": [6, 7], "come": [6, 7, 8], "measur": [6, 7, 8], "fact": [6, 7], "disregard": [6, 7], "stereochemistri": [6, 7, 8, 9], "sever": [6, 7], "median": [6, 7, 8, 13], "factor": [6, 7, 8], "replic": [6, 7, 8], "robust": [6, 7, 8], "outlier": [6, 7, 8], "acorss": [6, 7], "trust": [6, 7], "kept": [6, 7], "splitter": [6, 7, 8, 9, 11], "track_to_mlflow": [6, 7, 10], "my_study_stratified_split": [6, 7], "165": 6, "207": [6, 7], "303": [6, 7], "261": [6, 7], "95269731189177": 6, "586114272804535": 6, "439": [6, 7], "3455": 6, "51800700426": 6, "1856": [6, 7], "4459752935309": [6, 7], "477": 6, "1235": 6, "3128104073717": 6, "5613443439636077": 6, "495": [6, 7], "3949": [6, 7], "4997740833423": [6, 7], "259060787354118": 6, "06151214721649829": 6, "560": [6, 7], "3258": 6, "3324669641333": 6, "580": 6, "281": [6, 7], "6313215642597": 6, "821793264230599": 6, "2756": [6, 7], "046839500092": [6, 7], "615": 6, "2720": [6, 7], "793752592223": [6, 7], "631": 6, "4702695112846": 6, "11028790699101433": 6, "001202131310186554": 6, "710": [6, 7], "2695": [6, 7], "2514836330784": [6, 7], "731": 6, "1688": 6, "7128683041683": 6, "1044548905141272": 6, "746": 6, "2658": 6, "13214897931": 6, "813": [6, 7], "1948": 6, "0314425327626": 6, "831": [6, 7], "1332": 6, "6840893052315": 6, "8033739312636219": 6, "848": [6, 7], "7730407032913": 6, "978415570131035": 6, "380966239365776": 6, "5380266414879525e": 6, "882": [6, 7], "39037036873405": 6, "13170545295199e": 6, "898": [6, 7], "347685324232952": 6, "782238919549724e": 6, "902": 6, "920": [6, 7], "4997657609406": 6, "004091119479264935": 6, "7670039814136804e": 6, "939": [6, 7], "4997709689146": 6, "020406357580717727": 6, "826432657033465e": 6, "956": [6, 7], "3942": 6, "5257596151837": 6, "00017594354214526438": 6, "3221158157501884": 6, "972": [6, 7], "1775": [6, 7], "55204856041": [6, 7], "989": [6, 7], "9426790782418": 6, "28574770987033293": 6, "006": [6, 7], "1254": 6, "9841129079468": 6, "0742769549097546": 6, "073": [6, 7], "090": 6, "1249": 6, "5519579928275": 6, "26166764283582": 6, "122": [6, 7], "4997740490603": 6, "1551243322855379": 6, "869530660905885e": 6, "141": 6, "613671789797623": 6, "18743805815241568": 6, "160": 6, "4997740057183": 6, "0006647090582038176": 6, "720240531591189e": 6, "188": [6, 7], "236": [6, 7], "75701162742902": 6, "15225101226627": 6, "2726": [6, 7], "0476769808097": [6, 7], "225": [6, 7], "98897579737036": 6, "3434026346873007e": 6, "3596": 6, "741420193717": 6, "311": 6, "1242": 6, "8479265462504": 6, "3806781553300398": 6, "148057819462277": 6, "1220747475846438e": 6, "410": [6, 7], "2906": 6, "3484169581293": 6, "474": [6, 7], "2182": 6, "2854817163393": 6, "494": 6, "1682": 6, "7555601297397": 6, "7692026965764096": 6, "527": 6, "1885": 6, "3761105075926": 6, "8499325582942474": 6, "7934477837753": 6, "26437658363366806": 6, "399729524954495": 6, "4996545768313": 6, "03999295021459913": 6, "487454158254508e": 6, "648": [6, 7], "2279": 6, "772434063323": 6, "668": 6, "1686": 6, "497519225056": 6, "9798152426640634": 6, "700": [6, 7], "1734": 6, "418175645478": 6, "1638039970995402": 6, "720": [6, 7, 9], "2641": [6, 7], "7637473751115": [6, 7], "726": [6, 7], "732": 6, "751": 6, "4997740833387": 6, "6381698921109232": 6, "0041111342254524e": 6, "774": [6, 7], "8133725349282": 6, "9498873960159637": 6, "797": [6, 7], "7735399551454": 6, "9780612881075026": 6, "822": 6, "8160071680375": 6, "9480302946593064": 6, "843": 6, "75592491031455": 6, "9905788379110985": 6, "866": [6, 7], "7455012578744": 6, "998003047330558": 6, "891": 6, "265": [6, 7], "5420569489236": 6, "731766992009085": 6, "925": 6, "268": [6, 7], "5837896907764": 6, "8088769537936915": 6, "961": [6, 7], "270": [6, 7], "2819638853734": 6, "8381998920032558": 6, "986": 6, "5370756433875": 6, "8423274630826914": 6, "009": [6, 7], "6648549453774": 6, "8105870658571404": 6, "034": 6, "267": [6, 7], "33331573420924": 6, "7812473578529109": 6, "058": 6, "54266068640237": 6, "7865813805833881": 6, "084": [6, 7], "264": [6, 7], "7374685857255": 6, "7033718535925544": 6, "108": [6, 7], "259": 6, "06013832754854": 6, "530230339296878": 6, "134": [6, 7], "254": 6, "45098385749847": 6, "4449038663990794": 6, "252": [6, 7], "46933447499055": 6, "4118163766482357": 6, "211": [6, 7], "400610865412": 6, "3751234485145145": 6, "248": [6, 7], "55142126098917": 6, "3782312158054713": 6, "285": [6, 7], "249": [6, 7], "939720762774": 6, "3654947227249123": 6, "51859203038146": 6, "3389300472278876": 6, "247": [6, 7], "97854622218964": 6, "3291551817821483": 6, "82875013698148": 6, "344470263084507": 6, "437": 6, "89404238932664": 6, "2945916241697062": 6, "475": 6, "88444574036467": 6, "294423585518049": 6, "512": [6, 7], "242": [6, 7], "7250858383981": 6, "2374026497690556": 6, "241": [6, 7], "38995410978927": 6, "2216216823389983": 6, "588": [6, 7], "75773569374167": 6, "1685257395531474": 6, "627": [6, 7], "238": [6, 7], "9591618086847": 6, "1871718734668695": 6, "667": 6, "16615158396067": 6, "1749827907502346": 6, "705": [6, 7], "87253431766433": 6, "1541307320952652": 6, "744": [6, 7], "234": [6, 7], "54432497574712": 6, "1118826871769896": 6, "783": [6, 7], "500370208023": 6, "1109739335876776": 6, "820": 6, "227": [6, 7], "05479722761888": 6, "9557242358902104": 6, "859": [6, 7], "226": 6, "75744778941316": 6, "9492111894491083": 6, "900": [6, 7], "23291544469544": 6, "9371731029417466": 6, "940": [6, 7], "8608948363877": 6, "9283493142218042": 6, "981": [6, 7], "223": [6, 7], "79470023518647": 6, "8924342905874942": 6, "021": [6, 7, 8], "04998656317707": 6, "914666812200899": 6, "061": 6, "3255192874075": 6, "8835546302939554": 6, "099": [6, 7], "224": [6, 7], "5251215421697": 6, "9055752025758994": 6, "140": [6, 7], "49998736816636": 6, "9051359167587669": 6, "180": [6, 7], "40892455090952": 6, "9035104089361927": 6, "1896344823456": 6, "9170686489009984": 6, "217": 6, "03166841852928": 6, "6196471760805207": 6, "289": [6, 7], "15921264908027": 6, "6137087588616705": 6, "330": [6, 8], "216": [6, 7], "30437532378687": 6, "6380025600331409": 6, "372": [6, 7], "215": [6, 7], "71630507323695": 6, "663588879747517": 6, "411": [6, 7], "1690838497103": 6, "641298655189503": 6, "450": 6, "79332895242592": 6, "654362351183699": 6, "491": [6, 7], "737398967865": 6, "6605844367915987": 6, "By": [6, 7, 8], "roc_auc": [6, 7, 10], "stabl": [6, 7, 9], "model_evalu": [6, 7], "amongst": [6, 7], "regression_scor": [6, 7], "classification_scor": [6, 7], "explained_vari": [6, 7, 10], "max_error": [6, 7, 10], "neg_mean_absolute_error": [6, 7, 10], "neg_median_absolute_error": [6, 7, 10], "average_precis": [6, 7, 10], "balanced_accuraci": [6, 7, 10], "f1": [6, 7, 10], "f1_macro": [6, 7, 10], "f1_micro": [6, 7, 10], "f1_weight": [6, 7, 10], "jaccard": [6, 7, 10], "jaccard_macro": [6, 7, 10], "jaccard_micro": [6, 7, 10], "jaccard_weight": [6, 7, 10], "neg_brier_scor": [6, 7, 10], "precis": [6, 7, 8, 10], "precision_macro": [6, 7, 10], "precision_micro": [6, 7, 10], "precision_weight": [6, 7, 10], "recal": [6, 7, 10], "recall_macro": [6, 7, 10], "recall_micro": [6, 7, 10], "recall_weight": [6, 7, 10], "auc_pr_cal": [6, 7, 9, 10], "bedroc": [6, 7, 9, 10], "concordance_index": [6, 7, 9, 10], "my_study_r2": [6, 7], "590": 6, "01117186866515977": [6, 7], "657": [6, 7], "08689402230378156": [6, 7], "12553701248394863": [6, 7], "141096648805748": [6, 7], "4893466963980463e": [6, 7], "922": 6, "3039309544203818": [6, 7], "936": 6, "20182749628697164": [6, 7], "957": [6, 7], "8187194367176578": [6, 7], "979": [6, 7], "4647239019719945": [6, 7], "6574750183038587": [6, 7], "8614818478547979": [6, 7], "3974313630683448": [6, 7], "086": [6, 7], "12769795082909816": 6, "127": [6, 7], "8639946428338224": [6, 7], "2391884918766034": [6, 7], "157": [6, 7], "12553701248377633": [6, 7], "00044396482429275296": [6, 7], "3831436879125245e": [6, 7], "186": [6, 7], "12553700871203702": [6, 7], "00028965395242758657": [6, 7], "99928292425642e": [6, 7], "202": [6, 7], "2935582042429075": [6, 7], "219": [6, 7], "18476333152695587": [6, 7], "8190707459213998": [6, 7], "4060379177903557": [6, 7], "301": [6, 7], "12206148974315863": [6, 7], "318": [6, 7], "3105263811279067": [6, 7], "344271094811757": [6, 7], "336": [6, 7], "3562469062424869": [6, 7], "670604991178476": [6, 7], "401": [6, 7], "045959695906983344": [6, 7], "432": 6, "8583939656024446": [6, 7], "5158832554303112": [6, 7], "448": 6, "3062574078515544": [6, 7], "479": 6, "11657354998283716": [6, 7], "0009327650919528738": [6, 7], "062479210472502": [6, 7], "483": 6, "502": 6, "8498478905829554": [6, 7], "1366172066709432": [6, 7], "602": [6, 7], "13519830637607919": [6, 7], "92901911959232": [6, 7], "999026012594694": [6, 7], "621": [6, 7], "8198078293055633": [6, 7], "5888977841391714": [6, 7], "640": 6, "8201573964824842": [6, 7], "19435298754153707": [6, 7], "706": [6, 7], "04595969590698312": 6, "736": [6, 7], "6285506249643193": [6, 7], "35441495011256785": [6, 7], "803": [6, 7], "11934070343348317": [6, 7], "4374125584543907": [6, 7], "2457809516380005": [6, 7], "852": 6, "3625576518621392": [6, 7], "6459129458824919": [6, 7], "871": [6, 7], "36175556871883746": [6, 7], "8179058888285398": [6, 7], "896": 6, "8202473217121523": [6, 7], "0920052840435055": [6, 7], "913": [6, 7], "3672927879319306": [6, 7], "8677032984759461": [6, 7], "918": 6, "40076792599874356": [6, 7], "2865764368847064": [6, 7], "996": 6, "26560316846701765": [6, 7], "064": [6, 7], "41215254857081174": [6, 7], "221": [6, 7], "004614143721600701": 6, "240": 6, "27282533524183633": [6, 7], "322": 6, "10220127407364972": 6, "30323404130582854": [6, 7], "3044553805553568": [6, 7], "6437201185807124": [6, 7], "382": 6, "41502276709562": [6, 7], "10978379088847677": [6, 7], "36160209098547913": [6, 7], "022707289534838138": [6, 7], "423": 6, "2916101445983833": [6, 7], "kljk345": [6, 7], "pypoetri": [6, 7], "virtualenv": [6, 7], "_qsktrft": 6, "py3": [6, 7], "lib": [6, 7], "python3": [6, 7], "site": [6, 7], "linear_model": [6, 7], "_coordinate_desc": [6, 7], "678": [6, 7], "convergencewarn": [6, 7], "did": [6, 7], "regularis": [6, 7], "dualiti": [6, 7], "gap": [6, 7], "936e": [6, 7], "02": [6, 7], "toler": [6, 7], "782e": [6, 7], "cd_fast": [6, 7], "enet_coordinate_desc": [6, 7], "434e": [6, 7], "977e": [6, 7], "496": 6, "8609413020928532": [6, 7], "04987590926279814": [6, 7], "794e": [6, 7], "830e": [6, 7], "906e": [6, 7], "578e": [6, 7], "8610289662757457": [6, 7], "019211413400468974": [6, 7], "754e": [6, 7], "843e": [6, 7], "507e": [6, 7], "8610070549049179": [6, 7], "018492644772509947": [6, 7], "840e": [6, 7], "924e": [6, 7], "513e": [6, 7], "754": [6, 7], "8569771623635769": [6, 7], "008783442408928633": [6, 7], "243e": [6, 7], "014e": [6, 7], "825": 6, "8624781673814641": [6, 7], "05782221001517797": [6, 7], "113e": [6, 7], "935e": [6, 7], "122e": [6, 7], "8618589507037001": [6, 7], "02487072255316275": [6, 7], "960": [6, 7], "864754359721037": [6, 7], "2079910754941946": [6, 7], "998": [6, 7], "8622236413326235": [6, 7], "333215560931422": [6, 7], "861832165638517": [6, 7], "3628098560209365": [6, 7], "072": 6, "8620108533993581": [6, 7], "34240779695521706": [6, 7], "120": [6, 7], "8638540565650902": [6, 7], "26493714991266293": [6, 7], "8629799500771645": [6, 7], "30596394512914815": [6, 7], "8621408609583922": [6, 7], "33648829357762355": [6, 7], "8638132124078156": [6, 7], "2679814646317183": [6, 7], "319": [6, 7], "863983758876634": [6, 7], "24062119162159595": [6, 7], "8627356047945115": [6, 7], "3141728910335158": [6, 7], "8639203054085788": [6, 7], "23391390640786494": [6, 7], "8570103863991635": [6, 7], "6124885145996103": [6, 7], "532": 6, "8647961976727571": [6, 7], "2059976546070975": [6, 7], "591": 6, "8648312544921793": [6, 7], "20266060662750784": [6, 7], "653": [6, 7], "8648431452862716": [6, 7], "20027647978240445": [6, 7], "715": 6, "8648491459660418": [6, 7], "1968919999787333": [6, 7], "778": 6, "8650873115156988": [6, 7], "174598921162764": [6, 7], "855": 6, "8650350577921149": [6, 7], "16468002989641095": [6, 7], "928": 6, "8649412283687147": [6, 7], "1606717091615047": [6, 7], "986e": [6, 7], "015": [6, 7], "8649537211609554": [6, 7], "14694925097689848": [6, 7], "8649734575435447": [6, 7], "147612713300643": [6, 7], "446e": [6, 7], "175": [6, 7], "8648761002838515": [6, 7], "14440434705706803": [6, 7], "398e": [6, 7], "251": [6, 7], "8639826593122782": [6, 7], "1265357179513065": [6, 7], "690e": [6, 7], "328": [6, 7], "864435565531768": [6, 7], "1374245525868926": [6, 7], "366": [6, 7], "8590221951825531": [6, 7], "49890830155012533": [6, 7], "8649098880804443": [6, 7], "1573428812070292": [6, 7], "405e": [6, 7], "520": 6, "864536410656637": [6, 7], "13886104722511608": [6, 7], "561": [6, 7], "8597401050431873": [6, 7], "47746341180045787": [6, 7], "600": 6, "8537465461603838": [6, 7], "050e": [6, 7], "8642643827090003": [6, 7], "13446778921611002": [6, 7], "175e": [6, 7], "8641621818665252": [6, 7], "1286796719653316": [6, 7], "854": [6, 7], "864182755916388": [6, 7], "13303218726548235": [6, 7], "1255357440899417": [6, 7], "021711452917433944": [6, 7], "559714273835951e": [6, 7], "937": [6, 7], "8604596648091501": [6, 7], "43644874418279245": [6, 7], "463e": [6, 7], "8635689909135862": [6, 7], "10940922083495383": [6, 7], "078": 6, "8648544336551733": [6, 7], "1912756875742137": [6, 7], "142": 6, "8648496595672595": [6, 7], "19628449928540487": [6, 7], "170": [6, 7], "8452625121122099": [6, 7], "4324661283995224": [6, 7], "198": [6, 7], "8378670635846416": [6, 7], "839206620815206": [6, 7], "002e": [6, 7], "082e": [6, 7], "286": 6, "8649365368153895": [6, 7], "07270781179126021": [6, 7], "373": 6, "8875676754699953": [6, 7], "0006995169897945908": [6, 7], "618e": [6, 7], "234e": [6, 7], "586e": [6, 7], "465": [6, 7], "8730555131061773": [6, 7], "0018186269840273495": [6, 7], "509": [6, 7], "12553508835019533": [6, 7], "04867556317570456": [6, 7], "0011658455138452": [6, 7], "177e": [6, 7], "284e": [6, 7], "016e": [6, 7], "599": [6, 7], "8586292788613132": [6, 7], "005078762921098462": [6, 7], "anyalgorithm": [6, 7], "__args__": [6, 7], "consider": [6, 7, 8], "modif": [6, 7, 11, 13], "establish": [6, 7], "rf": [6, 7], "account": [6, 7, 8, 9], "though": [6, 7], "treat": [6, 7, 8], "pdf": [6, 7, 10], "denot": [6, 7, 13, 14], "determinist": [6, 7, 8], "quantiti": [6, 7], "tradit": [6, 7, 8], "discret": [6, 7], "discretis": [6, 7, 13, 15], "bioactiv": [6, 7, 8], "integr": [6, 7], "afford": [6, 7, 8], "liklihood": [6, 7], "membership": [6, 7, 8], "iopscienc": [6, 7], "iop": [6, 7], "articl": [6, 7, 8], "3847": [6, 7], "1538": [6, 7], "3881": [6, 7], "aaf101": [6, 7], "pxc50": [6, 7, 8], "p24863": [6, 7], "enabl": [6, 7, 8], "alwai": [6, 7, 8, 9], "724": 6, "0811707042483984": 6, "prfclassifier_algorithm_hash": [6, 7], "efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "max_depth__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "n_estimators__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "max_features__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "prfclassifiermaxfeatur": [6, 7, 10], "min_py_sum_leaf__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "use_py_gini__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "use_py_leafs__efe0ba9870529a6cde0dd3ad22447cbb": [6, 7], "07385123845467624": 6, "08693605025593726": 6, "782": [6, 7], "07306390786920249": 6, "07213945175504542": 6, "055757209329220986": 6, "039": 6, "06330901806749258": 6, "811": 6, "07619841217081819": 6, "061815145745506755": 6, "091": 6, "07429343450473058": 6, "06446287784137206": 6, "574": 6, "06120344765133655": 6, "745": 6, "0686143607166384": 6, "199": 6, "05295650394252901": 6, "best_built": [6, 7], "demonstr": [6, 7, 8], "purpos": [6, 7, 8], "transduct": [6, 7], "example_smil": [6, 7], "get_set": [6, 7, 8, 9], "outsid": [6, 7, 8, 9], "likelihood": [6, 7], "problemat": [6, 7], "except": [6, 7, 9, 11, 13], "valueerror": [6, 7], "As": [6, 7, 8], "raw": [6, 7, 8, 9, 13], "551": [6, 7], "595": [6, 7], "w": [6, 7, 9], "fail": [6, 7, 9], "traceback": [6, 7], "recent": [6, 7], "_optim": [6, 7], "196": [6, 7], "_run_trial": [6, 7], "value_or_valu": [6, 7], "func": [6, 7], "pycharmproject": [6, 7], "optuna_az": [6, 8], "128": [6, 7], "__call__": [6, 7], "_validate_algo": [6, 7], "rais": [6, 7, 9, 11, 13], "598": 6, "summaris": [6, 7], "handl": [6, 7], "convent": [6, 7, 8, 11], "classic": [6, 7], "relev": [6, 7], "cutoff": [6, 7, 8, 13], "ouput": [6, 7], "reflect": [6, 7, 8], "abov": [6, 7, 8], "arguabl": [6, 7], "mpo": [6, 7], "pub": [6, 7], "ac": [6, 7], "full": [6, 7, 10], "jcim": [6, 7], "9b00237": [6, 7], "slide": [6, 7], "googl": [6, 7], "14pbd9ltxzfpsjhyxykflxnk8q80lhvnjimg8a3wqcrm": [6, 7], "edit": [6, 7], "calcault": [6, 7], "smilesbaseddescriptor": [6, 7], "architectur": [6, 7, 8], "quickli": [6, 7], "650": [6, 7], "root": [6, 7, 10, 11], "enqueu": [6, 7, 9], "manual": [6, 7], "activation__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "relu": [6, 7, 10], "aggregation__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "aggregation_norm__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "batch_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "depth__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "dropout__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "features_generator__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "ffn_hidden_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "ffn_num_layers__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "final_lr_ratio_exp__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "hidden_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "init_lr_ratio_exp__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "max_lr_exp__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "warmup_epochs_ratio__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "chempropregressor_algorithm_hash": [6, 7], "668a7428ff5cdb271b01c0925e8fea45": [6, 7], "416": 6, "6833": [6, 7], "034983241957": [6, 7], "chempropactiv": [6, 7, 10], "chempropaggreg": [6, 7, 10], "ensemble_size__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "epochs__668a7428ff5cdb271b01c0925e8fea45": [6, 7], "chempropfeatures_gener": [6, 7, 10], "531": [6, 7], "6341": 6, "72494883772": 6, "115": [6, 7], "500": [6, 7], "1500": 6, "safe": [6, 7], "nan": [6, 7, 9, 13, 14], "prompt": [6, 7], "due": [6, 7, 8, 9, 11], "deactiv": [6, 7], "own": [6, 7], "still": [6, 7], "commun": [6, 7], "facilit": [6, 7, 8, 10], "preset": [6, 7], "enqu": [6, 7], "bayesian": [6, 7], "split_chemprop": [6, 7, 10], "flag": [6, 7, 8, 13, 14], "n_chemprop_tri": [6, 7, 10], "desir": [6, 7], "undirect": [6, 7], "shown": [6, 7, 8], "aspect": [6, 7, 9], "princip": [6, 7, 8], "expand": [6, 7, 9], "differnt": [6, 7], "rememb": [6, 7], "unless": [6, 7], "alter": [6, 7, 10], "characterist": [6, 7, 8], "too": [6, 7, 10], "limit": [6, 7, 8, 10], "vice": [6, 7, 10], "versa": [6, 7, 10], "extens": [6, 7, 10], "trail": [6, 7, 10], "applic": [6, 7, 8, 10], "chanc": [6, 7], "caruana": [6, 7], "particular": [6, 7], "achiev": [6, 7, 8], "st": [6, 7], "figur": [6, 7, 8], "signal": [6, 7], "aka": [6, 7], "could": [6, 7, 8], "share": [6, 7, 13, 14], "until": [6, 7, 10], "longer": [6, 7, 11], "mt": [6, 7], "onc": [6, 7, 8, 13], "knowledg": [6, 7], "order": [6, 7, 8, 10, 13], "earlier": [6, 7, 8], "accompi": [6, 7], "train_side_info": [6, 7], "clog": [6, 7], "surfac": [6, 7], "area": [6, 7, 8], "psa": [6, 7], "293": [6, 7], "22475": [6, 7], "8088": [6, 7], "883": [6, 7], "32297": [6, 7], "6237": [6, 7], "835": [6, 7], "287": [6, 7], "33334": [6, 7], "2804": [6, 7], "314": [6, 7], "26075": [6, 7], "2533": [6, 7], "498": [6, 7], "278": [6, 7], "18917": [6, 7], "5102": [6, 7], "694": [6, 7], "246": [6, 7], "12575": [6, 7], "7244": [6, 7], "255": [6, 7], "14831": [6, 7], "4338": [6, 7], "895": [6, 7], "302": [6, 7], "26838": [6, 7], "2041": [6, 7], "057": [6, 7], "22298": [6, 7], "match": [6, 7], "train_side_info_cl": [6, 7], "clogp_gt2": [6, 7], "clogs_gt": [6, 7], "acceptors_gt5": [6, 7], "donors_gt0": [6, 7], "area_gt250": [6, 7], "psa_lt0": [6, 7], "832": 6, "809": [6, 7], "5817": [6, 7], "944294219682": 6, "chemprophyperoptregressor_algorithm_hash": [6, 7], "db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "ensemble_size__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "epochs__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "features_generator__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "num_iters__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "search_parameter_level__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "chempropsearch_parameter_level": [6, 7, 10], "aux_weight_pc__db9e60f9b8f0a43eff4b41917b6293d9": [6, 7], "841": 6, "5796": [6, 7], "344216469237": 6, "443": 6, "5795": [6, 7], "086276167766": 6, "468": [6, 7], "5820": [6, 7], "228288292862": 6, "012": [6, 7], "5852": [6, 7], "160071204277": 6, "inlfuenc": [6, 7], "henc": [6, 7, 8], "percent": [6, 7], "product": [6, 7], "user_attrs_trial_ran": [6, 7], "drop": [6, 7, 8, 9], "erron": [6, 7], "__": [6, 7], "params_aux_weight_pc": [6, 7], "conclud": [6, 7, 8], "produc": [6, 7], "overrid": [6, 7, 10], "situat": [6, 7, 8], "along": [6, 7], "potenti": [6, 7, 8], "compris": [6, 7, 8], "incompat": [6, 7, 11], "whilst": [6, 7, 8], "desciptor": [6, 7], "grei": [6, 7, 8], "tial": [6, 7], "what": [6, 7], "unpromis": [6, 7], "why": [6, 7, 8], "poor": [6, 7], "sampler": [6, 7], "incompta": [6, 7], "repeatedli": [6, 7], "hyerparamet": [6, 7], "ident": [6, 7, 11], "368": 6, "9525489095524835": [6, 7], "aux_weight_pc__cfa1990d5153c8812982f034d788d7e": [6, 7], "4824": [6, 7], "686269039228": [6, 7], "7731425652872588": [6, 7], "555": [6, 7], "4409": [6, 7], "946844928445": [6, 7], "791002332112292": [6, 7], "874": [6, 7], "329624779366306": [6, 7], "00015024763718638216": [6, 7], "917": [6, 7], "4396": [6, 7], "722635068717": [6, 7], "081": [6, 7], "309": [6, 7], "320": 6, "consult": [6, 7], "incompitbl": [6, 7], "algo": [6, 7, 10], "occur": [6, 7, 9], "assign": [6, 7, 8], "doe": [6, 7, 8, 9, 10, 11, 13], "params_algorithm_nam": [6, 7], "move_legend": [6, 7], "upper": [6, 7, 8], "bbox_to_anchor": [6, 7, 8], "never": [6, 7], "successfulli": [6, 7], "absenc": [6, 7], "8th": [6, 7], "miss": [6, 7, 9, 13, 14], "associ": [6, 7, 8], "asid": [6, 7], "mitig": [6, 7], "overal": [6, 7, 8], "serv": [6, 7, 12], "tl": [6, 7], "wider": [6, 7], "787": 6, "788": [6, 7], "activation__e0d3a442222d4b38f3aa1434851320db": [6, 7], "aggregation__e0d3a442222d4b38f3aa1434851320db": [6, 7], "aggregation_norm__e0d3a442222d4b38f3aa1434851320db": [6, 7], "batch_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "depth__e0d3a442222d4b38f3aa1434851320db": [6, 7], "dropout__e0d3a442222d4b38f3aa1434851320db": [6, 7], "features_generator__e0d3a442222d4b38f3aa1434851320db": [6, 7], "ffn_hidden_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "ffn_num_layers__e0d3a442222d4b38f3aa1434851320db": [6, 7], "final_lr_ratio_exp__e0d3a442222d4b38f3aa1434851320db": [6, 7], "hidden_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "init_lr_ratio_exp__e0d3a442222d4b38f3aa1434851320db": [6, 7], "max_lr_exp__e0d3a442222d4b38f3aa1434851320db": [6, 7], "warmup_epochs_ratio__e0d3a442222d4b38f3aa1434851320db": [6, 7], "e0d3a442222d4b38f3aa1434851320db": [6, 7], "4937": [6, 7], "540075659691": [6, 7], "ensemble_size__e0d3a442222d4b38f3aa1434851320db": [6, 7], "epochs__e0d3a442222d4b38f3aa1434851320db": [6, 7], "953": 6, "462": [6, 7], "5114": [6, 7], "7131239123555": [6, 7], "chempropregressorpretrained_algorithm_hash": [6, 7], "dfc518a76317f23d95e5aa5a3eac77f0": [6, 7], "frzn__dfc518a76317f23d95e5aa5a3eac77f0": [6, 7], "chempropfrzn": [6, 7, 10], "epochs__dfc518a76317f23d95e5aa5a3eac77f0": [6, 7], "cover": [6, 7], "global": [6, 7], "fair": [6, 7], "tl_studi": [6, 7], "loc": [6, 7, 8], "params_epoch": [6, 7], "fillna": [6, 7], "astyp": [6, 7, 8], "agg": [6, 7], "join": [6, 7, 8], "params_chempropregressor_algorithm_hash": [6, 7], "isna": [6, 7], "570": [6, 7], "452": [6, 7], "5891": [6, 7], "7552821093905": [6, 7], "994": [6, 7], "105": [6, 7], "5846": [6, 7], "8674879655655": [6, 7], "1600": [6, 7], "861": [6, 7], "5890": [6, 7], "94653501547": [6, 7], "77dfc8230317e08504ed5e643243fbc2": [6, 7], "frzn__77dfc8230317e08504ed5e643243fbc2": [6, 7], "epochs__77dfc8230317e08504ed5e643243fbc2": [6, 7], "283": 6, "881210303758": [6, 7], "right": [6, 7, 8], "ncol": [6, 7], "world": [6, 7, 8, 13, 14], "penultim": [6, 7, 10], "chemprop_model": [6, 7], "heatmap": [6, 7], "predictor": [6, 7, 9], "chemprop_fingerprint": [6, 7], "fingerprint_typ": [6, 7], "mpn": [6, 7], "cbar_kw": [6, 7], "semi": [6, 7], "supervis": [6, 7], "altern": [6, 7], "last_ffn": [6, 7], "howeev": [6, 7], "respect": [6, 7, 8], "kind": [6, 7, 8, 13], "confid": [6, 7], "calibratedclassifiercv": [6, 7], "understand": [6, 7], "predict_proba": [6, 7, 9], "gave": [6, 7], "close": [6, 7, 8], "actual": [6, 7, 8], "topic": [6, 7], "sigmoid": [6, 7, 10], "review": [6, 7], "those": [6, 7, 8, 9], "calibration_curv": [6, 7], "collect": [6, 7], "defaultdict": [6, 7], "precision_scor": [6, 7], "recall_scor": [6, 7], "f1_score": [6, 7], "brier_score_loss": [6, 7], "log_loss": [6, 7], "roc_auc_scor": [6, 7], "n_job": [6, 7, 10, 12], "calibrated_rf": [6, 7], "calibrated_model": [6, 7], "701": [6, 7], "703": 6, "775": [6, 7], "8353535353535354": [6, 7], "calibratedclassifiercvwithva_algorithm_hash": [6, 7], "e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "n_folds__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "max_depth__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "n_estimators__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "max_features__e788dfbfc5075967acb5ddf9d971ea20": [6, 7], "uncalibr": [6, 7], "uncalibrated_rf": [6, 7], "uncalibrated_model": [6, 7], "306": 6, "352": 6, "719": [6, 7], "8185858585858585": [6, 7], "randomforestclassifier_algorithm_hash": [6, 7], "167e1e88dd2a80133e317c78f009bdc9": [6, 7], "max_depth__167e1e88dd2a80133e317c78f009bdc9": [6, 7], "n_estimators__167e1e88dd2a80133e317c78f009bdc9": [6, 7], "max_features__167e1e88dd2a80133e317c78f009bdc9": [6, 7], "conserv": [6, 7], "1000": [6, 7, 8], "random_st": [6, 7, 13, 14], "123": [6, 7], "calibrated_predict": [6, 7], "uncalibrated_predict": [6, 7], "cal_df": [6, 7], "datafram": [6, 7, 8, 9, 12, 13], "boxplot": [6, 7], "melt": [6, 7], "set_ylabel": [6, 7, 8], "behaviour": [6, 7, 8], "curv": [6, 7, 8], "reliabl": [6, 7], "diagram": [6, 7], "against": [6, 7], "figsiz": [6, 7, 8], "ax1": [6, 7], "subplot2grid": [6, 7], "rowspan": [6, 7], "ax2": [6, 7], "perfectli": [6, 7, 8], "pred": [6, 7], "fraction_of_posit": [6, 7], "mean_predicted_valu": [6, 7], "n_bin": [6, 7], "brier": [6, 7], "2f": [6, 7], "hist": [6, 7], "histtyp": [6, 7], "lw": [6, 7], "set_ylim": [6, 7], "legend": [6, 7, 8], "set_titl": [6, 7], "set_xlabel": [6, 7, 8], "center": [6, 7, 8], "tight_layout": [6, 7, 8], "compos": [6, 7], "refin": [6, 7], "notic": [6, 7], "significantli": [6, 7], "cell": [6, 7], "accur": [6, 7], "alloc": [6, 7, 9], "y_prob": [6, 7], "ye": [6, 7], "score_nam": [6, 7], "__name__": [6, 7], "replac": [6, 7, 11], "capit": [6, 7], "score_df": [6, 7], "set_index": [6, 7], "decim": [6, 7], "roc": [6, 7], "auc": [6, 7, 9], "184705": [6, 7], "547129": [6, 7], "830565": [6, 7], "744048": [6, 7], "784929": [6, 7], "716536": [6, 7], "175297": [6, 7], "529474": [6, 7], "811209": [6, 7], "818452": [6, 7], "814815": [6, 7], "714104": [6, 7], "va": [6, 7], "multipoint": [6, 7], "0c00476": [6, 7], "margin": [6, 7, 8], "bounari": [6, 7], "384": [6, 7], "469": [6, 7], "8213131313131313": [6, 7], "79765fbec1586f3c917ff30de274fdb4": [6, 7], "n_folds__79765fbec1586f3c917ff30de274fdb4": [6, 7], "max_depth__79765fbec1586f3c917ff30de274fdb4": [6, 7], "n_estimators__79765fbec1586f3c917ff30de274fdb4": [6, 7], "max_features__79765fbec1586f3c917ff30de274fdb4": [6, 7], "uncert": [6, 7, 9], "chem": [6, 7, 8, 9], "allchem": [6, 7], "pandastool": [6, 7, 8], "rdconfig": [6, 7], "datastruct": [6, 7], "train_df": [6, 7], "addmoleculecolumntofram": [6, 7], "includefingerprint": [6, 7], "getmorganfingerprint": [6, 7], "nn": [6, 7], "bulktanimotosimilar": [6, 7], "va_pr": [6, 7], "va_uncert": [6, 7], "dtm": [6, 7], "trelli": [6, 7], "fig": [6, 7, 8], "subplot": [6, 7, 8], "sharei": [6, 7], "regplot": [6, 7], "referenc": [6, 7], "boundari": [6, 7, 8, 13, 15], "neither": [6, 7], "nor": [6, 7], "dissimilar": [6, 7], "cp_pred_ensembl": [6, 7], "cp_uncert_ensembl": [6, 7], "886": 6, "933": [6, 7], "activation__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "aggregation__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "batch_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "depth__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "dropout__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "features_generator__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "hidden_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "chempropclassifier_algorithm_hash": [6, 7], "fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "137": [6, 7], "65625": [6, 7], "ensemble_size__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "epochs__fd833c2dde0b7147e6516ea5eebb2657": [6, 7], "midpoint": [6, 7], "mont": [6, 7], "carlo": [6, 7], "virtual": [6, 7, 9], "931": 6, "activation__c73885c5d5a4182168b8b002d321965a": [6, 7], "aggregation__c73885c5d5a4182168b8b002d321965a": [6, 7], "aggregation_norm__c73885c5d5a4182168b8b002d321965a": [6, 7], "batch_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "depth__c73885c5d5a4182168b8b002d321965a": [6, 7], "dropout__c73885c5d5a4182168b8b002d321965a": [6, 7], "features_generator__c73885c5d5a4182168b8b002d321965a": [6, 7], "ffn_hidden_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "ffn_num_layers__c73885c5d5a4182168b8b002d321965a": [6, 7], "final_lr_ratio_exp__c73885c5d5a4182168b8b002d321965a": [6, 7], "hidden_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "init_lr_ratio_exp__c73885c5d5a4182168b8b002d321965a": [6, 7], "max_lr_exp__c73885c5d5a4182168b8b002d321965a": [6, 7], "warmup_epochs_ratio__c73885c5d5a4182168b8b002d321965a": [6, 7], "c73885c5d5a4182168b8b002d321965a": [6, 7], "371": [6, 7], "46875": [6, 7], "ensemble_size__c73885c5d5a4182168b8b002d321965a": [6, 7], "epochs__c73885c5d5a4182168b8b002d321965a": [6, 7], "cp_pred_dropout": [6, 7], "cp_uncert_dropout": [6, 7], "proabil": [6, 7], "va_predict": [6, 7], "correl": [6, 7, 8], "drouput": [6, 7], "uncertatinti": [6, 7], "cp_uncert_delta": [6, 7], "categor": [6, 7, 13], "unit": [6, 7, 8], "parsabl": [6, 7], "cast": [6, 7], "appropri": [6, 7], "befor": [6, 7, 8, 13], "choic": [6, 7, 13], "346": [6, 7], "391": [6, 7], "582": [6, 7], "4259": 6, "713886871285": 6, "mapie_algorithm_hash": [6, 7], "976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "mapie_alpha__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "max_depth__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "n_estimators__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "max_features__976d211e4ac64e5568d369bcddd3aeb1": [6, 7], "analysi": [6, 7, 8, 9], "perfom": [6, 7], "post": [6, 7], "mapie_pr": [6, 7], "mapie_unc": [6, 7], "bar": [6, 7], "visualis": [6, 7], "errorbar": [6, 7], "yerr": [6, 7], "ab": [6, 7], "fmt": [6, 7], "black": [6, 7, 8], "ecolor": [6, 7], "grai": [6, 7], "elinewidth": [6, 7], "capsiz": [6, 7], "move": [6, 7, 11], "analys": [6, 7, 8], "width": [6, 7, 8], "alpha_impact": [6, 7], "ma": [6, 7], "unc_df": [6, 7], "unc": [6, 7], "reset_index": [6, 7, 8], "concat": [6, 7], "lineplot": [6, 7], "err_styl": [6, 7], "se": [6, 7], "incorpor": [6, 7], "tradition": [6, 7], "unsupport": [6, 7], "kernelexplain": [6, 7, 9], "shaplei": [6, 7], "explan": [6, 7], "slundberg": [6, 7], "game": [6, 7], "credit": [6, 7], "theori": [6, 7], "publish": [6, 7], "comopsit": [6, 7], "101": [6, 7], "146": 6, "_ridg": [6, 7], "243": [6, 7], "userwarn": [6, 7, 8], "singular": [6, 7], "matrix": [6, 7], "dual": [6, 7], "578": 6, "36553318492385256": 6, "9346053663473015": 6, "dga": [6, 7], "dgp": [6, 7], "dgtot": [6, 7], "sa": [6, 7], "sdc": [6, 7], "sdx": [6, 7], "numhacceptor": [6, 7], "numhdonor": [6, 7], "maxabsestateindex": [6, 7], "maxestateindex": [6, 7], "minabsestateindex": [6, 7], "minestateindex": [6, 7], "qed": [6, 7], "sp": [6, 7], "heavyatommolwt": [6, 7], "exactmolwt": [6, 7], "numvalenceelectron": [6, 7], "numradicalelectron": [6, 7], "maxpartialcharg": [6, 7], "minpartialcharg": [6, 7], "maxabspartialcharg": [6, 7], "minabspartialcharg": [6, 7], "fpdensitymorgan1": [6, 7], "fpdensitymorgan2": [6, 7], "fpdensitymorgan3": [6, 7], "bcut2d_mwhi": [6, 7], "bcut2d_mwlow": [6, 7], "bcut2d_chghi": [6, 7], "bcut2d_chglo": [6, 7], "bcut2d_logphi": [6, 7], "bcut2d_logplow": [6, 7], "bcut2d_mrhi": [6, 7], "bcut2d_mrlow": [6, 7], "avgipc": [6, 7], "balabanj": [6, 7], "bertzct": [6, 7], "chi0": [6, 7], "chi0n": [6, 7], "chi0v": [6, 7], "chi1": [6, 7], "chi1n": [6, 7], "chi1v": [6, 7], "chi2n": [6, 7], "chi2v": [6, 7], "chi3n": [6, 7], "chi3v": [6, 7], "chi4n": [6, 7], "chi4v": [6, 7], "hallkieralpha": [6, 7], "ipc": [6, 7], "kappa1": [6, 7], "kappa2": [6, 7], "kappa3": [6, 7], "labuteasa": [6, 7], "peoe_vsa1": [6, 7], "peoe_vsa10": [6, 7], "peoe_vsa11": [6, 7], "peoe_vsa12": [6, 7], "peoe_vsa13": [6, 7], "peoe_vsa14": [6, 7], "peoe_vsa2": [6, 7], "peoe_vsa3": [6, 7], "peoe_vsa4": [6, 7], "peoe_vsa5": [6, 7], "peoe_vsa6": [6, 7], "peoe_vsa7": [6, 7], "peoe_vsa8": [6, 7], "peoe_vsa9": [6, 7], "smr_vsa1": [6, 7], "smr_vsa10": [6, 7], "smr_vsa2": [6, 7], "smr_vsa3": [6, 7], "smr_vsa4": [6, 7], "smr_vsa5": [6, 7], "smr_vsa6": [6, 7], "smr_vsa7": [6, 7], "smr_vsa8": [6, 7], "smr_vsa9": [6, 7], "slogp_vsa1": [6, 7], "slogp_vsa10": [6, 7], "slogp_vsa11": [6, 7], "slogp_vsa12": [6, 7], "slogp_vsa2": [6, 7], "slogp_vsa3": [6, 7], "slogp_vsa4": [6, 7], "slogp_vsa5": [6, 7], "slogp_vsa6": [6, 7], "slogp_vsa7": [6, 7], "slogp_vsa8": [6, 7], "slogp_vsa9": [6, 7], "estate_vsa1": [6, 7], "estate_vsa10": [6, 7], "estate_vsa11": [6, 7], "estate_vsa2": [6, 7], "estate_vsa3": [6, 7], "estate_vsa4": [6, 7], "estate_vsa5": [6, 7], "estate_vsa6": [6, 7], "estate_vsa7": [6, 7], "estate_vsa8": [6, 7], "estate_vsa9": [6, 7], "vsa_estate1": [6, 7], "vsa_estate10": [6, 7], "vsa_estate2": [6, 7], "vsa_estate3": [6, 7], "vsa_estate4": [6, 7], "vsa_estate5": [6, 7], "vsa_estate6": [6, 7], "vsa_estate7": [6, 7], "vsa_estate8": [6, 7], "vsa_estate9": [6, 7], "fractioncsp3": [6, 7], "heavyatomcount": [6, 7], "nhohcount": [6, 7], "nocount": [6, 7], "numaliphaticcarbocycl": [6, 7], "numaliphaticheterocycl": [6, 7], "numaliphaticr": [6, 7], "numaromaticcarbocycl": [6, 7], "numaromaticheterocycl": [6, 7], "numaromaticr": [6, 7], "numheteroatom": [6, 7], "numrotatablebond": [6, 7], "numsaturatedcarbocycl": [6, 7], "numsaturatedheterocycl": [6, 7], "numsaturatedr": [6, 7], "ringcount": [6, 7], "mollogp": [6, 7], "molmr": [6, 7], "fr_al_coo": [6, 7], "fr_al_oh": [6, 7], "fr_al_oh_notert": [6, 7], "fr_arn": [6, 7], "fr_ar_coo": [6, 7], "fr_ar_n": [6, 7], "fr_ar_nh": [6, 7], "fr_ar_oh": [6, 7], "fr_coo": [6, 7], "fr_coo2": [6, 7], "fr_c_o": [6, 7], "fr_c_o_nocoo": [6, 7], "fr_c_": [6, 7], "fr_hoccn": [6, 7], "fr_imin": [6, 7], "fr_nh0": [6, 7], "fr_nh1": [6, 7], "fr_nh2": [6, 7], "fr_n_o": [6, 7], "fr_ndealkylation1": [6, 7], "fr_ndealkylation2": [6, 7], "fr_nhpyrrol": [6, 7], "fr_sh": [6, 7], "fr_aldehyd": [6, 7], "fr_alkyl_carbam": [6, 7], "fr_alkyl_halid": [6, 7], "fr_allylic_oxid": [6, 7], "fr_amid": [6, 7], "fr_amidin": [6, 7], "fr_anilin": [6, 7], "fr_aryl_methyl": [6, 7], "fr_azid": [6, 7], "fr_azo": [6, 7], "fr_barbitur": [6, 7], "fr_benzen": [6, 7], "fr_benzodiazepin": [6, 7], "fr_bicycl": [6, 7], "fr_diazo": [6, 7], "fr_dihydropyridin": [6, 7], "fr_epoxid": [6, 7], "fr_ester": [6, 7], "fr_ether": [6, 7], "fr_furan": [6, 7], "fr_guanido": [6, 7], "fr_halogen": [6, 7], "fr_hdrzine": [6, 7], "fr_hdrzone": [6, 7], "fr_imidazol": [6, 7], "fr_imid": [6, 7], "fr_isocyan": [6, 7], "fr_isothiocyan": [6, 7], "fr_keton": [6, 7], "fr_ketone_topliss": [6, 7], "fr_lactam": [6, 7], "fr_lacton": [6, 7], "fr_methoxi": [6, 7], "fr_morpholin": [6, 7], "fr_nitril": [6, 7], "fr_nitro": [6, 7], "fr_nitro_arom": [6, 7], "fr_nitro_arom_nonortho": [6, 7], "fr_nitroso": [6, 7], "fr_oxazol": [6, 7], "fr_oxim": [6, 7], "fr_para_hydroxyl": [6, 7], "fr_phenol": [6, 7], "fr_phenol_noorthohbond": [6, 7], "fr_phos_acid": [6, 7], "fr_phos_est": [6, 7], "fr_piperdin": [6, 7], "fr_piperzin": [6, 7], "fr_priamid": [6, 7], "fr_prisulfonamd": [6, 7], "fr_pyridin": [6, 7], "fr_quatn": [6, 7], "fr_sulfid": [6, 7], "fr_sulfonamd": [6, 7], "fr_sulfon": [6, 7], "fr_term_acetylen": [6, 7], "fr_tetrazol": [6, 7], "fr_thiazol": [6, 7], "fr_thiocyan": [6, 7], "fr_thiophen": [6, 7], "fr_unbrch_alkan": [6, 7], "fr_urea": [6, 7], "shap_valu": [6, 7], "2227": [6, 7], "042517e": 6, "2229": [6, 7], "025057e": 6, "2228": [6, 7], "804876e": 6, "2267": [6, 7], "372192e": 6, "00": [6, 7], "2230": [6, 7], "106846e": 6, "352611e": 6, "1375": 6, "1376": 6, "s1": 6, "n1c": [6, 7], "1784": 6, "1785": 6, "995": 6, "1617": 6, "1618": 6, "1570": [6, 7], "contrinubt": [6, 7], "datset": [6, 7], "unscaledphyschemjazzi": [6, 7], "rank": [6, 7, 9], "053": 6, "742": 6, "t": [6, 7, 8, 9, 10], "kekul": [6, 7], "unkekul": [6, 7], "rational": [6, 7], "rationale_scor": [6, 7], "097": [6, 7], "ch3": [6, 7], "ch": [6, 7], "389": [6, 7, 8], "151": [6, 7], "485": [6, 7], "c1c": [6, 7], "c1n": [6, 7], "ch2": [6, 7], "nh2": [6, 7], "565": [6, 7], "nn1cc1c": [6, 7], "c1cccc": [6, 7], "110": [6, 7], "997": [6, 7], "contian": [6, 7], "second": [6, 7], "dummi": [6, 7], "third": [6, 7], "smallest": [6, 7], "made": [6, 7, 8], "fourth": [6, 7], "irregularli": [6, 7], "xc50": [6, 7, 8], "log10": [6, 7, 8, 13, 15], "6th": [6, 7], "convers": [6, 7, 8, 13, 15], "logbas": [6, 7, 8, 13, 15], "logneg": [6, 7, 8, 13, 15], "negat": [6, 7, 8, 13, 15], "transformed_studi": [6, 7], "transform_exampl": [6, 7], "5959493772536109": 6, "6571993250300608": [6, 7], "426": 6, "1511102853256885": [6, 7], "516": 6, "2487063317112765": [6, 7], "6714912461080983": [6, 7], "2725944467796781": [6, 7], "606": [6, 7], "194926264155893": [6, 7], "7520919188596032": [6, 7], "748": 6, "7803723847416691": [6, 7], "764": [6, 7], "6397753979196248": [6, 7], "781": 6, "151110299986041": [6, 7], "798": 6, "151110111437006": [6, 7], "5410418750776741": [6, 7], "829": [6, 7], "7183231137124538": [6, 7], "845": [6, 7], "2721824844856162": [6, 7], "912": [6, 7], "19009294702225": [6, 7], "929": 6, "945": [6, 7], "5585323973564646": [6, 7], "3169218304262786": [6, 7], "028": 6, "7974925066137679": [6, 7], "045": 6, "218395226466336": [6, 7], "062": [6, 7], "1474226942497083": [6, 7], "066": [6, 7], "0239005731675412": [6, 7], "150": [6, 7], "169": [6, 7], "178901060853144": [6, 7], "187": 6, "27137790098830755": [6, 7], "206": [6, 7], "2710284516876423": [6, 7], "6273152492418945": [6, 7], "1900929470222508": [6, 7], "361": 6, "1907041717628215": [6, 7], "398": [6, 7], "3209075619139279": [6, 7], "403": 6, "2709423025014604": [6, 7], "438": [6, 7], "3133943310851415": [6, 7], "461": [6, 7], "257769959239938": [6, 7], "40359637945134746": 6, "658": 6, "4127882135896648": [6, 7], "663": 6, "734": [6, 7], "9246005133276612": [6, 7], "885": [6, 7], "8908739215746118": 6, "905": [6, 7], "107536316777608": [6, 7], "054360360588395": [6, 7], "964": 6, "5428179904345867": [6, 7], "983": 6, "5696273642213351": [6, 7], "007": [6, 7], "27099769667470536": [6, 7], "1580741708125475": [6, 7], "2709564785634315": [6, 7], "10900413894771653": [6, 7], "056": [6, 7], "2709799905898163": [6, 7], "13705914456987853": [6, 7], "080": [6, 7], "27097230608092054": [6, 7], "12790870116376127": [6, 7], "102": [6, 7], "2709499903064464": [6, 7], "10123180962907431": [6, 7], "2710895886052581": [6, 7], "26565663774320425": [6, 7], "149": 6, "2708711012023424": [6, 7], "005637048678674678": [6, 7], "174": [6, 7], "27092322402109364": [6, 7], "06902647427781451": [6, 7], "2712140349882": [6, 7], "4076704953178294": [6, 7], "27090080367174": [6, 7], "04187106800188596": [6, 7], "27086925247190047": [6, 7], "003371853599610078": [6, 7], "2708933298483799": [6, 7], "032781796328385376": [6, 7], "27087205624489635": [6, 7], "006806773659187283": [6, 7], "2708869511176179": [6, 7], "025009489814943348": [6, 7], "2711465077924297": [6, 7], "3311125627707556": [6, 7], "369": [6, 7], "2708756855936628": [6, 7], "011249102380159387": [6, 7], "395": [6, 7], "27087301924224993": [6, 7], "007985924302396141": [6, 7], "419": [6, 7], "2708685399954944": [6, 7], "00249856291483601": [6, 7], "444": [6, 7], "27121879554836553": [6, 7], "4130244908975993": [6, 7], "470": 6, "2708693196600531": [6, 7], "0034541978803366022": [6, 7], "27110195265802334": [6, 7], "27994943662091765": [6, 7], "2708682582859318": [6, 7], "0021532199144365088": [6, 7], "545": [6, 7], "27087024523986086": [6, 7], "0045884092728113585": [6, 7], "569": 6, "27087351807632193": [6, 7], "008596600952859433": [6, 7], "2710818633795896": [6, 7], "2567049271070902": [6, 7], "620": [6, 7], "27103241786565463": [6, 7], "1990111983307052": [6, 7], "2710350879598171": [6, 7], "20214459724424078": [6, 7], "2708688328221868": [6, 7], "00285750520671645": [6, 7], "697": [6, 7], "27100832234449684": [6, 7], "17064008990759916": [6, 7], "721": [6, 7], "27268613236193845": [6, 7], "8725420109733135": [6, 7], "747": [6, 7], "27119617446689237": [6, 7], "387533542012365": [6, 7], "773": 6, "2708691110831552": [6, 7], "0031985656730512953": [6, 7], "800": [6, 7], "27086852174155146": [6, 7], "002476186542950981": [6, 7], "27135383618835024": [6, 7], "5626643670396761": [6, 7], "2709819654433871": [6, 7], "1394077979875128": [6, 7], "2718548944510965": [6, 7], "0858347526799794": [6, 7], "1508084699212935": [6, 7], "03329943145150872": [6, 7], "00025672309762227527": [6, 7], "27249853374634975": [6, 7], "702026434077893": [6, 7], "27095660957755363": [6, 7], "10916094511173127": [6, 7], "987": [6, 7], "27102160995407715": [6, 7], "18630665884100353": [6, 7], "27095708822582026": [6, 7], "10973377642487026": [6, 7], "041": [6, 7], "27088222008661084": [6, 7], "019235980282946118": [6, 7], "2708703086029017": [6, 7], "004666043957133775": [6, 7], "27095279044622245": [6, 7], "1045877457096882": [6, 7], "2709408288690431": [6, 7], "09023455456986404": [6, 7], "152": [6, 7], "9289218260898663": [6, 7], "8200088368788958": [6, 7], "181": [6, 7], "27086675101898655": [6, 7], "00030502148265565063": [6, 7], "209": 6, "2710491243757999": [6, 7], "21858260742423916": [6, 7], "239": [6, 7], "1491615840508995": [6, 7], "024725853754515203": [6, 7], "2709462479577586": [6, 7], "0967427718847167": [6, 7], "default_studi": [6, 7], "837": [6, 7], "3501": [6, 7], "942111261296": [6, 7], "5451": [6, 7], "207265576796": [6, 7], "1049201007814": [6, 7], "9964": [6, 7], "541364058234": [6, 7], "003": [6, 7], "3543": [6, 7], "953608539901": [6, 7], "6837": [6, 7], "057544630979": [6, 7], "043": [6, 7], "2507": [6, 7], "1794330606067": [6, 7], "21534": [6, 7], "719219668405": [6, 7], "2899": [6, 7], "736555614694": [6, 7], "294e": [6, 7], "760e": [6, 7], "167": 6, "21674": [6, 7], "445000284228": [6, 7], "1049203123567": [6, 7], "1049192609138": [6, 7], "3630": [6, 7], "72768093756": [6, 7], "3431": [6, 7], "942816967268": [6, 7], "6908": [6, 7], "462045154488": [6, 7], "5964": [6, 7], "65935954044": [6, 7], "332": [6, 7], "21070": [6, 7], "107195348774": [6, 7], "348": 6, "4977": [6, 7], "068508997133": [6, 7], "8873": [6, 7], "669262669626": [6, 7], "21387": [6, 7], "63697424318": [6, 7], "9958": [6, 7], "573006910125": [6, 7], "463": [6, 7], "5182695600183": [6, 7], "467": [6, 7], "20684": [6, 7], "56412138056": [6, 7], "3435882510586": [6, 7], "7068": [6, 7], "705383113378": [6, 7], "613": 6, "7150": [6, 7], "482090052133": [6, 7], "680": [6, 7], "698": 6, "203": [6, 7], "93637462922368": [6, 7], "762": [6, 7], "779": [6, 7], "2570": [6, 7], "5111262532305": [6, 7], "21987": [6, 7], "659957192194": [6, 7], "9889": [6, 7], "493204596083": [6, 7], "819": [6, 7], "7172": [6, 7], "208490771303": [6, 7], "856": [6, 7], "9804": [6, 7], "512701665093": [6, 7], "881": [6, 7], "9165": [6, 7], "74081120673": [6, 7], "949": [6, 7], "543": [6, 7], "0280270800017": [6, 7], "161": [6, 7], "1602933782954": [6, 7], "888460860864": [6, 7], "109": 6, "8414": [6, 7], "932694243476": [6, 7], "2270": [6, 7], "540799189148": 6, "10383": [6, 7], "79559309305": [6, 7], "20815": [6, 7], "025469865475": [6, 7], "7560385808573": [6, 7], "244": 6, "5264": [6, 7], "4700789389035": [6, 7], "3668": [6, 7], "255064135424": [6, 7], "290": 6, "156": [6, 7], "12174877890536": [6, 7], "793408178086295": [6, 7], "99902820845678": [6, 7], "316": [6, 7], "371632749506": [6, 7], "88307313087517": [6, 7], "140915461519354": [6, 7], "340": [6, 7], "153": [6, 7], "66773675231477": [6, 7], "177324126813716": [6, 7], "77906017834145": [6, 7], "52056745848623": [6, 7], "4565714180547": [6, 7], "6710444346508": [6, 7], "392": [6, 8], "30976119334312": [6, 7], "62916671166313": [6, 7], "023639423189294": [6, 7], "418": [6, 7], "053696900694": [6, 7], "914617418880486": [6, 7], "31140591484044": [6, 7], "201": [6, 7], "33573874994386": [6, 7], "569769302718845": [6, 7], "5781354926491789": [6, 7], "190": [6, 7], "1384885119049": [6, 7], "87666716965626": [6, 7], "2537791489618": [6, 7], "076949848299": [6, 7], "9559574710535281": [6, 7], "0032830967319653665": [6, 7], "522": 6, "764974036324": [6, 7], "03910427457823": [6, 7], "406811480459925": [6, 7], "546": 6, "164": [6, 7], "4477304958181": [6, 7], "701690847791482": [6, 7], "819274780536123": [6, 7], "573": [6, 7], "87939164358104": [6, 7], "32187661108304": [6, 7], "660320437878754": [6, 7], "601": [6, 7], "01705178481896": [6, 7], "61397716361812": [6, 7], "603665957830847": [6, 7], "629": [6, 7], "155": [6, 7], "73257312230092": [6, 7], "759645965959294": [6, 7], "503212714246787": [6, 7], "656": [6, 7], "154": [6, 7], "46848394144124": [6, 7], "8546740801317": [6, 7], "35327336610912": [6, 7], "683": 6, "20421802817864": [6, 7], "57596974747163": [6, 7], "84756262407801": [6, 7], "709": 6, "51233215278089": [6, 7], "3564642040401464": [6, 7], "5034542273159819": [6, 7], "68667089892196": [6, 7], "034895878929095": [6, 7], "03653571911285094": [6, 7], "52277054278186": [6, 7], "01961499216484045": [6, 7], "670937191883546": [6, 7], "28722475694815": [6, 7], "012434370509176538": [6, 7], "34222704431493": [6, 7], "816": [6, 7], "87402050281146": [6, 7], "008452015347522093": [6, 7], "914863578437455": [6, 7], "844": 6, "38847505937936": [6, 7], "01573542234868893": [6, 7], "99307522974174": [6, 7], "870": 6, "96336195786391": [6, 7], "009845516063879428": [6, 7], "59422914099683": [6, 7], "19345618324213": [6, 7], "009382525091504246": [6, 7], "35573659237662": [6, 7], "30772721342525": [6, 7], "010579672066291478": [6, 7], "35550323165882": [6, 7], "954": [6, 7], "23970902543148": [6, 7], "013369359066405863": [6, 7], "4744102498801": [6, 7], "984": 6, "34331248758777": [6, 7], "011398351701814368": [6, 7], "54146340620301": [6, 7], "104535853341": [6, 7], "011708779850509646": [6, 7], "682286191624579e": [6, 7], "040": [6, 7], "0653774146952": [6, 7], "009806826677473646": [6, 7], "90274406278985": [6, 7], "64646042813787": [6, 7], "0038598153381434685": [6, 7], "20918134828555": [6, 7], "68420472011734": [6, 7], "0032474576673554513": [6, 7], "35551178979624": [6, 7], "85985201823172": [6, 7], "003187930738019005": [6, 7], "29431603544847": [6, 7], "21583898009355": [6, 7], "003122319313153475": [6, 7], "83526418992966": [6, 7], "185": 6, "34787242859676": [6, 7], "002781955938462633": [6, 7], "76228981520067": [6, 7], "213": [6, 7], "194": [6, 7], "70914272129673": [6, 7], "0023173546614751305": [6, 7], "3000082904498813": [6, 7], "10492031097328": [6, 7], "002606064524407": [6, 7], "7861330234653922e": [6, 7], "1049154281806": [6, 7], "0029210589377408366": [6, 7], "200933937391094e": [6, 7], "10492028002287": [6, 7], "06431564840324226": [6, 7], "2981641934644904e": [6, 7], "56066541774658": [6, 7], "0010848843623839548": [6, 7], "151493073951163": [6, 7], "76337597039308": [6, 7], "004134805589645341": [6, 7], "88115336652716": [6, 7], "58009587759925": [6, 7], "004763418454688096": [6, 7], "02920758025023": [6, 7], "415": [6, 7], "113": [6, 7], "35230417583477": [6, 7], "0009098023238189749": [6, 7], "57100980886017": [6, 7], "445": [6, 7], "30807467406214": [6, 7], "03739791555156691": [6, 7], "12818940557025": [6, 7], "476": 6, "44100655116532": [6, 7], "006380481141720477": [6, 7], "4882351186755": [6, 7], "505": 6, "35181001564942": [6, 7], "0036244007454981787": [6, 7], "608797806921866": [6, 7], "533": 6, "124": [6, 7], "3719027482892": [6, 7], "0014198536004321608": [6, 7], "05588994284273": [6, 7], "562": [6, 7], "28568052794907": [6, 7], "005434972462746285": [6, 7], "215759789700954": [6, 7], "20325": [6, 7], "66479442037": [6, 7], "9696417046589247": [6, 7], "132": [6, 7], "21507621375022": [6, 7], "0004528978867024753": [6, 7], "80386923876023": [6, 7], "655": [6, 7], "85570350846885": [6, 7], "0016948043699497222": [6, 7], "455627755557016": [6, 7], "contrast": [6, 7, 8], "relplot": [6, 7], "col": [6, 7, 8], "facet_kw": [6, 7], "axisgrid": [6, 7, 8], "facetgrid": [6, 7], "0x7ff3a1d3ba30": 6, "noramlis": [6, 7], "unlog": [6, 7], "yield": [6, 7, 8, 13, 14], "mse": [6, 7], "1126": [6, 7], "56968721": [6, 7], "20237903": [6, 7], "revers": [6, 7, 8, 13, 15], "onto": [6, 7], "action": [6, 7], "importantli": [6, 7], "easili": [6, 7, 8], "94824194": [6, 7], "92008694": [6, 7], "instruct": [6, 7], "untransform": [6, 7], "wish": [6, 7], "cut": [6, 7, 8], "10um": [6, 7], "ptr_config_log_transform": [6, 7], "ptr_transformed_studi": [6, 7], "ptr_and_transform_exampl": [6, 7], "002341918451736244": 6, "0024908979029632677": [6, 7], "526": [6, 7], "007901407671048116": [6, 7], "00496231674623194": [6, 7], "585": [6, 7], "0026848278110363512": [6, 7], "0010872728889471893": [6, 7], "624": 6, "008706109201510277": [6, 7], "704": [6, 7], "002999462459688866": 6, "00825680029907454": [6, 7], "007901407993550248": [6, 7], "753": 6, "007901405163828307": [6, 7], "769": [6, 7], "0021653695362066753": [6, 7], "002869169486971014": [6, 7], "804": 6, "0010855652626111146": [6, 7], "867": [6, 7], "005505338042993082": [6, 7], "884": 6, "901": [6, 7], "002236800860454562": [6, 7], "955": [6, 7], "006105985607235417": [6, 7], "971": 6, "004846526544994462": [6, 7], "119": 6, "006964668794465202": [6, 7], "204": 6, "0029994624596888677": [6, 7], "222": [6, 7], "008384326901042542": [6, 7], "001082194093844804": [6, 7], "256": 6, "0010807084256204563": [6, 7], "321": 6, "338": [6, 7], "422": 6, "458": 6, "005247934991526694": [6, 7], "480": [6, 7], "0010803393728928605": [6, 7], "005218354425190125": [6, 7], "503": 6, "521": 6, "004999207507691546": [6, 7], "0015694919308122948": [6, 7], "0019757694194001397": 6, "664": [6, 7], "730": [6, 7], "002341918451736245": [6, 7], "00368328296527152": [6, 7], "003412828259848677": [6, 7], "836": [6, 7], "004412110711416997": [6, 7], "893": [6, 7], "0021743798524909573": [6, 7], "911": [6, 7], "0022761245849848527": [6, 7], "934": 6, "0010805768178458735": [6, 7], "959": 6, "001080400188305814": [6, 7], "982": 6, "0010805009783570441": [6, 7], "0010804680472500541": [6, 7], "030": [6, 7], "0010803723579987025": [6, 7], "001080969596032512": [6, 7], "0010800333715082816": [6, 7], "0010802574700236845": [6, 7], "0010814994986419817": [6, 7], "147": [6, 7], "001080161136846237": [6, 7], "0010800254136811547": [6, 7], "197": [6, 7], "0010801290036870739": [6, 7], "001080037482216557": [6, 7], "0010801015705851358": [6, 7], "0010812122378841013": [6, 7], "295": [6, 7], "0010800531021304936": [6, 7], "00108004162698813": [6, 7], "0010800223466649803": [6, 7], "0010815197263834202": [6, 7], "394": [6, 8], "0010800257029027847": [6, 7], "0010810223438672223": [6, 7], "442": 6, "0010800211339555509": [6, 7], "0010800296871141684": [6, 7], "492": [6, 7], "0010800437739166451": [6, 7], "517": [6, 7], "0010809366267195716": [6, 7], "540": 6, "001080725386603206": [6, 7], "0010807368035830652": [6, 7], "0010800236072155854": [6, 7], "616": 6, "0010806223050773966": [6, 7], "642": [6, 7], "0010876516369772728": [6, 7], "669": 6, "00108142358144501": [6, 7], "0010800248050489667": [6, 7], "001080022268085466": [6, 7], "0010820922958715991": [6, 7], "771": [6, 7], "0010805094397523254": [6, 7], "0010841993753324146": [6, 7], "826": 6, "007899735988203994": [6, 7], "853": 6, "0010868762004637347": [6, 7], "001080400750193767": [6, 7], "907": [6, 7], "0010806791616300314": [6, 7], "0010804028029753213": [6, 7], "962": [6, 7], "0010800812188506515": [6, 7], "0010800299598580359": [6, 7], "017": 6, "0010803843696362083": [6, 7], "047": 6, "001080333048974234": [6, 7], "001080014645182176": [6, 7], "129": [6, 7], "0010807968027851892": [6, 7], "007907028395366658": [6, 7], "0010803563024666294": [6, 7], "3506154": [6, 7], "inlin": [6, 7, 8], "timepoint": [6, 7, 9, 11], "aux_column": [6, 7, 9], "accord": [6, 7, 8, 9], "aux_col_config": [6, 7], "aux_descriptors_dataset": [6, 7], "train_with_conc": [6, 7], "aux1": [6, 7], "aux_col_studi": [6, 7], "covariate_exampl": [6, 7], "aux1_model": [6, 7], "904": 6, "946": 6, "070": 6, "5186": [6, 7], "76766395672": 6, "138": 6, "4679": [6, 7], "740824270968": [6, 7], "4890": [6, 7], "6705099499995": [6, 7], "276": [6, 7], "3803": [6, 7], "9324375833753": [6, 7], "291": [6, 7], "3135": [6, 7], "6497388676926": [6, 7], "2518812859375": [6, 7], "4309": [6, 7], "124112370974": [6, 7], "30159424580074": [6, 7], "4357": [6, 7], "02827013125": 6, "1437929337522": [6, 7], "45281013": [6, 7], "shape": [6, 7, 8, 9], "thrown": [6, 7, 9], "prediciton": [6, 7], "regardless": [6, 7], "utilis": [6, 7, 8], "seper": [6, 7], "vector_covariate_config": [6, 7], "precomputed_descriptor": [6, 7], "train_with_fp": [6, 7], "aux_transform": [6, 7, 9], "vector_covariate_studi": [6, 7], "vector_aux_exampl": [6, 7], "vector_covariate_model": [6, 7], "735": 6, "776": 6, "857": 6, "2200": [6, 7], "6817959410578": [6, 7], "011994365911634164": [6, 7], "95660880078": [6, 7], "029071783512897825": [6, 7], "5798": [6, 7], "564494725643": [6, 7], "022631709120790048": [6, 7], "2198637677605415": [6, 7], "2899178898048": [6, 7], "8916194399474267": [6, 7], "022": [6, 7], "647": [6, 7], "3336440433073": [6, 7], "5914093983615214": [6, 7], "050": [6, 7], "3036472748931": [6, 7], "6201811079699818": [6, 7], "068": 6, "3807": [6, 7], "8035919667395": [6, 7], "914e": [6, 7], "901e": [6, 7], "892e": [6, 7], "5019": [6, 7], "459500770764": [6, 7], "1376436589359351": [6, 7], "4017711284796": [6, 7], "797115414836": [6, 7], "74340620175102": [6, 7], "train_smil": [6, 7, 9], "train_i": [6, 7, 9], "train_aux": [6, 7, 9], "test_smil": [6, 7, 9], "test_i": [6, 7, 9], "test_aux": [6, 7, 9], "legth": [6, 7], "39754917": [6, 7], "06352766": [6, 7], "52031134": [6, 7], "89875316": [6, 7], "5516046": [6, 7], "85042171": [6, 7], "436": [6, 7], "33406203": [6, 7], "504": [6, 7], "91439129": [6, 7], "80585907": [6, 7], "48565041": [6, 7], "protein": [6, 7, 13, 15], "alongsid": [6, 7], "chemic": [6, 7, 8, 13, 14], "sequenc": [6, 7, 13, 15], "former": [6, 7], "wherea": [6, 7], "latter": [6, 7, 8], "interact": [6, 7], "basi": [6, 7, 8, 9], "toxinpred3": [6, 7], "mdlititwasvmvaftfslslvvwgrsgl": [6, 7], "ccsc": [6, 7], "cc1c": [6, 7, 8], "nh": [6, 7, 8], "cc1ccccc1": [6, 7], "ncc": [6, 7], "cccnc": [6, 7], "arrggvlnfgqfglqalecgfvtnr": [6, 7], "cs": [6, 7], "gwcgdpgatcgklrlyccsgacdcytktckdkssa": [6, 7], "n1": [6, 7], "ccc1": [6, 7], "ccccn": [6, 7], "cc1ccc": [6, 7], "ngnllggllrpvlgvvkgltgglgkk": [6, 7], "demponstr": [6, 7], "zscale_covariate_config": [6, 7], "zscale_covariate_studi": [6, 7], "zscale_aux_exampl": [6, 7], "zscale_covariate_model": [6, 7], "425": 6, "385": 6, "8735224395254063": [6, 7], "kneighborsclassifier_algorithm_hash": [6, 7], "e51ca55089f389fc37a736adb2aa0e42": [6, 7], "metric__e51ca55089f389fc37a736adb2aa0e42": [6, 7], "n_neighbors__e51ca55089f389fc37a736adb2aa0e42": [6, 7], "weights__e51ca55089f389fc37a736adb2aa0e42": [6, 7], "unlik": [6, 7], "31176471": [6, 7], "08058824": [6, 7], "27176471": [6, 7], "56470588": [6, 7], "62529412": [6, 7], "99521739": [6, 7], "59826087": [6, 7], "34695652": [6, 7], "03086957": [6, 7], "13391304": [6, 7], "08083333": [6, 7], "6125": [6, 7], "82916667": [6, 7], "05083333": [6, 7], "56083333": [6, 7], "93357143": [6, 7], "02785714": [6, 7], "04214286": [6, 7], "30461538": [6, 7], "55307692": [6, 7], "31307692": [6, 7], "11076923": [6, 7], "00846154": [6, 7], "1232": [6, 7], "3364": [6, 7], "2328": [6, 7], "1368": [6, 7], "2304": [6, 7], "7060": [6, 7], "7062": [6, 7], "x_": [6, 7], "vmin": [6, 7], "vmax": [6, 7], "cmap": [6, 7], "spectral": [6, 7], "248bit": [6, 7], "128bit": [6, 7], "minimz": [6, 7], "generaliz": [6, 7], "minimize_std_dev": [6, 7], "minimise_std_dev": [6, 7, 10], "std": [6, 7, 8, 13, 15], "dev": [6, 7, 8], "example_multi": [6, 7], "parameter_analysi": [6, 7], "set_metric_nam": [6, 7], "4008740644240856": [6, 7], "9876203329634794": 6, "673": 6, "3561484909673425": [6, 7], "9875061220991905": [6, 7], "725": 6, "7856521165563053": [6, 7], "21863029956806662": [6, 7], "9125905675311808": [6, 7], "7861693342190089": [6, 7], "850": [6, 7], "5238765412750027": [6, 7], "2789424384877304": [6, 7], "873": [6, 7], "5348363849100434": [6, 7], "5741725628917808": [6, 7], "894": 6, "0072511048320134": [6, 7], "2786318125997387": [6, 7], "9625764609276656": [6, 7], "27575381401822424": [6, 7], "973": [6, 7], "1114006274062536": [6, 7], "7647766019001522": [6, 7], "990": [6, 8], "7801680863916906": [6, 7], "2725738454485389": [6, 7], "785652116470164": [6, 7], "21863029955530786": [6, 7], "060": 6, "785651973436432": [6, 7], "21863032832257323": [6, 7], "075": [6, 7], "6101359993004856": [6, 7], "3011280543457062": [6, 7], "092": 6, "5361950698070447": [6, 7], "23560786523195643": [6, 7], "5356113574175657": [6, 7], "5769721187181905": [6, 7], "5434303669217287": 6, "5147474123466615": 6, "191": [6, 7], "5194661889628072": [6, 7], "40146744515282495": [6, 7], "659749443628722": 6, "6659085938841998": 6, "1068495306229729": [6, 7], "24457822094737378": [6, 7], "305": 6, "8604898820838102": [6, 7], "7086875504668667": [6, 7], "5919869916997383": [6, 7], "2367498627927979": [6, 7], "327": [6, 7], "2497762395862362": [6, 7], "10124660026536195": [6, 7], "399": 6, "study_name_1": [6, 7], "0621601907738047": [6, 7], "2749020946925899": [6, 7], "xxx": [6, 7], "values_neg_mean_squared_error": [6, 7], "values_standard": [6, 7], "twinx": [6, 7], "r": [6, 7, 9], "floor": [6, 7], "ceil": [6, 7], "align": [6, 7], "set_ytick": [6, 7], "linspac": [6, 7], "set_xtick": [6, 7], "text": [6, 7, 8, 9, 13], "pareto": [6, 7], "front": [6, 7], "plot_pareto_front": [6, 7], "plot_param_import": [6, 7], "dictionari": [6, 7, 11], "ordereddict": [6, 7], "descend": [6, 7], "algortihm": [6, 7], "impact": [6, 7, 9], "durat": [6, 7], "total_second": [6, 7], "target_nam": [6, 7], "relationship": [6, 7], "plot_parallel_coordin": [6, 7, 9, 10, 12], "param": [6, 7, 8, 10, 11], "taken": [6, 7, 8], "precomputed_config": [6, 7], "precomputed_studi": [6, 7], "precomputed_exampl": [6, 7], "precomputed_model": [6, 7], "3014": [6, 7], "274803630188": [6, 7], "481": 6, "471088599086": [6, 7], "03592375122963953": [6, 7], "519": 6, "3029": [6, 7], "113810544919": [6, 7], "8153295905650357": [6, 7], "618": 6, "4358": [6, 7], "575772003129": [6, 7], "unseen": [6, 7], "caus": [6, 7], "new_molecul": [6, 7], "tempfil": [6, 7], "temp": [6, 7, 8], "store": [6, 7, 8, 9, 12], "temporari": [6, 7, 11], "1st": [6, 7], "example_fp": [6, 7], "namedtemporaryfil": [6, 7], "temp_fil": [6, 7], "len": [6, 7, 8], "to_csv": [6, 7], "65709987": [6, 7], "64327077": [6, 7], "clean": [6, 7], "stage": [6, 7, 8], "workflow": [6, 7], "slurm": [6, 7, 9, 11], "leverag": [6, 7], "dynam": [6, 7, 9], "gpu": [6, 7], "customiz": [6, 7], "tailor": [6, 7], "customis": [6, 7], "export": [6, 7], "aid": [6, 7], "monitor": [6, 7], "pseudo": [6, 7, 9], "prospect": [6, 7, 9], "resubmiss": [6, 7, 11], "resubmit": [6, 7, 9], "modifi": [6, 7, 9], "enhanc": [6, 7], "parallel": [6, 7, 9], "simultan": [6, 7], "simul": [6, 7], "submit": [6, 7, 11], "verifi": [6, 7], "unittest": [6, 7], "mock": [6, 7], "patch": [6, 7, 8], "aml_arg": [6, 7], "prog": [6, 7], "argv": [6, 7], "systemexit": [6, 7], "functionila": [6, 7], "signific": [6, 7, 8], "thorough": [6, 7], "warehous": [6, 7], "databas": [6, 7], "flat": [6, 7], "compress": [6, 7], "natur": [6, 7, 8], "uniqu": [6, 7, 8], "106": 6, "ls": [6, 7], "lrth": [6, 7], "rw": [6, 7], "staff": [6, 7], "2k": [6, 7], "aug": [6, 7], "12k": [6, 7], "438b": [6, 7], "written": [6, 7], "undergon": [6, 7], "updat": [6, 7, 8], "trigger": [6, 7], "bash": [6, 7], "orchestr": [6, 7], "easi": [6, 7], "request": [6, 7], "exce": [6, 7], "50g": [6, 7], "retain": [6, 7, 9], "futur": [6, 7, 9], "example_automl": [6, 7], "workbook": [6, 7], "automl_exampl": [6, 7], "vv": [6, 7], "debug": [6, 7], "namespac": 6, "dry_run": [6, 9], "dgx": 6, "save_previous_model": [6, 9], "24_01_01": [6, 7], "042": [6, 7], "first_run": [6, 9], "processed_timepoint": [6, 7, 9], "044": 6, "checkskip": [6, 9], "tid1": [6, 7], "checkislock": [6, 9], "lockfil": 6, "lock": [6, 7, 9, 11], "taskcod": [6, 9], "046": [6, 7], "checkrunningslurmjob": [6, 9], "usr": [6, 7], "squeue": 6, "resubmitanyfailedjob": [6, 7, 9], "ran": 6, "submitjob": [6, 9], "054": 6, "ongo": 6, "took": 6, "024824142": 6, "055": [6, 7], "pid": 6, "posix": 6, "pidfil": 6, "0x7ff3f48a5cc0": 6, "scene": [6, 7], "sed": [6, 7], "togeth": [6, 7], "correctli": [6, 7, 9], "ingest": [6, 7], "meet": [6, 7], "quourum": [6, 7], "happen": [6, 7], "statu": [6, 7], "past": [6, 7, 11], "cron": [6, 7], "513": 6, "0x7ff3f48a5c00": 6, "enter": 6, "515": [6, 7], "524": [6, 7], "529": [6, 7], "534": 6, "535": [6, 7], "019070148": 6, "retir": [6, 7], "acut": [6, 7], "attempt": [6, 7], "insuffici": [6, 7, 9, 13], "emul": [6, 7, 8, 13, 14], "sucess": [6, 7], "shutil": [6, 7], "os": [6, 7, 8], "drd2_reg": [6, 7], "549": 6, "0x7ff3f48a5e40": 6, "552": 6, "556": [6, 7], "557": 6, "558": [6, 7], "576": 6, "processretrain": [6, 9], "fist": 6, "setprocessedtimepoint": [6, 9], "581": [6, 7], "getretrainingdata": [6, 9], "24_02_01": [6, 7], "586": [6, 7], "587": [6, 7], "592": [6, 7], "processtrain": [6, 9], "60g": [6, 7], "No": [6, 10, 11, 13], "writedataset": [6, 9], "wrote": 6, "608": 6, "writeslurm": [6, 9], "611": 6, "writejson": [6, 9], "612": [6, 7], "setjoblock": [6, 9], "lock_fil": 6, "614": 6, "062794924": 6, "proce": [6, 7], "datapoint": [6, 7, 8, 9, 11, 13, 14], "pseodu": [6, 7], "9zyw8gtc": 7, "tqdmwarn": 7, "iprogress": 7, "ipywidget": 7, "readthedoc": [7, 10], "en": [7, 10], "user_instal": 7, "autonotebook": 7, "notebook_tqdm": 7, "713": 7, "794": 7, "810": 7, "827": 7, "892": 7, "853455192818": 7, "048": 7, "112": 7, "404088878841": 7, "284": 7, "339": 7, "047015479678": 7, "459": 7, "559": 7, "143979828407": 7, "660": 7, "799": 7, "924": 7, "795596755263": 7, "193": 7, "212": 7, "297": 7, "9359502556013": 7, "482": 7, "507": 7, "530": 7, "553": 7, "637": 7, "661": 7, "785": 7, "899": 7, "999": 7, "037": 7, "288": 7, "355": 7, "420": 7, "514": 7, "596": 7, "635": 7, "676": 7, "821": 7, "963": 7, "262": 7, "joblib": [7, 9], "joblibcollisionwarn": 7, "collis": 7, "public_qsartuna": 7, "_cached_cal": 7, "shelv": 7, "408": [7, 8], "3999": 7, "9364276424735": 7, "11270803112210707": 7, "81076443656638": 7, "3215970512413": 7, "4503197998963022": 7, "412900098594": 7, "0005181574946923789": 7, "025601513670726564": 7, "4941115157144": 7, "04539011914094239": 7, "0004375261377371938": 7, "758": 7, "2116": 7, "9335959003747": 7, "2124": 7, "9660426577593": 7, "1286": 7, "0769369193436": 7, "8784876169901574": 7, "839": 7, "1276": 7, "7802172741008": 7, "9512603410202876": 7, "2795207825823": 7, "9555128319114616": 7, "926": 7, "8121584310656": 7, "08008391330553266": 7, "942": 7, "277": 7, "22285881334636": 7, "950404670920864": 7, "340295864211": 7, "03834458564679112": 7, "0012347340743566007": 7, "025": 7, "3286": 7, "3458857183705": 7, "1671": 7, "978884132793": 7, "1617522685589332": 7, "466e": 7, "820e": 7, "2291": 7, "4431541048393": 7, "11135166203819158": 7, "218": 7, "3551": 7, "4754762175066": 7, "1703": 7, "5472682894215": 7, "9386828094838913": 7, "253": 7, "1595": 7, "6713281001928": 7, "1334174010640954": 7, "317": 7, "3057": 7, "0737441471406": 7, "335": 7, "358207737329": 7, "8045138424869749": 7, "406": 7, "3163": 7, "129883232068": 7, "745e": 7, "824e": 7, "473": 7, "00091009328474": 7, "03221878838522718": 7, "1306": 7, "5184610043127": 7, "7499005468308115": 7, "510": 7, "1262": 7, "6469892776183": 7, "0985974843950514": 7, "575": 7, "3059": 7, "470983832716": 7, "274": 7, "7005065089059": 7, "9093347536574419": 7, "3054": 7, "7066202193814": 7, "665": 7, "1325": 7, "4979657271272": 7, "5409105715354152": 7, "670": 7, "1814": 7, "6019641143478": 7, "3331": 7, "867542200907": 7, "2240": 7, "669934747297": 7, "828": 7, "8972970077489": 7, "6774731649874095": 7, "846": 7, "1879": 7, "2457309916924": 7, "8772717895282218": 7, "927": 7, "8197755321637": 7, "5177471708941157": 7, "499774083188": 7, "3690814560784887": 7, "012140477955952245": 7, "978": 7, "280": 7, "17463144475477": 7, "7022855415761313": 7, "69499953504345": 7, "7868425071077856": 7, "2174": 7, "0174962828364": 7, "2478696042156301": 7, "2733": 7, "5772576431627": 7, "275": 7, "9100107045787": 7, "9291713852865917": 7, "273": 7, "0829803041618": 7, "8837007827687249": 7, "144": 7, "49436461257073": 7, "9898473627215156": 7, "8855537592183": 7, "9765992415502778": 7, "30111488501615": 7, "9842537157445685": 7, "266": 7, "9084083294047": 7, "7700364511238211": 7, "08546968046016": 7, "7174555152957753": 7, "87394849447105": 7, "6657778446979243": 7, "57037115440716": 7, "6549600121936776": 7, "73632857486865": 7, "6012341182929566": 7, "8912182200218": 7, "610338208270851": 7, "8551585556689": 7, "608205745163954": 7, "2138932313906": 7, "5903994630391254": 7, "2415991435093": 7, "5908543043200158": 7, "258": 7, "9523786752699": 7, "5278661577890018": 7, "53897978343346": 7, "3779758893668723": 7, "508": [7, 9], "47213290450173": 7, "1905703564298876e": 7, "06884768780446": 7, "3682097961495725": 7, "583": 7, "39234737037964": 7, "336648765853807": 7, "619": 7, "49357359736462": 7, "3384792184834002": 7, "654": 7, "98988892704782": 7, "3472988458237292": 7, "4318590800788": 7, "3203044400907151": 7, "729": 7, "60939991827328": 7, "2896152552004716": 7, "57908944967576": 7, "3400204345244455": 7, "3328308520906": 7, "3355893292668126": 7, "89284193590962": 7, "2399635656610752": 7, "877": 7, "38938750703497": 7, "19357886055335": 7, "4997740789586": 7, "00020513916607513548": 7, "4326248941768776e": 7, "947": 7, "72495253431336": 7, "2374010908702786": 7, "16509356166648": 7, "1589849176145737": 7, "019": 7, "07682320089074": 7, "140733480213489": 7, "38922657607546": 7, "1460326309523254": 7, "096": 7, "48603723419197": 7, "1106769242312984": 7, "135": 7, "2330323343841": 7, "105401956026003": 7, "97865576673902": 7, "1000318093457389": 7, "232": 7, "01471657314468": 7, "0553438336940761": 7, "82080194631138": 7, "9715618816799196": 7, "49039871573063": 7, "9049680809556248": 7, "75568720888796": 7, "8917112780641941": 7, "52818001153125": 7, "8874420080681129": 7, "76711515271572": 7, "3506098555413268e": 7, "449": 7, "98946208159907": 7, "8769574977693346": 7, "490": 7, "9478946070053": 7, "8952523217347376": 7, "01732338929523": 7, "8965185664534796": 7, "567": 7, "7486972968999": 7, "8509681340315446": 7, "19689822636008": 7, "8810095036429842": 7, "26432510046484": 7, "8621657970877505": 7, "55052102161756": 7, "8680843345290663": 7, "56366099802298": 7, "7442205305129062": 7, "0644622341688": 7, "7150915543843963": 7, "796": 7, "093": 7, "12769795082909807": 7, "390": [7, 8], "446": 7, "464": 7, "750": 7, "916": 7, "117": 7, "136": 7, "159": 7, "178": 7, "183": 7, "337": 7, "00461414372160085": 7, "511": 7, "10220127407364965": 7, "579": 7, "089": 7, "148": 7, "903": 7, "977": 7, "272": 7, "628": 7, "126": 7, "365": 7, "393": 7, "860": 7, "08048357913360568": 7, "499": 7, "07632537970908462": 7, "08984764740598594": 7, "06847327885133497": 7, "07559783310619407": 7, "05514462099560352": 7, "061375603485350996": 7, "921": 7, "07939472167407403": 7, "0684392715056296": 7, "489": 7, "07494614575719116": 7, "07133468298392816": 7, "061875032318225075": 7, "07572085582137136": 7, "054237426197199234": 7, "299": 7, "331": 7, "6743": 7, "225992071741": 7, "584": 7, "944009132488": 7, "34392897437": 7, "086720713623": 7, "424": 7, "228032558769": 7, "456": 7, "16017644995": 7, "544": 7, "815": 7, "027": 7, "487": 7, "497": 7, "722": 7, "326": 7, "992": 7, "808": 7, "189": 7, "118": 7, "231": 7, "4253": 7, "872561867463": 7, "433": 7, "36708973607664297": 7, "006253064467624636": 7, "043440e": 7, "025864e": 7, "805554e": 7, "367604e": 7, "104342e": 7, "1496": 7, "052067e": 7, "1497": 7, "015542e": 7, "2234": 7, "387391e": 7, "862": 7, "140929e": 7, "863": 7, "083": 7, "143": 7, "472": 7, "595949377253611": 7, "943": 7, "033": 7, "172": 7, "325": 7, "417": 7, "488": [7, 9], "554": 7, "571": 7, "605": 7, "609": 7, "626": 7, "780": 7, "817": 7, "985": 7, "026": 7, "067": 7, "40359637945134724": 7, "214": 7, "5959493772536111": 7, "308": 7, "8908739215746114": 7, "413": 7, "493": 7, "537": 7, "651": 7, "674": 7, "791": 7, "840": 7, "887": 7, "065": 7, "162": 7, "313": 7, "364": 7, "675": 7, "702": 7, "333": 7, "353": 7, "548": 7, "932": 7, "988": 7, "111": 7, "304": 7, "396": [7, 8], "5407991891466": 7, "636": 7, "738": 7, "888": 7, "967": 7, "049": 7, "074": 7, "205": 7, "260": 7, "315": 7, "428": 7, "685": 7, "714": 7, "772": 7, "830": 7, "0x7fa8b811a5c0": 7, "594": 7, "633": 7, "935": 7, "013": 7, "063": 7, "114": 7, "409": 7, "528": 7, "547": 7, "639": 7, "662": 7, "717": 7, "001975769419400139": 7, "930": 7, "087": 7, "414": 7, "630": 7, "805": 7, "082": 7, "323": 7, "767663956718": 7, "028270131251": 7, "869": 7, "948": 7, "681": 7, "9876203329634793": 7, "543430366921729": 7, "514747412346662": 7, "610": 7, "6597494436287219": 7, "6659085938841999": 7, "644": 7, "682": 7, "643": 7, "752": 7, "919": 7, "usernam": 7, "hous": 7, "103": 7, "104": 7, "tb": 7, "assess": [7, 8], "frequent": 7, "slurm_update_models_parallel": 7, "qsartuna_automl": 7, "j": [7, 9], "12g": 7, "your_path": 7, "update_it": 7, "hourli": 7, "common": 8, "proper": 8, "process": [8, 9, 11], "functionail": 8, "configur": [8, 9, 10, 11, 12], "draw": 8, "ipythonconsol": 8, "ipython": 8, "displai": 8, "listdir": 8, "isfil": 8, "walk": 8, "handi": 8, "med": 8, "titles": 8, "fontsiz": 8, "labels": 8, "xtick": 8, "ytick": 8, "rcparam": 8, "v0_8": 8, "whitegrid": 8, "set_styl": 8, "white": 8, "boolean": 8, "nomin": 8, "convert": [8, 9, 13], "conduct": 8, "primarydf": 8, "loadsdf": 8, "inchi": 8, "skeletonspher": 8, "nm": 8, "id": 8, "romol": 8, "ic50": 8, "\u00b5m": 8, "c1ccc2c": 8, "co2": 8, "004320939": 8, "1s": 8, "c8h7no2": 8, "c10": 8, "qrcgftxrxymjo": 8, "uhfffaoysa": 8, "86075": 8, "kinas": 8, "p38": 8, "rdchem": 8, "0x7f9ca0112340": 8, "c1ccc": 8, "ccc2ccccc2occ3ccc": 8, "882397308": 8, "c22h20o3": 8, "c23": 8, "ytdaoqyeyfcini": 8, "89637": 8, "kd": 8, "retinoid": 8, "receptor": 8, "0x7f9c808beff0": 8, "130299026": 8, "0x7f9c808bf060": 8, "48148606": 8, "c9h7no": 8, "c11": 8, "lisfmebwquvkpj": 8, "n93": 8, "n82": 8, "n65": 8, "n36": 8, "n33": 8, "ki": 8, "nki": 8, "carbon": 8, "anhydras": 8, "xii": 8, "ncarbon": 8, "0x7f9c808bf0d0": 8, "nc1ccccn1": 8, "c7h8n2o": 8, "h2": 8, "5h": 8, "qrokotbwfzitjz": 8, "86233": 8, "nicotin": 8, "phosphoribosyltransferas": 8, "0x7f9c808bf140": 8, "renam": 8, "conveni": [8, 9, 10, 13], "rest": 8, "moltosmil": 8, "isomericsmil": 8, "c1coc2ccccc2n1": 8, "004321": 8, "coc2ccccc2ccc2ccccc2": 8, "882397": 8, "130299": 8, "c1ccc2ccccc2": 8, "481486": 8, "stick": 8, "engin": 8, "assum": [8, 13, 14], "slightli": 8, "pose": 8, "wise": 8, "outlin": 8, "occurr": 8, "preserv": 8, "vari": 8, "recommend": 8, "abil": 8, "being": 8, "version": [8, 9, 10], "df_po": 8, "dedup": [8, 13], "df_rnd": 8, "df_max": 8, "df_avg": 8, "df_med": 8, "deduplidc": 8, "397": 8, "indici": 8, "coc1cc2ncnc": 8, "nc3ccc": 8, "scc4ccccc4": 8, "cl": 8, "c3": 8, "c2cc1oc": 8, "282579": 8, "912929": 8, "cc1cccc": 8, "nc2ncnc3ccc": 8, "c4ccccc4": 8, "cc23": 8, "n2cc": 8, "cc2c": 8, "nc2cccc": 8, "n2": 8, "065502": 8, "958607": 8, "oc2cccc": 8, "cn1nc": 8, "c2cnc": 8, "c3ccc": 8, "nc1c1": 8, "oc1nc": 8, "oc2cc": 8, "c3ccccc3": 8, "c3cccc": 8, "cn": 8, "936291": 8, "359": 8, "minim": [8, 10], "densiti": 8, "dpi": 8, "kdeplot": 8, "fill": 8, "orang": 8, "ndigit": 8, "blue": 8, "keepaverag": 8, "deeppink": 8, "hold": [8, 9], "aim": 8, "simpli": 8, "sai": 8, "veri": 8, "intern": [8, 11], "resembl": 8, "easiest": 8, "especi": 8, "reli": 8, "stochast": 8, "train_ran": 8, "test_ran": 8, "time_column": 8, "old": [8, 9], "accru": 8, "entri": [8, 13, 14], "timestamp": 8, "top": 8, "df_med_tempor": 8, "fake": 8, "nccccccoc1ccc2c": 8, "n1cc": 8, "684240": 8, "1037": 8, "481464": 8, "1036": 8, "c1cn": 8, "n2c": 8, "nc3cccc": 8, "n3": 8, "cc3cc3": 8, "732625": 8, "1035": 8, "568332": 8, "1034": 8, "790259": 8, "1033": 8, "train_tempor": 8, "test_tempor": 8, "highli": 8, "skew": 8, "fd": [8, 13, 14], "histogram": [8, 13, 14], "determin": [8, 13, 14], "balanc": 8, "fd_merg": [8, 13, 14], "train_str": 8, "test_str": 8, "realist": 8, "deplopi": 8, "hop": 8, "opportun": 8, "seri": 8, "push": 8, "domain": 8, "realibl": 8, "challeng": 8, "scaf_split": 8, "train_sca": 8, "test_sca": 8, "ground": 8, "df_val": 8, "roughli": [8, 10], "evid": 8, "pronounc": 8, "dodgerblu": 8, "middl": 8, "saffold": 8, "discuss": 8, "propreti": 8, "endpoint": 8, "routin": 8, "linearis": 8, "variat": 8, "gaussian": 8, "realiti": 8, "nearli": 8, "exhibit": 8, "superior": 8, "wide": 8, "xc50_data": 8, "keepallnodedupl": [8, 13], "pxc50_data": 8, "zip": 8, "jointplot": 8, "suptitl": 8, "plot_margin": 8, "rugplot": 8, "crimson": 8, "height": 8, "clip_on": 8, "jointgrid": 8, "0x7f9ca05ade10": 8, "heteroscedast": 8, "homoscedast": 8, "transorm": 8, "0x7f9c458f85e0": 8, "logartihm": 8, "power": [8, 13, 15], "um": 8, "dataset_transform": 8, "THe": 8, "0x7f9ca05aeb30": 8, "had": 8, "reverse_transform": [8, 13], "0x7f9c926f8970": 8, "mervin": 8, "framework": [8, 9], "somewher": 8, "unavoid": 8, "ideal": 8, "deviat": [8, 13, 15], "\u03c3": 8, "heterogen": 8, "versu": 8, "assimil": 8, "hypothesi": 8, "degre": 8, "p_": 8, "activityt": 8, "cumul": 8, "cdf": 8, "eq": 8, "equal": [8, 10], "delta": 8, "vec": 8, "frac": 8, "erf": 8, "overrightarrow": 8, "sigma": 8, "concret": 8, "arbitrari": 8, "unknown": [8, 11], "therefor": [8, 9], "schemat": 8, "lookup": 8, "tabl": 8, "sd": 8, "scenario": [8, 13, 14], "philosoph": 8, "delimit": [8, 13, 15], "operand": 8, "censor": 8, "far": 8, "granular": 8, "therebi": 8, "combin": [8, 9], "becom": 8, "jcheminf": 8, "biomedcentr": 8, "1186": 8, "s13321": 8, "00539": 8, "sec12": 8, "pxc50_threshold": 8, "pxc50_std": 8, "exmapl": 8, "ptr_data": 8, "gather": 8, "certainti": 8, "lower_reproduc": 8, "upper_reproduc": 8, "dataload": 8, "somewhat": 8, "invert": 8, "bell": 8, "kde": 8, "behav": 8, "mpatch": 8, "line2d": 8, "ax_joint": 8, "axhlin": 8, "linestyl": 8, "ax_marg_i": 8, "ax_marg_x": 8, "axvlin": 8, "region": 8, "uncert_color": 8, "purpl": 8, "uncert_region": 8, "rectangl": 8, "add_patch": 8, "box": 8, "nthreshold": 8, "nptr": 8, "nregion": 8, "fancybox": 8, "borderaxespad": 8, "leg": 8, "get_legend": 8, "legend_handl": 8, "set_alpha": 8, "set_color": 8, "tight": 8, "layout": 8, "subplots_adjust": 8, "set_size_inch": 8, "var": 8, "1v": 8, "9y_z128d7gvcp8mf8q0pz3ch0000gq": 8, "ipykernel_33301": 8, "3093832163": 8, "cannot": 8, "enough": [8, 9], "accommod": 8, "decor": 8, "dash": 8, "shade": 8, "histrogram": 8, "clip": 8, "aforement": 8, "ptrtransform": [8, 13, 15], "ptr_transform": 8, "histplot": 8, "stat": 8, "scipi": 8, "resp_col": [8, 9], "pearsonr": 8, "std_df": 8, "groupbi": 8, "mdn_df": 8, "std_vs_median": 8, "suffix": 8, "_std": 8, "_median": 8, "dropna": 8, "activity_std": 8, "activity_median": 8, "088539": 8, "674782": 8, "265123": 8, "138620": 8, "157605": 8, "stdev": 8, "stat_func": 8, "plot_joint": 8, "zorder": 8, "0x7f9be19abaf0": 8, "assumpt": 8, "fulfil": 8, "ptr_train_ran": 8, "ptr_test_ran": 8, "ptr_train_str": 8, "ptr_test_str": 8, "ptr_train_tempor": 8, "ptr_test_tempor": 8, "ptr_train_sca": 8, "ptr_test_sca": 8, "warn_singular": 8, "xlim": 8, "peak": 8, "extem": 8, "dsitribut": 8, "awai": 8, "bias": 8, "enum": [9, 10, 11, 13], "building_configuration_enum": [9, 11], "configuration_enum": [9, 11], "interface_enum": [9, 11], "model_runner_enum": [9, 11], "objective_enum": [9, 11], "optimization_configuration_enum": [9, 11], "prediction_configuration_enum": [9, 11], "return_values_enum": [9, 11], "visualization_enum": [9, 11], "modelautoml": 9, "smiles_col": [9, 11, 13, 14], "activity_col": 9, "task_col": 9, "timestr": 9, "20240828": 9, "172746": 9, "modeldispatch": 9, "pend": 9, "last_timepoint": 9, "getallretrainingdata": 9, "wilcard": 9, "datetim": 9, "unprocess": 9, "bucket": 9, "nonewretrainingdata": [9, 11], "setretrainingdata": 9, "initprocessedtimepoint": 9, "cfg": 9, "initial_templ": 9, "retrain_templ": 9, "slurm_templ": 9, "slurm_al_smil": 9, "slurm_partit": 9, "log_conf": 9, "checkifretrainingprocess": 9, "unabl": 9, "static": 9, "calcslurmmem": 9, "len_fil": 9, "setdispatchervari": 9, "overwrit": 9, "_taskcode_df": 9, "attribut": 9, "prev": 9, "processquorum": 9, "_input_df": 9, "istrain": 9, "checksavetemporalmodel": 9, "dotemporalpredict": 9, "new_data": 9, "out_df": 9, "setskippedtimepoint": 9, "elig": 9, "checkslurmstatusandnextprocedur": 9, "cancel": 9, "increasejobtim": 9, "increasejobmem": 9, "max_mem": 9, "increasejobcpu": 9, "max_cpu": 9, "addslurmretri": 9, "getslurmretri": 9, "locked_job": 9, "max_retri": 9, "process_retraining_task": 9, "dispatcher_process": 9, "global_cfg": 9, "validate_arg": 9, "prepare_dispatch": 9, "merge_train_and_test_data": 9, "isvalid": 9, "read_data": 9, "aux_col": 9, "invalid": 9, "pars": [9, 10, 12], "tupl": [9, 13, 14], "ambigu": 9, "smiles_": 9, "y_": [9, 11, 13], "aux_": 9, "factori": [9, 10], "intermediate_training_dataset_fil": 9, "intermediate_test_dataset_fil": 9, "get_merged_set": 9, "check_set": 9, "scalingfittingerror": 9, "descriptor_str": 9, "unfittedsklearnscla": [9, 13], "novalidsmil": 9, "mol_from_smi": 9, "numpy_from_rdkit": 9, "dtype": [9, 13], "moldescriptor": 9, "nameparameterdataclass": [9, 10, 13], "abc": [9, 10, 13], "abstract": [9, 10, 13], "parallel_compute_descriptor": 9, "amorprot": [9, 13], "ecfp6": 9, "seq": 9, "pathlib": 9, "get_fitted_scaler_for_fp": 9, "saved_param": 9, "get_fitted_scal": 9, "minhash": 9, "chiral": 9, "orsi": 9, "map4": 9, "unifi": 9, "percept": 9, "benchmark": 9, "cip": 9, "highest": 9, "disproportion": 9, "affect": [9, 13], "maxradiu": [9, 12], "npermut": [9, 12], "permut": 9, "set_unfitted_scaler_data": 9, "fp_info": 9, "canonicalsmil": 9, "scaffold": [9, 13, 14], "genericscaffold": 9, "validdescriptor": 9, "descriptor_from_config": 9, "return_failed_idx": 9, "score_al": 9, "get_scor": 9, "score_all_smil": 9, "get_train_test_scor": 9, "get_merged_train_scor": 9, "get_ecfp_fpinfo": 9, "get_ecfpcount_fpinfo": 9, "explain_ecfp": 9, "len_feat": 9, "get_fp_info": 9, "exp_df": 9, "fp_idx": 9, "strt_idx": 9, "runshap": 9, "x_pred": 9, "shapexplain": 9, "popul": 9, "explainpr": 9, "shallow": 9, "validate_cls_input": 9, "pi_zero": 9, "pr": 9, "melloddi": 9, "sparsechem": 9, "imbal": 9, "bedroc_scor": [9, 10], "truchon": 9, "bayli": 9, "screen": 9, "bad": 9, "recognit": 9, "2007": 9, "concord": 9, "statist": 9, "qualiti": 9, "harald": 9, "On": 9, "surviv": 9, "bound": 9, "2008": 9, "1209": 9, "1216": 9, "api": 9, "posterior": 9, "mark": 9, "abstractmethod": [9, 10], "predict_uncert": 9, "quantifi": 9, "qsartunamodel": 9, "nonetyp": [9, 10], "sent": 9, "get_metadata": 9, "train_scor": [9, 12], "test_scor": [9, 11, 12], "get_transform": 9, "perform_ptr": 9, "wrap_model": 9, "save_model": 9, "novaliddescriptor": 9, "null_scor": 9, "argserror": 9, "issu": [9, 11, 13], "uncertaintyerror": 9, "auxcovariatemiss": 9, "precomputederror": 9, "validate_uncertainti": 9, "check_precomp_arg": 9, "set_inference_param": 9, "desc": [9, 10], "validate_set_precomput": 9, "validate_aux": 9, "doctitl": 9, "docstr": 9, "type_base_schema": 9, "tp": 9, "wyfo": 9, "json_schema": 9, "patch_schema_gener": 9, "patch_schema_optunaz": 9, "split_optim": 9, "base_chemprop_param": 9, "pop": 9, "run_studi": 9, "storag": [9, 12], "trial_number_offset": [9, 11], "log_scor": 9, "main_scor": 9, "outfnam": 9, "plot_by_configur": 9, "conf": 9, "plot_slic": [9, 10, 12], "folder_path": 9, "file_format": [9, 10, 12], "png": [9, 10], "plot_contour": [9, 10, 12], "plot_histori": [9, 10, 12], "set_build_cach": 10, "preexist": 10, "remove_algo_hash": 10, "buildconfig_from_tri": 10, "encode_nam": 10, "cenam": 10, "suggest_alg_param": 10, "suggest_aux_param": 10, "check_invalid_descriptor_param": 10, "adaboostclassifierparamet": 10, "lassoparamet": 10, "kneighborsclassifierparamet": 10, "kneighborsregressorparamet": 10, "logisticregressionparamet": 10, "plsparamet": 10, "randomforestparamet": 10, "ridgeparamet": 10, "svcparamet": 10, "svrparamet": 10, "xgbregressorparamet": 10, "prfclassifierparamet": 10, "bootstrap": 10, "new_syn_data_frac": 10, "chempropregressorparamet": 10, "chempropclassifierparamet": 10, "chempropregressorpretrainedparamet": 10, "chemprophyperoptclassifierparamet": 10, "chemprophyperoptregressorparamet": 10, "calibratedclassifiercvparamet": 10, "mapieparamet": 10, "regressionscor": 10, "classificationscor": 10, "closer": 10, "greater": 10, "manhattan": 10, "trainarg": 10, "tanh": 10, "leakyrelu": 10, "prelu": 10, "selu": 10, "elu": 10, "morgan_count": 10, "rdkit_2d": 10, "rdkit_2d_norm": 10, "mpnn_first_ffn": 10, "mpnn_last_ffn": 10, "linked_hidden_s": 10, "constrain": 10, "l3": 10, "init_lr_exp": 10, "final_lr_exp": 10, "warmup_epoch": 10, "l4": 10, "l5": 10, "l6": 10, "l7": 10, "l8": 10, "isanyof": 10, "obj": [10, 11], "detect_mode_from_alg": 10, "copy_path_for_scaled_descriptor": 10, "cv_split_strategi": 10, "use_cach": 10, "optuna_storag": 10, "set_cach": 10, "set_algo_hash": 10, "declar": 10, "pydant": 10, "don": 10, "classmethod": 10, "1024": 10, "shorter": 10, "output_fold": [10, 12], "use_xvfb": [10, 12], "imagefileformat": 10, "jpeg": 10, "jpg": 10, "svg": 10, "move_up_directori": 11, "attach_root_path": 11, "attach": 11, "loadjson": 11, "add_ellipsi": 11, "max_length": 11, "shorten_nam": 11, "mlflowcallback": 11, "tracking_uri": 11, "callback": 11, "uri": 11, "server": 11, "set_tracking_uri": 11, "prepare_tag": 11, "tag": 11, "tmp_buildconfig": 11, "noretrainingdataconvent": 11, "nodifferingretrainingdata": 11, "retrainingheadersissu": 11, "retrainingisalreadyprocess": 11, "retrainingislock": 11, "temporalpredspredict": 11, "nopreviousmodel": 11, "prev_model_nam": 11, "samepreviousmodel": 11, "timepointskip": 11, "slurmnolog": 11, "itcod": 11, "slurmtimelimitexceed": 11, "exceed": 11, "slurmmemoryexceed": 11, "slurmjobskip": 11, "qptuna": 11, "slurmparseerror": 11, "create_depend": 11, "remove_schema_properti": 11, "add_boolean_guards_for_schema_properti": 11, "replacekei": 11, "input_": 11, "replacevalu": 11, "addsibl": 11, "delsibl": 11, "sibl": 11, "getref": 11, "context": 11, "recurs": 11, "nest": 11, "copytitl": 11, "oneof": 11, "replaceenum": 11, "singleton": 11, "const": 11, "addtitl": 11, "get_authorization_head": 11, "trackingdata": 11, "trial_numb": [11, 12], "trial_valu": 11, "trial_stat": 11, "all_cv_test_scor": 11, "removeprefix": 11, "round_scor": 11, "internaltrackingcallback": 11, "progress": 11, "buildtrackingdata": 11, "response_column_nam": 11, "test_point": 11, "track_build": 11, "mkdict": 11, "load_df_from_fil": 11, "remove_failed_idx": 11, "failed_idx": 11, "md5_hash": 11, "md5": 11, "buildingconfigurationenum": 12, "configurationenum": 12, "general_hyperparamet": 12, "hyper_paramet": 12, "general_regressor": 12, "general_classifi": 12, "metadata_besttri": 12, "metadata_bestvalu": 12, "general_dis": 12, "general_paramet": 12, "task_optim": 12, "task_build": 12, "data_inputcolumn": 12, "data_responsecolumn": 12, "data_train": 12, "data_test": 12, "descriptors_avalon": 12, "descriptors_avalon_nbit": 12, "descriptors_ecfp": 12, "descriptors_ecfp_radiu": 12, "descriptors_ecfp_nbit": 12, "descriptors_ecfpcount": 12, "descriptors_ecfpcounts_radiu": 12, "descriptors_ecfpcounts_usefeatur": 12, "descriptors_pathfp": 12, "descriptors_pathfp_maxpath": 12, "descriptors_pathfp_fps": 12, "descriptors_maccskei": 12, "descriptors_unsc_physchem": 12, "descriptors_physchem": 12, "descriptors_physchem_rdkitnam": 12, "descriptors_amorprot": 12, "descriptors_unsc_mapc": 12, "descriptors_mapc": 12, "descriptors_mapc_maxradiu": 12, "descriptors_mapc_npermut": 12, "descriptors_unsc_jazzi": 12, "descriptors_jazzi": 12, "descriptors_jazzy_jazzynam": 12, "descriptors_precomput": 12, "descriptors_precomputed_fil": 12, "descriptors_precomputed_input_columnn": 12, "descriptors_precomputed_response_column": 12, "descriptors_unsc_zscal": 12, "descriptors_zscal": 12, "descriptors_smil": 12, "descriptors_smiles_and_si": 12, "descriptors_smiles_and_si_fil": 12, "descriptors_smiles_and_si_input_column": 12, "descriptors_smiles_and_si_aux_weight_pc": 12, "descriptors_sc": 12, "descriptors_scaled_descriptor": 12, "descriptors_scaled_descriptor_paramet": 12, "descriptors_composit": 12, "settings_mod": 12, "settings_mode_regress": 12, "settings_mode_classif": 12, "settings_cross_valid": 12, "settings_direct": 12, "settings_n_tri": 12, "settings_n_job": 12, "settings_shuffl": 12, "algorithms_low": 12, "algorithms_high": 12, "algorithms_q": 12, "algorithms_interface_sklearn": 12, "algorithms_interface_xgboost": 12, "algorithms_rfregressor": 12, "algorithms_rfclassifi": 12, "algorithms_rf_max_featur": 12, "algorithms_rf_max_depth": 12, "algorithms_rf_n_estim": 12, "algorithms_svr": 12, "algorithms_svr_c": 12, "algorithms_svr_gamma": 12, "algorithms_svc": 12, "algorithms_svc_c": 12, "algorithms_svc_gamma": 12, "algorithms_lasso": 12, "algorithms_lasso_alpha": 12, "algorithms_kneighborsclassifi": 12, "algorithms_kneighborsregressor": 12, "algorithms_kneighbors_n_neighbor": 12, "algorithms_kneighbors_metr": 12, "algorithms_kneighbors_weight": 12, "algorithms_ridg": 12, "algorithms_ridge_alpha": 12, "algorithms_plsregress": 12, "algorithms_plsregression_n_compon": 12, "algorithms_logisticregress": 12, "algorithms_logisticregression_solv": 12, "algorithms_logisticregression_c": 12, "algorithms_adaboostclassifi": 12, "algorithms_adaboostclassifier_n_estim": 12, "algorithms_adaboostclassifier_learning_r": 12, "algorithms_xgbregressor": 12, "algorithms_xgbregressor_max_depth": 12, "algorithms_xgbregressor_n_estim": 12, "algorithms_xgbregressor_learning_r": 12, "algorithms_prf": 12, "algorithms_prf_max_featur": 12, "algorithms_prf_max_depth": 12, "algorithms_prf_n_estim": 12, "algorithms_prf_minpysumleaf": 12, "algorithms_prf_use_py_gini": 12, "algorithms_prf_use_py_leaf": 12, "algorithms_chemprop": 12, "basechemprop": 12, "algorithms_chemprop_regressor": 12, "algorithms_chemprop_hyperopt_regressor": 12, "algorithms_chemprop_classifi": 12, "algorithms_chemprop_hyperopt_classifi": 12, "algorithms_chemprop_activ": 12, "algorithms_chemprop_aggreg": 12, "algorithms_chemprop_aggregation_norm": 12, "algorithms_chemprop_batch_s": 12, "algorithms_chemprop_depth": 12, "algorithms_chemprop_dropout": 12, "algorithms_chemprop_epoch": 12, "algorithms_chemprop_ensemble_s": 12, "algorithms_chemprop_features_gener": 12, "algorithms_chemprop_ffn_hidden_s": 12, "algorithms_chemprop_ffn_num_lay": 12, "algorithms_chemprop_frzn": 12, "algorithms_chemprop_final_lr_ratio_exp": 12, "algorithms_chemprop_hidden_s": 12, "algorithms_chemprop_num_it": 12, "algorithms_chemprop_init_lr_ratio_exp": 12, "algorithms_chemprop_max_lr_exp": 12, "algorithms_chemprop_pretrained_model": 12, "algorithms_chemprop_search_parameter_level": 12, "algorithms_chemprop_startup_random_it": 12, "startup_random_it": 12, "algorithms_chemprop_warmup_epochs_ratio": 12, "algorithms_calibratedclassifiercv": 12, "algorithms_calibratedclassifiercv_ensembl": 12, "algorithms_calibratedclassifiercv_estim": 12, "algorithms_calibratedclassifiercv_method": 12, "algorithms_calibratedclassifiercv_n_fold": 12, "algorithms_calibratedclassifiercv_param": 12, "calibrated_param": 12, "algorithms_mapi": 12, "algorithms_mapie_alpha": 12, "interfaceenum": 12, "sklearn_set": 12, "xgboost_set": 12, "chemprop_set": 12, "prf_set": 12, "calibrated_set": 12, "modelrunnerdataframeenum": 12, "modelrunn": 12, "objectiveenum": 12, "attribute_trial_train_scor": 12, "extra_column_besthit": 12, "besthit": 12, "optimizationconfigurationenum": 12, "predictionconfigurationenum": 12, "data_dataset": 12, "sklearnreturnvalueenum": 12, "cross_validate_fit_tim": 12, "fit_tim": 12, "cross_validate_score_tim": 12, "score_tim": 12, "cross_validate_test_scor": 12, "cross_validate_train_scor": 12, "xgboostreturnvalueenum": 12, "visualizationenum": 12, "visualization_regressor": 12, "visualization_classifi": 12, "visualization_use_xvfb": 12, "visualization_output_fold": 12, "visualization_file_format": 12, "visualization_plot": 12, "visualization_plots_histori": 12, "visualization_plots_contour": 12, "visualization_plots_parallel_coordin": 12, "visualization_plots_slic": 12, "optuna_system_attrs_numb": 12, "_number": 12, "optuna_system_attrs_intermediate_valu": 12, "intermediate_valu": 12, "optuna_system_attrs_trial_id": 12, "trial_id": 12, "studyuserattr": 12, "trialuserattr": 12, "trialparam": 12, "algorithm_hash": 12, "mlflowlogparam": 12, "sklearnsplitt": 13, "get_n_split": 13, "cvsplitter": 13, "although": 13, "underli": 13, "get_sklearn_splitt": 13, "n_split": 13, "repeat": [13, 14], "edg": [13, 14], "stratifiedshufflesplit": [13, 14], "revert": [13, 14], "empti": 13, "kfold": 13, "consecut": 13, "fd_bin": 13, "11879": 13, "10297": 13, "adjac": 13, "downstream": 13, "nativ": 13, "histogramstratifiedshufflesplit": 13, "test_fract": 13, "groupingsplitt": 13, "column_nam": [13, 14], "butina_clust": [13, 14], "cluster": [13, 14], "butina": [13, 14], "make_scaffold_gener": [13, 14], "murcko": [13, 14], "hetero": [13, 14], "difficulti": [13, 14], "novel": [13, 14], "datatransformerror": 13, "datatransform": 13, "logarithm": [13, 15], "base_dict": 13, "ufunc": 13, "base_neg": 13, "reverse_dict": 13, "exp": 13, "transform_df": 13, "transform_on": 13, "reverse_transform_df": 13, "reverse_transform_on": 13, "auxtransform": 13, "transfor": 13, "auxiliary_data": 13, "usabl": [13, 15]}, "objects": {"": [[9, 0, 0, "-", "optunaz"]], "optunaz": [[9, 0, 0, "-", "automl"], [9, 0, 0, "-", "builder"], [10, 0, 0, "-", "config"], [9, 0, 0, "-", "datareader"], [9, 0, 0, "-", "descriptors"], [9, 0, 0, "-", "evaluate"], [9, 0, 0, "-", "explainability"], [9, 0, 0, "-", "metircs"], [9, 0, 0, "-", "model_writer"], [9, 0, 0, "-", "objective"], [9, 0, 0, "-", "optbuild"], [9, 0, 0, "-", "predict"], [9, 0, 0, "-", "schemagen"], [9, 0, 0, "-", "three_step_opt_build_merge"], [11, 0, 0, "-", "utils"], [9, 0, 0, "-", "visualizer"]], "optunaz.automl": [[9, 1, 1, "", "ModelAutoML"], [9, 1, 1, "", "ModelDispatcher"], [9, 4, 1, "", "dispatcher_process"], [9, 4, 1, "", "main"], [9, 4, 1, "", "meta"], [9, 4, 1, "", "prepare_dispatcher"], [9, 4, 1, "", "process_retraining_task"], [9, 4, 1, "", "validate_args"]], "optunaz.automl.ModelAutoML": [[9, 2, 1, "", "first_run"], [9, 3, 1, "", "getAllRetrainingData"], [9, 3, 1, "", "getRetrainingData"], [9, 3, 1, "", "initProcessedTimepoints"], [9, 2, 1, "", "last_timepoint"], [9, 2, 1, "", "processed_timepoints"], [9, 3, 1, "", "setProcessedTimepoints"], [9, 3, 1, "", "setRetrainingData"]], "optunaz.automl.ModelDispatcher": [[9, 3, 1, "", "addSlurmRetry"], [9, 3, 1, "", "calcSlurmMem"], [9, 3, 1, "", "checkIfRetrainingProcessed"], [9, 3, 1, "", "checkRunningSlurmJobs"], [9, 3, 1, "", "checkSaveTemporalModel"], [9, 3, 1, "", "checkSkipped"], [9, 3, 1, "", "checkSlurmStatusAndNextProcedure"], [9, 3, 1, "", "checkisLocked"], [9, 3, 1, "", "doTemporalPredictions"], [9, 3, 1, "", "getSlurmRetry"], [9, 3, 1, "", "increaseJobCpu"], [9, 3, 1, "", "increaseJobMem"], [9, 3, 1, "", "increaseJobTime"], [9, 3, 1, "", "isTrained"], [9, 2, 1, "", "pretrained_model"], [9, 3, 1, "", "processQuorum"], [9, 3, 1, "", "processRetraining"], [9, 3, 1, "", "processTrain"], [9, 3, 1, "", "resubmitAnyFailedJobs"], [9, 3, 1, "", "setDispatcherVariables"], [9, 3, 1, "", "setJobLocked"], [9, 3, 1, "", "setSkippedTimepoint"], [9, 3, 1, "", "submitJob"], [9, 3, 1, "", "writeDataset"], [9, 3, 1, "", "writeJson"], [9, 3, 1, "", "writeSlurm"]], "optunaz.builder": [[9, 4, 1, "", "build"]], "optunaz.config": [[10, 1, 1, "", "Algorithm"], [10, 1, 1, "", "ModelMode"], [10, 1, 1, "", "NameParameterDataclass"], [10, 1, 1, "", "OptimizationDirection"], [10, 1, 1, "", "Task"], [10, 1, 1, "", "Visualization"], [10, 0, 0, "-", "build_from_opt"], [10, 0, 0, "-", "buildconfig"], [10, 0, 0, "-", "optconfig"]], "optunaz.config.ModelMode": [[10, 5, 1, "", "CLASSIFICATION"], [10, 5, 1, "", "REGRESSION"]], "optunaz.config.NameParameterDataclass": [[10, 3, 1, "", "new"]], "optunaz.config.OptimizationDirection": [[10, 5, 1, "", "MAXIMIZATION"], [10, 5, 1, "", "MINIMIZATION"]], "optunaz.config.Task": [[10, 5, 1, "", "BUILDING"], [10, 5, 1, "", "OPTIMIZATION"], [10, 5, 1, "", "PREDICTION"]], "optunaz.config.Visualization": [[10, 1, 1, "", "ImageFileFormat"], [10, 1, 1, "", "Plots"], [10, 5, 1, "", "file_format"], [10, 5, 1, "", "output_folder"], [10, 5, 1, "", "plots"], [10, 5, 1, "", "use_xvfb"]], "optunaz.config.Visualization.ImageFileFormat": [[10, 5, 1, "", "JPEG"], [10, 5, 1, "", "JPG"], [10, 5, 1, "", "PDF"], [10, 5, 1, "", "PNG"], [10, 5, 1, "", "SVG"]], "optunaz.config.Visualization.Plots": [[10, 5, 1, "", "plot_contour"], [10, 5, 1, "", "plot_history"], [10, 5, 1, "", "plot_parallel_coordinate"], [10, 5, 1, "", "plot_slice"]], "optunaz.config.build_from_opt": [[10, 4, 1, "", "buildconfig_from_trial"], [10, 4, 1, "", "check_invalid_descriptor_param"], [10, 4, 1, "", "encode_name"], [10, 4, 1, "", "remove_algo_hash"], [10, 4, 1, "", "set_build_cache"], [10, 4, 1, "", "suggest_alg_params"], [10, 4, 1, "", "suggest_aux_params"]], "optunaz.config.buildconfig": [[10, 1, 1, "", "AdaBoostClassifier"], [10, 1, 1, "", "Algorithm"], [10, 1, 1, "", "BuildConfig"], [10, 1, 1, "", "CalibratedClassifierCVWithVA"], [10, 1, 1, "", "ChemPropClassifier"], [10, 1, 1, "", "ChemPropHyperoptClassifier"], [10, 1, 1, "", "ChemPropHyperoptRegressor"], [10, 1, 1, "", "ChemPropRegressor"], [10, 1, 1, "", "ChemPropRegressorPretrained"], [10, 1, 1, "", "KNeighborsClassifier"], [10, 1, 1, "", "KNeighborsRegressor"], [10, 1, 1, "", "Lasso"], [10, 1, 1, "", "LogisticRegression"], [10, 1, 1, "", "Mapie"], [10, 1, 1, "", "PLSRegression"], [10, 1, 1, "", "PRFClassifier"], [10, 1, 1, "", "RandomForestClassifier"], [10, 1, 1, "", "RandomForestRegressor"], [10, 1, 1, "", "Ridge"], [10, 1, 1, "", "SVC"], [10, 1, 1, "", "SVR"], [10, 1, 1, "", "XGBRegressor"]], "optunaz.config.buildconfig.AdaBoostClassifier": [[10, 1, 1, "", "AdaBoostClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.AdaBoostClassifier.AdaBoostClassifierParameters": [[10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.buildconfig.Algorithm": [[10, 3, 1, "", "estimator"]], "optunaz.config.buildconfig.BuildConfig": [[10, 1, 1, "", "Metadata"], [10, 1, 1, "", "Settings"], [10, 5, 1, "", "algorithm"], [10, 5, 1, "", "data"], [10, 5, 1, "", "descriptor"], [10, 5, 1, "", "metadata"], [10, 5, 1, "", "settings"], [10, 5, 1, "", "task"]], "optunaz.config.buildconfig.BuildConfig.Metadata": [[10, 5, 1, "", "best_trial"], [10, 5, 1, "", "best_value"], [10, 5, 1, "", "cross_validation"], [10, 5, 1, "", "n_trials"], [10, 5, 1, "", "name"], [10, 5, 1, "", "shuffle"], [10, 5, 1, "", "visualization"]], "optunaz.config.buildconfig.BuildConfig.Settings": [[10, 5, 1, "", "direction"], [10, 5, 1, "", "mode"], [10, 5, 1, "", "n_trials"], [10, 5, 1, "", "scoring"], [10, 5, 1, "", "tracking_rest_endpoint"]], "optunaz.config.buildconfig.CalibratedClassifierCVWithVA": [[10, 1, 1, "", "CalibratedClassifierCVParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.CalibratedClassifierCVWithVA.CalibratedClassifierCVParameters": [[10, 5, 1, "", "ensemble"], [10, 5, 1, "", "estimator"], [10, 5, 1, "", "method"], [10, 5, 1, "", "n_folds"]], "optunaz.config.buildconfig.ChemPropClassifier": [[10, 1, 1, "", "ChemPropClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropClassifier.ChemPropClassifierParameters": [[10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.buildconfig.ChemPropHyperoptClassifier": [[10, 1, 1, "", "ChemPropHyperoptClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropHyperoptClassifier.ChemPropHyperoptClassifierParameters": [[10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.buildconfig.ChemPropHyperoptRegressor": [[10, 1, 1, "", "ChemPropHyperoptRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropHyperoptRegressor.ChemPropHyperoptRegressorParameters": [[10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.buildconfig.ChemPropRegressor": [[10, 1, 1, "", "ChemPropRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropRegressor.ChemPropRegressorParameters": [[10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "aux_weight_pc"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.buildconfig.ChemPropRegressorPretrained": [[10, 1, 1, "", "ChemPropRegressorPretrainedParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.ChemPropRegressorPretrained.ChemPropRegressorPretrainedParameters": [[10, 5, 1, "", "epochs"], [10, 5, 1, "", "frzn"], [10, 5, 1, "", "pretrained_model"]], "optunaz.config.buildconfig.KNeighborsClassifier": [[10, 1, 1, "", "KNeighborsClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.KNeighborsClassifier.KNeighborsClassifierParameters": [[10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.buildconfig.KNeighborsRegressor": [[10, 1, 1, "", "KNeighborsRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.KNeighborsRegressor.KNeighborsRegressorParameters": [[10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.buildconfig.Lasso": [[10, 1, 1, "", "LassoParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.Lasso.LassoParameters": [[10, 5, 1, "", "alpha"]], "optunaz.config.buildconfig.LogisticRegression": [[10, 1, 1, "", "LogisticRegressionParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.LogisticRegression.LogisticRegressionParameters": [[10, 5, 1, "", "C"], [10, 5, 1, "", "solver"]], "optunaz.config.buildconfig.Mapie": [[10, 1, 1, "", "MapieParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.Mapie.MapieParameters": [[10, 5, 1, "", "estimator"], [10, 5, 1, "", "mapie_alpha"]], "optunaz.config.buildconfig.PLSRegression": [[10, 1, 1, "", "PLSParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.PLSRegression.PLSParameters": [[10, 5, 1, "", "n_components"]], "optunaz.config.buildconfig.PRFClassifier": [[10, 1, 1, "", "PRFClassifierParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.PRFClassifier.PRFClassifierParameters": [[10, 5, 1, "", "bootstrap"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "min_py_sum_leaf"], [10, 5, 1, "", "n_estimators"], [10, 5, 1, "", "new_syn_data_frac"], [10, 5, 1, "", "use_py_gini"], [10, 5, 1, "", "use_py_leafs"]], "optunaz.config.buildconfig.RandomForestClassifier": [[10, 1, 1, "", "RandomForestParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.RandomForestClassifier.RandomForestParameters": [[10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.buildconfig.RandomForestRegressor": [[10, 1, 1, "", "RandomForestParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.RandomForestRegressor.RandomForestParameters": [[10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.buildconfig.Ridge": [[10, 1, 1, "", "RidgeParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.Ridge.RidgeParameters": [[10, 5, 1, "", "alpha"]], "optunaz.config.buildconfig.SVC": [[10, 1, 1, "", "SVCParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.SVC.SVCParameters": [[10, 5, 1, "", "C"], [10, 5, 1, "", "gamma"]], "optunaz.config.buildconfig.SVR": [[10, 1, 1, "", "SVRParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.SVR.SVRParameters": [[10, 5, 1, "", "C"], [10, 5, 1, "", "gamma"]], "optunaz.config.buildconfig.XGBRegressor": [[10, 1, 1, "", "XGBRegressorParameters"], [10, 3, 1, "", "estimator"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.buildconfig.XGBRegressor.XGBRegressorParameters": [[10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig": [[10, 1, 1, "", "AdaBoostClassifier"], [10, 1, 1, "", "Algorithm"], [10, 1, 1, "", "CalibratedClassifierCVEnsemble"], [10, 1, 1, "", "CalibratedClassifierCVMethod"], [10, 1, 1, "", "CalibratedClassifierCVWithVA"], [10, 1, 1, "", "ChemPropActivation"], [10, 1, 1, "", "ChemPropAggregation"], [10, 1, 1, "", "ChemPropClassifier"], [10, 1, 1, "", "ChemPropFeatures_Generator"], [10, 1, 1, "", "ChemPropFrzn"], [10, 1, 1, "", "ChemPropHyperoptClassifier"], [10, 1, 1, "", "ChemPropHyperoptRegressor"], [10, 1, 1, "", "ChemPropRegressor"], [10, 1, 1, "", "ChemPropRegressorPretrained"], [10, 1, 1, "", "ChemPropSearch_Parameter_Level"], [10, 1, 1, "", "ClassificationScore"], [10, 1, 1, "", "KNeighborsClassifier"], [10, 1, 1, "", "KNeighborsMetric"], [10, 1, 1, "", "KNeighborsRegressor"], [10, 1, 1, "", "KNeighborsWeights"], [10, 1, 1, "", "Lasso"], [10, 1, 1, "", "LogisticRegression"], [10, 1, 1, "", "Mapie"], [10, 1, 1, "", "OptimizationConfig"], [10, 1, 1, "", "PLSRegression"], [10, 1, 1, "", "PRFClassifier"], [10, 1, 1, "", "PRFClassifierMaxFeatures"], [10, 1, 1, "", "RandomForestClassifier"], [10, 1, 1, "", "RandomForestMaxFeatures"], [10, 1, 1, "", "RandomForestRegressor"], [10, 1, 1, "", "RegressionScore"], [10, 1, 1, "", "Ridge"], [10, 1, 1, "", "SVC"], [10, 1, 1, "", "SVR"], [10, 1, 1, "", "XGBRegressor"], [10, 4, 1, "", "copy_path_for_scaled_descriptor"], [10, 4, 1, "", "detect_mode_from_algs"], [10, 4, 1, "", "isanyof"]], "optunaz.config.optconfig.AdaBoostClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.AdaBoostClassifier.Parameters": [[10, 1, 1, "", "AdaBoostClassifierParametersLearningRate"], [10, 1, 1, "", "AdaBoostClassifierParametersNEstimators"], [10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.AdaBoostClassifier.Parameters.AdaBoostClassifierParametersLearningRate": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.AdaBoostClassifier.Parameters.AdaBoostClassifierParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.CalibratedClassifierCVEnsemble": [[10, 5, 1, "", "FALSE"], [10, 5, 1, "", "TRUE"]], "optunaz.config.optconfig.CalibratedClassifierCVMethod": [[10, 5, 1, "", "ISOTONIC"], [10, 5, 1, "", "SIGMOID"], [10, 5, 1, "", "VENNABERS"]], "optunaz.config.optconfig.CalibratedClassifierCVWithVA": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.CalibratedClassifierCVWithVA.Parameters": [[10, 5, 1, "", "ensemble"], [10, 5, 1, "", "estimator"], [10, 5, 1, "", "method"], [10, 5, 1, "", "n_folds"]], "optunaz.config.optconfig.ChemPropActivation": [[10, 5, 1, "", "ELU"], [10, 5, 1, "", "LEAKYRELU"], [10, 5, 1, "", "PRELU"], [10, 5, 1, "", "RELU"], [10, 5, 1, "", "SELU"], [10, 5, 1, "", "TANH"]], "optunaz.config.optconfig.ChemPropAggregation": [[10, 5, 1, "", "MEAN"], [10, 5, 1, "", "NORM"], [10, 5, 1, "", "SUM"]], "optunaz.config.optconfig.ChemPropClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters": [[10, 1, 1, "", "ChemPropParametersAggregation_Norm"], [10, 1, 1, "", "ChemPropParametersBatch_Size"], [10, 1, 1, "", "ChemPropParametersDepth"], [10, 1, 1, "", "ChemPropParametersDropout"], [10, 1, 1, "", "ChemPropParametersFFN_Hidden_Size"], [10, 1, 1, "", "ChemPropParametersFFN_Num_Layers"], [10, 1, 1, "", "ChemPropParametersFinal_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersHidden_Size"], [10, 1, 1, "", "ChemPropParametersInit_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersMax_Lr_Exp"], [10, 1, 1, "", "ChemPropParametersWarmup_Epochs_Ratio"], [10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersAggregation_Norm": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersBatch_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersDropout": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersFFN_Hidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersFFN_Num_Layers": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersFinal_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersHidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersInit_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersMax_Lr_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropClassifier.Parameters.ChemPropParametersWarmup_Epochs_Ratio": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropFeatures_Generator": [[10, 5, 1, "", "MORGAN"], [10, 5, 1, "", "MORGAN_COUNT"], [10, 5, 1, "", "NONE"], [10, 5, 1, "", "RDKIT_2D"], [10, 5, 1, "", "RDKIT_2D_NORMALIZED"]], "optunaz.config.optconfig.ChemPropFrzn": [[10, 5, 1, "", "MPNN"], [10, 5, 1, "", "MPNN_FIRST_FFN"], [10, 5, 1, "", "MPNN_LAST_FFN"], [10, 5, 1, "", "NONE"]], "optunaz.config.optconfig.ChemPropHyperoptClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropHyperoptClassifier.Parameters": [[10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.optconfig.ChemPropHyperoptRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropHyperoptRegressor.Parameters": [[10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "num_iters"], [10, 5, 1, "", "search_parameter_level"]], "optunaz.config.optconfig.ChemPropRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters": [[10, 1, 1, "", "ChemPropParametersAggregation_Norm"], [10, 1, 1, "", "ChemPropParametersBatch_Size"], [10, 1, 1, "", "ChemPropParametersDepth"], [10, 1, 1, "", "ChemPropParametersDropout"], [10, 1, 1, "", "ChemPropParametersFFN_Hidden_Size"], [10, 1, 1, "", "ChemPropParametersFFN_Num_Layers"], [10, 1, 1, "", "ChemPropParametersFinal_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersHidden_Size"], [10, 1, 1, "", "ChemPropParametersInit_Lr_Ratio_Exp"], [10, 1, 1, "", "ChemPropParametersMax_Lr_Exp"], [10, 1, 1, "", "ChemPropParametersWarmup_Epochs_Ratio"], [10, 5, 1, "", "activation"], [10, 5, 1, "", "aggregation"], [10, 5, 1, "", "aggregation_norm"], [10, 5, 1, "", "batch_size"], [10, 5, 1, "", "depth"], [10, 5, 1, "", "dropout"], [10, 5, 1, "", "ensemble_size"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "features_generator"], [10, 5, 1, "", "ffn_hidden_size"], [10, 5, 1, "", "ffn_num_layers"], [10, 5, 1, "", "final_lr_ratio_exp"], [10, 5, 1, "", "hidden_size"], [10, 5, 1, "", "init_lr_ratio_exp"], [10, 5, 1, "", "max_lr_exp"], [10, 5, 1, "", "warmup_epochs_ratio"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersAggregation_Norm": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersBatch_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersDropout": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersFFN_Hidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersFFN_Num_Layers": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersFinal_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersHidden_Size": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersInit_Lr_Ratio_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersMax_Lr_Exp": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.ChemPropRegressor.Parameters.ChemPropParametersWarmup_Epochs_Ratio": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropRegressorPretrained": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.ChemPropRegressorPretrained.Parameters": [[10, 1, 1, "", "ChemPropParametersEpochs"], [10, 5, 1, "", "epochs"], [10, 5, 1, "", "frzn"], [10, 5, 1, "", "pretrained_model"]], "optunaz.config.optconfig.ChemPropRegressorPretrained.Parameters.ChemPropParametersEpochs": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"], [10, 5, 1, "", "q"]], "optunaz.config.optconfig.ChemPropSearch_Parameter_Level": [[10, 5, 1, "", "AUTO"], [10, 5, 1, "", "L1"], [10, 5, 1, "", "L2"], [10, 5, 1, "", "L3"], [10, 5, 1, "", "L4"], [10, 5, 1, "", "L5"], [10, 5, 1, "", "L6"], [10, 5, 1, "", "L7"], [10, 5, 1, "", "L8"]], "optunaz.config.optconfig.ClassificationScore": [[10, 5, 1, "", "ACCURACY"], [10, 5, 1, "", "AUC_PR_CAL"], [10, 5, 1, "", "AVERAGE_PRECISION"], [10, 5, 1, "", "BALANCED_ACCURACY"], [10, 5, 1, "", "BEDROC"], [10, 5, 1, "", "CONCORDANCE_INDEX"], [10, 5, 1, "", "F1"], [10, 5, 1, "", "F1_MACRO"], [10, 5, 1, "", "F1_MICRO"], [10, 5, 1, "", "F1_WEIGHTED"], [10, 5, 1, "", "JACCARD"], [10, 5, 1, "", "JACCARD_MACRO"], [10, 5, 1, "", "JACCARD_MICRO"], [10, 5, 1, "", "JACCARD_WEIGHTED"], [10, 5, 1, "", "NEG_BRIER_SCORE"], [10, 5, 1, "", "PRECISION"], [10, 5, 1, "", "PRECISION_MACRO"], [10, 5, 1, "", "PRECISION_MICRO"], [10, 5, 1, "", "PRECISION_WEIGHTED"], [10, 5, 1, "", "RECALL"], [10, 5, 1, "", "RECALL_MACRO"], [10, 5, 1, "", "RECALL_MICRO"], [10, 5, 1, "", "RECALL_WEIGHTED"], [10, 5, 1, "", "ROC_AUC"]], "optunaz.config.optconfig.KNeighborsClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.KNeighborsClassifier.Parameters": [[10, 1, 1, "", "KNeighborsClassifierParametersN_Neighbors"], [10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.optconfig.KNeighborsClassifier.Parameters.KNeighborsClassifierParametersN_Neighbors": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.KNeighborsMetric": [[10, 5, 1, "", "EUCLIDEAN"], [10, 5, 1, "", "MANHATTAN"], [10, 5, 1, "", "MINKOWSKI"]], "optunaz.config.optconfig.KNeighborsRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.KNeighborsRegressor.Parameters": [[10, 1, 1, "", "KNeighborsRegressorParametersN_Neighbors"], [10, 5, 1, "", "metric"], [10, 5, 1, "", "n_neighbors"], [10, 5, 1, "", "weights"]], "optunaz.config.optconfig.KNeighborsRegressor.Parameters.KNeighborsRegressorParametersN_Neighbors": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.KNeighborsWeights": [[10, 5, 1, "", "DISTANCE"], [10, 5, 1, "", "UNIFORM"]], "optunaz.config.optconfig.Lasso": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.Lasso.Parameters": [[10, 1, 1, "", "LassoParametersAlpha"], [10, 5, 1, "", "alpha"]], "optunaz.config.optconfig.Lasso.Parameters.LassoParametersAlpha": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.LogisticRegression": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.LogisticRegression.Parameters": [[10, 5, 1, "", "C"], [10, 1, 1, "", "LogisticRegressionParametersParameterC"], [10, 5, 1, "", "solver"]], "optunaz.config.optconfig.LogisticRegression.Parameters.LogisticRegressionParametersParameterC": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.Mapie": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.Mapie.Parameters": [[10, 5, 1, "", "estimator"], [10, 5, 1, "", "mapie_alpha"]], "optunaz.config.optconfig.OptimizationConfig": [[10, 1, 1, "", "Settings"], [10, 5, 1, "", "algorithms"], [10, 5, 1, "", "data"], [10, 5, 1, "", "description"], [10, 5, 1, "", "descriptors"], [10, 5, 1, "", "mode"], [10, 5, 1, "", "name"], [10, 3, 1, "", "set_algo_hashes"], [10, 3, 1, "", "set_cache"], [10, 5, 1, "", "settings"], [10, 5, 1, "", "task"], [10, 5, 1, "", "visualization"]], "optunaz.config.optconfig.OptimizationConfig.Settings": [[10, 5, 1, "", "cross_validation"], [10, 5, 1, "", "cv_split_strategy"], [10, 5, 1, "", "direction"], [10, 5, 1, "", "minimise_std_dev"], [10, 5, 1, "", "mode"], [10, 5, 1, "", "n_chemprop_trials"], [10, 5, 1, "", "n_jobs"], [10, 5, 1, "", "n_startup_trials"], [10, 5, 1, "", "n_trials"], [10, 5, 1, "", "optuna_storage"], [10, 5, 1, "", "random_seed"], [10, 5, 1, "", "scoring"], [10, 5, 1, "", "shuffle"], [10, 5, 1, "", "split_chemprop"], [10, 5, 1, "", "track_to_mlflow"], [10, 5, 1, "", "tracking_rest_endpoint"], [10, 5, 1, "", "use_cache"]], "optunaz.config.optconfig.PLSRegression": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.PLSRegression.Parameters": [[10, 1, 1, "", "NComponents"], [10, 5, 1, "", "n_components"]], "optunaz.config.optconfig.PLSRegression.Parameters.NComponents": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.PRFClassifier.Parameters": [[10, 1, 1, "", "PRFClassifierParametersMaxDepth"], [10, 1, 1, "", "PRFClassifierParametersMinPySumLeaf"], [10, 1, 1, "", "PRFClassifierParametersNEstimators"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "min_py_sum_leaf"], [10, 5, 1, "", "n_estimators"], [10, 5, 1, "", "use_py_gini"], [10, 5, 1, "", "use_py_leafs"]], "optunaz.config.optconfig.PRFClassifier.Parameters.PRFClassifierParametersMaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifier.Parameters.PRFClassifierParametersMinPySumLeaf": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifier.Parameters.PRFClassifierParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.PRFClassifierMaxFeatures": [[10, 5, 1, "", "AUTO"], [10, 5, 1, "", "LOG2"], [10, 5, 1, "", "SQRT"]], "optunaz.config.optconfig.RandomForestClassifier": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.RandomForestClassifier.Parameters": [[10, 1, 1, "", "RandomForestClassifierParametersMaxDepth"], [10, 1, 1, "", "RandomForestClassifierParametersNEstimators"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.RandomForestClassifier.Parameters.RandomForestClassifierParametersMaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RandomForestClassifier.Parameters.RandomForestClassifierParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RandomForestMaxFeatures": [[10, 5, 1, "", "AUTO"], [10, 5, 1, "", "LOG2"], [10, 5, 1, "", "SQRT"]], "optunaz.config.optconfig.RandomForestRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.RandomForestRegressor.Parameters": [[10, 1, 1, "", "RandomForestRegressorParametersMaxDepth"], [10, 1, 1, "", "RandomForestRegressorParametersNEstimators"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "max_features"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.RandomForestRegressor.Parameters.RandomForestRegressorParametersMaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RandomForestRegressor.Parameters.RandomForestRegressorParametersNEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.RegressionScore": [[10, 5, 1, "", "EXPLAINED_VARIANCE"], [10, 5, 1, "", "MAX_ERROR"], [10, 5, 1, "", "NEG_MEAN_ABSOLUTE_ERROR"], [10, 5, 1, "", "NEG_MEAN_SQUARED_ERROR"], [10, 5, 1, "", "NEG_MEDIAN_ABSOLUTE_ERROR"], [10, 5, 1, "", "R2"]], "optunaz.config.optconfig.Ridge": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.Ridge.Parameters": [[10, 1, 1, "", "Alpha"], [10, 5, 1, "", "alpha"]], "optunaz.config.optconfig.Ridge.Parameters.Alpha": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVC": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.SVC.Parameters": [[10, 5, 1, "", "C"], [10, 1, 1, "", "Gamma"], [10, 1, 1, "", "SVCParametersParameterC"], [10, 5, 1, "", "gamma"]], "optunaz.config.optconfig.SVC.Parameters.Gamma": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVC.Parameters.SVCParametersParameterC": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVR": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.SVR.Parameters": [[10, 5, 1, "", "C"], [10, 1, 1, "", "SVRParametersGamma"], [10, 1, 1, "", "SVRParametersParameterC"], [10, 5, 1, "", "gamma"]], "optunaz.config.optconfig.SVR.Parameters.SVRParametersGamma": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.SVR.Parameters.SVRParametersParameterC": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.XGBRegressor": [[10, 1, 1, "", "Parameters"], [10, 5, 1, "", "name"], [10, 5, 1, "", "parameters"]], "optunaz.config.optconfig.XGBRegressor.Parameters": [[10, 1, 1, "", "LearningRate"], [10, 1, 1, "", "MaxDepth"], [10, 1, 1, "", "NEstimators"], [10, 5, 1, "", "learning_rate"], [10, 5, 1, "", "max_depth"], [10, 5, 1, "", "n_estimators"]], "optunaz.config.optconfig.XGBRegressor.Parameters.LearningRate": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.XGBRegressor.Parameters.MaxDepth": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.config.optconfig.XGBRegressor.Parameters.NEstimators": [[10, 5, 1, "", "high"], [10, 5, 1, "", "low"]], "optunaz.datareader": [[9, 1, 1, "", "Dataset"], [9, 4, 1, "", "deduplicate"], [9, 4, 1, "", "isvalid"], [9, 4, 1, "", "merge"], [9, 4, 1, "", "read_data"], [9, 4, 1, "", "split"], [9, 4, 1, "", "transform"]], "optunaz.datareader.Dataset": [[9, 5, 1, "", "aux_column"], [9, 5, 1, "", "aux_transform"], [9, 3, 1, "", "check_sets"], [9, 5, 1, "", "deduplication_strategy"], [9, 3, 1, "", "get_merged_sets"], [9, 3, 1, "", "get_sets"], [9, 5, 1, "", "input_column"], [9, 5, 1, "", "intermediate_test_dataset_file"], [9, 5, 1, "", "intermediate_training_dataset_file"], [9, 5, 1, "", "log_transform"], [9, 5, 1, "", "log_transform_base"], [9, 5, 1, "", "log_transform_negative"], [9, 5, 1, "", "log_transform_unit_conversion"], [9, 5, 1, "", "probabilistic_threshold_representation"], [9, 5, 1, "", "probabilistic_threshold_representation_std"], [9, 5, 1, "", "probabilistic_threshold_representation_threshold"], [9, 5, 1, "", "response_column"], [9, 5, 1, "", "response_type"], [9, 5, 1, "", "save_intermediate_files"], [9, 5, 1, "", "split_strategy"], [9, 5, 1, "", "test_dataset_file"], [9, 5, 1, "", "training_dataset_file"]], "optunaz.descriptors": [[9, 1, 1, "", "AmorProtDescriptors"], [9, 1, 1, "", "Avalon"], [9, 1, 1, "", "CanonicalSmiles"], [9, 1, 1, "", "CompositeDescriptor"], [9, 1, 1, "", "ECFP"], [9, 1, 1, "", "ECFP_counts"], [9, 1, 1, "", "FittedSklearnScaler"], [9, 1, 1, "", "GenericScaffold"], [9, 1, 1, "", "JazzyDescriptors"], [9, 1, 1, "", "MACCS_keys"], [9, 1, 1, "", "MAPC"], [9, 1, 1, "", "MolDescriptor"], [9, 6, 1, "", "NoValidSmiles"], [9, 1, 1, "", "PathFP"], [9, 1, 1, "", "PhyschemDescriptors"], [9, 1, 1, "", "PrecomputedDescriptorFromFile"], [9, 1, 1, "", "RdkitDescriptor"], [9, 1, 1, "", "Scaffold"], [9, 1, 1, "", "ScaledDescriptor"], [9, 6, 1, "", "ScalingFittingError"], [9, 1, 1, "", "SmilesAndSideInfoFromFile"], [9, 1, 1, "", "SmilesFromFile"], [9, 1, 1, "", "UnfittedSklearnScaler"], [9, 1, 1, "", "UnscaledJazzyDescriptors"], [9, 1, 1, "", "UnscaledMAPC"], [9, 1, 1, "", "UnscaledPhyschemDescriptors"], [9, 1, 1, "", "UnscaledZScalesDescriptors"], [9, 1, 1, "", "ValidDescriptor"], [9, 1, 1, "", "ZScalesDescriptors"], [9, 4, 1, "", "descriptor_from_config"], [9, 4, 1, "", "mol_from_smi"], [9, 4, 1, "", "numpy_from_rdkit"]], "optunaz.descriptors.AmorProtDescriptors": [[9, 1, 1, "", "AmorProt"], [9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.AmorProtDescriptors.AmorProt": [[9, 3, 1, "", "T"], [9, 3, 1, "", "fingerprint"]], "optunaz.descriptors.Avalon": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.Avalon.Parameters": [[9, 5, 1, "", "nBits"]], "optunaz.descriptors.CanonicalSmiles": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.CompositeDescriptor": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 3, 1, "", "fp_info"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.CompositeDescriptor.Parameters": [[9, 5, 1, "", "descriptors"]], "optunaz.descriptors.ECFP": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ECFP.Parameters": [[9, 5, 1, "", "nBits"], [9, 5, 1, "", "radius"], [9, 5, 1, "", "returnRdkit"]], "optunaz.descriptors.ECFP_counts": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ECFP_counts.Parameters": [[9, 5, 1, "", "nBits"], [9, 5, 1, "", "radius"], [9, 5, 1, "", "useFeatures"]], "optunaz.descriptors.FittedSklearnScaler": [[9, 3, 1, "", "get_fitted_scaler"], [9, 5, 1, "", "name"], [9, 5, 1, "", "saved_params"]], "optunaz.descriptors.GenericScaffold": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.JazzyDescriptors": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.JazzyDescriptors.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "jazzy_filters"], [9, 5, 1, "", "jazzy_names"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.MACCS_keys": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.MAPC": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.MAPC.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "maxRadius"], [9, 5, 1, "", "nPermutations"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.MolDescriptor": [[9, 3, 1, "", "calculate_from_smi"], [9, 3, 1, "", "parallel_compute_descriptor"]], "optunaz.descriptors.PathFP": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.PathFP.Parameters": [[9, 5, 1, "", "fpSize"], [9, 5, 1, "", "maxPath"]], "optunaz.descriptors.PhyschemDescriptors": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.PhyschemDescriptors.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "rdkit_names"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.PrecomputedDescriptorFromFile": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 3, 1, "", "inference_parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.PrecomputedDescriptorFromFile.Parameters": [[9, 5, 1, "", "file"], [9, 5, 1, "", "input_column"], [9, 5, 1, "", "response_column"]], "optunaz.descriptors.RdkitDescriptor": [[9, 3, 1, "", "calculate_from_mol"], [9, 3, 1, "", "calculate_from_smi"]], "optunaz.descriptors.Scaffold": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ScaledDescriptor": [[9, 1, 1, "", "ScaledDescriptorParameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"], [9, 3, 1, "", "set_unfitted_scaler_data"]], "optunaz.descriptors.ScaledDescriptor.ScaledDescriptorParameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "scaler"]], "optunaz.descriptors.SmilesAndSideInfoFromFile": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.SmilesAndSideInfoFromFile.Parameters": [[9, 1, 1, "", "Aux_Weight_Pc"], [9, 5, 1, "", "aux_weight_pc"], [9, 5, 1, "", "file"], [9, 5, 1, "", "input_column"]], "optunaz.descriptors.SmilesAndSideInfoFromFile.Parameters.Aux_Weight_Pc": [[9, 5, 1, "", "high"], [9, 5, 1, "", "low"], [9, 5, 1, "", "q"]], "optunaz.descriptors.SmilesFromFile": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnfittedSklearnScaler": [[9, 1, 1, "", "MolData"], [9, 3, 1, "", "get_fitted_scaler_for_fp"], [9, 5, 1, "", "mol_data"], [9, 5, 1, "", "name"]], "optunaz.descriptors.UnfittedSklearnScaler.MolData": [[9, 5, 1, "", "file_path"], [9, 5, 1, "", "smiles_column"]], "optunaz.descriptors.UnscaledJazzyDescriptors": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnscaledJazzyDescriptors.Parameters": [[9, 5, 1, "", "jazzy_filters"], [9, 5, 1, "", "jazzy_names"]], "optunaz.descriptors.UnscaledMAPC": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnscaledMAPC.Parameters": [[9, 5, 1, "", "maxRadius"], [9, 5, 1, "", "nPermutations"]], "optunaz.descriptors.UnscaledPhyschemDescriptors": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_mol"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.UnscaledPhyschemDescriptors.Parameters": [[9, 5, 1, "", "rdkit_names"]], "optunaz.descriptors.UnscaledZScalesDescriptors": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ValidDescriptor": [[9, 1, 1, "", "Parameters"], [9, 3, 1, "", "calculate_from_smi"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ZScalesDescriptors": [[9, 1, 1, "", "Parameters"], [9, 5, 1, "", "name"], [9, 5, 1, "", "parameters"]], "optunaz.descriptors.ZScalesDescriptors.Parameters": [[9, 5, 1, "", "descriptor"], [9, 5, 1, "", "scaler"]], "optunaz.evaluate": [[9, 4, 1, "", "get_merged_train_score"], [9, 4, 1, "", "get_scores"], [9, 4, 1, "", "get_train_test_scores"], [9, 4, 1, "", "score_all"], [9, 4, 1, "", "score_all_smiles"]], "optunaz.explainability": [[9, 4, 1, "", "ExplainPreds"], [9, 4, 1, "", "ShapExplainer"], [9, 4, 1, "", "explain_ECFP"], [9, 4, 1, "", "get_ecfp_fpinfo"], [9, 4, 1, "", "get_ecfpcount_fpinfo"], [9, 4, 1, "", "get_fp_info"], [9, 4, 1, "", "runShap"]], "optunaz.metircs": [[9, 4, 1, "", "auc_pr_cal"], [9, 4, 1, "", "bedroc_score"], [9, 4, 1, "", "concordance_index"], [9, 4, 1, "", "validate_cls_input"]], "optunaz.model_writer": [[9, 1, 1, "", "Predictor"], [9, 1, 1, "", "QSARtunaModel"], [9, 4, 1, "", "get_metadata"], [9, 4, 1, "", "get_transform"], [9, 4, 1, "", "perform_ptr"], [9, 4, 1, "", "save_model"], [9, 4, 1, "", "wrap_model"]], "optunaz.model_writer.Predictor": [[9, 3, 1, "", "explain"], [9, 3, 1, "", "predict"], [9, 3, 1, "", "predict_proba"], [9, 3, 1, "", "predict_uncert"]], "optunaz.model_writer.QSARtunaModel": [[9, 5, 1, "", "aux_transform"], [9, 5, 1, "", "descriptor"], [9, 5, 1, "", "metadata"], [9, 5, 1, "", "mode"], [9, 3, 1, "", "predict_from_smiles"], [9, 5, 1, "", "predictor"], [9, 5, 1, "", "transform"]], "optunaz.objective": [[9, 6, 1, "", "NoValidDescriptors"], [9, 1, 1, "", "Objective"], [9, 4, 1, "", "null_scores"]], "optunaz.objective.Objective": [[9, 5, 1, "", "cache"], [9, 5, 1, "", "optconfig"], [9, 5, 1, "", "train_aux"], [9, 5, 1, "", "train_smiles"], [9, 5, 1, "", "train_y"]], "optunaz.optbuild": [[9, 4, 1, "", "main"]], "optunaz.predict": [[9, 6, 1, "", "ArgsError"], [9, 6, 1, "", "AuxCovariateMissing"], [9, 6, 1, "", "PrecomputedError"], [9, 6, 1, "", "UncertaintyError"], [9, 4, 1, "", "check_precomp_args"], [9, 4, 1, "", "main"], [9, 4, 1, "", "set_inference_params"], [9, 4, 1, "", "validate_args"], [9, 4, 1, "", "validate_aux"], [9, 4, 1, "", "validate_set_precomputed"], [9, 4, 1, "", "validate_uncertainty"]], "optunaz.schemagen": [[9, 4, 1, "", "doctitle"], [9, 4, 1, "", "main"], [9, 4, 1, "", "patch_schema_generic"], [9, 4, 1, "", "patch_schema_optunaz"], [9, 4, 1, "", "type_base_schema"]], "optunaz.three_step_opt_build_merge": [[9, 4, 1, "", "base_chemprop_params"], [9, 4, 1, "", "build_best"], [9, 4, 1, "", "build_merged"], [9, 4, 1, "", "buildconfig_best"], [9, 4, 1, "", "log_scores"], [9, 4, 1, "", "optimize"], [9, 4, 1, "", "run_study"], [9, 4, 1, "", "split_optimize"]], "optunaz.utils": [[12, 0, 0, "-", "enums"], [11, 0, 0, "-", "files_paths"], [11, 4, 1, "", "load_df_from_file"], [11, 0, 0, "-", "load_json"], [11, 4, 1, "", "md5_hash"], [11, 4, 1, "", "mkdict"], [11, 0, 0, "-", "mlflow"], [13, 0, 0, "-", "preprocessing"], [11, 4, 1, "", "remove_failed_idx"], [11, 0, 0, "-", "retraining"], [11, 0, 0, "-", "schema"], [11, 0, 0, "-", "tracking"]], "optunaz.utils.enums": [[12, 1, 1, "", "MlflowLogParams"], [12, 1, 1, "", "StudyUserAttrs"], [12, 1, 1, "", "TrialParams"], [12, 1, 1, "", "TrialUserAttrs"], [12, 0, 0, "-", "building_configuration_enum"], [12, 0, 0, "-", "configuration_enum"], [12, 0, 0, "-", "interface_enum"], [12, 0, 0, "-", "model_runner_enum"], [12, 0, 0, "-", "objective_enum"], [12, 0, 0, "-", "optimization_configuration_enum"], [12, 0, 0, "-", "prediction_configuration_enum"], [12, 0, 0, "-", "return_values_enum"], [12, 0, 0, "-", "visualization_enum"]], "optunaz.utils.enums.MlflowLogParams": [[12, 5, 1, "", "TRIAL_NUMBER"]], "optunaz.utils.enums.StudyUserAttrs": [[12, 5, 1, "", "OPTCONFIG"]], "optunaz.utils.enums.TrialParams": [[12, 5, 1, "", "ALGORITHM_HASH"], [12, 5, 1, "", "ALGORITHM_NAME"], [12, 5, 1, "", "DESCRIPTOR"]], "optunaz.utils.enums.TrialUserAttrs": [[12, 5, 1, "", "TEST_SCORES"], [12, 5, 1, "", "TRAIN_SCORES"]], "optunaz.utils.enums.building_configuration_enum": [[12, 1, 1, "", "BuildingConfigurationEnum"]], "optunaz.utils.enums.building_configuration_enum.BuildingConfigurationEnum": [[12, 5, 1, "", "GENERAL_CLASSIFIER"], [12, 5, 1, "", "GENERAL_HYPERPARAMETERS"], [12, 5, 1, "", "GENERAL_REGRESSOR"], [12, 5, 1, "", "METADATA"], [12, 5, 1, "", "METADATA_BESTTRIAL"], [12, 5, 1, "", "METADATA_BESTVALUE"]], "optunaz.utils.enums.configuration_enum": [[12, 1, 1, "", "ConfigurationEnum"]], "optunaz.utils.enums.configuration_enum.ConfigurationEnum": [[12, 5, 1, "", "ALGORITHMS"], [12, 5, 1, "", "ALGORITHMS_ADABOOSTCLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_ADABOOSTCLASSIFIER_LEARNING_RATE"], [12, 5, 1, "", "ALGORITHMS_ADABOOSTCLASSIFIER_N_ESTIMATORS"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_ENSEMBLE"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_ESTIMATOR"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_METHOD"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_N_FOLDS"], [12, 5, 1, "", "ALGORITHMS_CALIBRATEDCLASSIFIERCV_PARAMS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_ACTIVATION"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_AGGREGATION"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_AGGREGATION_NORM"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_BATCH_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_CLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_DEPTH"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_DROPOUT"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_ENSEMBLE_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_EPOCHS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FEATURES_GENERATOR"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FFN_HIDDEN_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FFN_NUM_LAYERS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FINAL_LR_RATIO_EXP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_FRZN"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_HIDDEN_SIZE"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_HYPEROPT_CLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_HYPEROPT_REGRESSOR"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_INIT_LR_RATIO_EXP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_MAX_LR_EXP"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_NUM_ITERS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_PRETRAINED_MODEL"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_REGRESSOR"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_SEARCH_PARAMETER_LEVEL"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_STARTUP_RANDOM_ITERS"], [12, 5, 1, "", "ALGORITHMS_CHEMPROP_WARMUP_EPOCHS_RATIO"], [12, 5, 1, "", "ALGORITHMS_HIGH"], [12, 5, 1, "", "ALGORITHMS_INTERFACE_SKLEARN"], [12, 5, 1, "", "ALGORITHMS_INTERFACE_XGBOOST"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORSCLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORSREGRESSOR"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORS_METRIC"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORS_N_NEIGHBORS"], [12, 5, 1, "", "ALGORITHMS_KNEIGHBORS_WEIGHTS"], [12, 5, 1, "", "ALGORITHMS_LASSO"], [12, 5, 1, "", "ALGORITHMS_LASSO_ALPHA"], [12, 5, 1, "", "ALGORITHMS_LOGISTICREGRESSION"], [12, 5, 1, "", "ALGORITHMS_LOGISTICREGRESSION_C"], [12, 5, 1, "", "ALGORITHMS_LOGISTICREGRESSION_SOLVER"], [12, 5, 1, "", "ALGORITHMS_LOW"], [12, 5, 1, "", "ALGORITHMS_MAPIE"], [12, 5, 1, "", "ALGORITHMS_MAPIE_ALPHA"], [12, 5, 1, "", "ALGORITHMS_PLSREGRESSION"], [12, 5, 1, "", "ALGORITHMS_PLSREGRESSION_N_COMPONENTS"], [12, 5, 1, "", "ALGORITHMS_PRF"], [12, 5, 1, "", "ALGORITHMS_PRF_MAX_DEPTH"], [12, 5, 1, "", "ALGORITHMS_PRF_MAX_FEATURES"], [12, 5, 1, "", "ALGORITHMS_PRF_MINPYSUMLEAF"], [12, 5, 1, "", "ALGORITHMS_PRF_N_ESTIMATORS"], [12, 5, 1, "", "ALGORITHMS_PRF_USE_PY_GINI"], [12, 5, 1, "", "ALGORITHMS_PRF_USE_PY_LEAFS"], [12, 5, 1, "", "ALGORITHMS_Q"], [12, 5, 1, "", "ALGORITHMS_RFCLASSIFIER"], [12, 5, 1, "", "ALGORITHMS_RFREGRESSOR"], [12, 5, 1, "", "ALGORITHMS_RF_MAX_DEPTH"], [12, 5, 1, "", "ALGORITHMS_RF_MAX_FEATURES"], [12, 5, 1, "", "ALGORITHMS_RF_N_ESTIMATORS"], [12, 5, 1, "", "ALGORITHMS_RIDGE"], [12, 5, 1, "", "ALGORITHMS_RIDGE_ALPHA"], [12, 5, 1, "", "ALGORITHMS_SVC"], [12, 5, 1, "", "ALGORITHMS_SVC_C"], [12, 5, 1, "", "ALGORITHMS_SVC_GAMMA"], [12, 5, 1, "", "ALGORITHMS_SVR"], [12, 5, 1, "", "ALGORITHMS_SVR_C"], [12, 5, 1, "", "ALGORITHMS_SVR_GAMMA"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR_LEARNING_RATE"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR_MAX_DEPTH"], [12, 5, 1, "", "ALGORITHMS_XGBREGRESSOR_N_ESTIMATORS"], [12, 5, 1, "", "DATA"], [12, 5, 1, "", "DATA_INPUTCOLUMN"], [12, 5, 1, "", "DATA_RESPONSECOLUMN"], [12, 5, 1, "", "DATA_TEST"], [12, 5, 1, "", "DATA_TRAINING"], [12, 5, 1, "", "DESCRIPTORS"], [12, 5, 1, "", "DESCRIPTORS_AMORPROT"], [12, 5, 1, "", "DESCRIPTORS_AVALON"], [12, 5, 1, "", "DESCRIPTORS_AVALON_NBITS"], [12, 5, 1, "", "DESCRIPTORS_COMPOSITE"], [12, 5, 1, "", "DESCRIPTORS_ECFP"], [12, 5, 1, "", "DESCRIPTORS_ECFPCOUNTS"], [12, 5, 1, "", "DESCRIPTORS_ECFPCOUNTS_RADIUS"], [12, 5, 1, "", "DESCRIPTORS_ECFPCOUNTS_USEFEATURES"], [12, 5, 1, "", "DESCRIPTORS_ECFP_NBITS"], [12, 5, 1, "", "DESCRIPTORS_ECFP_RADIUS"], [12, 5, 1, "", "DESCRIPTORS_JAZZY"], [12, 5, 1, "", "DESCRIPTORS_JAZZY_JAZZYNAMES"], [12, 5, 1, "", "DESCRIPTORS_MACCSKEYS"], [12, 5, 1, "", "DESCRIPTORS_MAPC"], [12, 5, 1, "", "DESCRIPTORS_MAPC_MAXRADIUS"], [12, 5, 1, "", "DESCRIPTORS_MAPC_NPERMUTATIONS"], [12, 5, 1, "", "DESCRIPTORS_PATHFP"], [12, 5, 1, "", "DESCRIPTORS_PATHFP_FPSIZE"], [12, 5, 1, "", "DESCRIPTORS_PATHFP_MAXPATH"], [12, 5, 1, "", "DESCRIPTORS_PHYSCHEM"], [12, 5, 1, "", "DESCRIPTORS_PHYSCHEM_RDKITNAMES"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED_FILE"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED_INPUT_COLUMNN"], [12, 5, 1, "", "DESCRIPTORS_PRECOMPUTED_RESPONSE_COLUMN"], [12, 5, 1, "", "DESCRIPTORS_SCALED"], [12, 5, 1, "", "DESCRIPTORS_SCALED_DESCRIPTOR"], [12, 5, 1, "", "DESCRIPTORS_SCALED_DESCRIPTOR_PARAMETERS"], [12, 5, 1, "", "DESCRIPTORS_SMILES"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI_AUX_WEIGHT_PC"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI_FILE"], [12, 5, 1, "", "DESCRIPTORS_SMILES_AND_SI_INPUT_COLUMN"], [12, 5, 1, "", "DESCRIPTORS_UNSC_JAZZY"], [12, 5, 1, "", "DESCRIPTORS_UNSC_MAPC"], [12, 5, 1, "", "DESCRIPTORS_UNSC_PHYSCHEM"], [12, 5, 1, "", "DESCRIPTORS_UNSC_ZSCALES"], [12, 5, 1, "", "DESCRIPTORS_ZSCALES"], [12, 5, 1, "", "GENERAL_DISABLED"], [12, 5, 1, "", "GENERAL_PARAMETERS"], [12, 5, 1, "", "SETTINGS"], [12, 5, 1, "", "SETTINGS_CROSS_VALIDATION"], [12, 5, 1, "", "SETTINGS_DIRECTION"], [12, 5, 1, "", "SETTINGS_MODE"], [12, 5, 1, "", "SETTINGS_MODE_CLASSIFICATION"], [12, 5, 1, "", "SETTINGS_MODE_REGRESSION"], [12, 5, 1, "", "SETTINGS_N_JOBS"], [12, 5, 1, "", "SETTINGS_N_TRIALS"], [12, 5, 1, "", "SETTINGS_SHUFFLE"], [12, 5, 1, "", "TASK"], [12, 5, 1, "", "TASK_BUILDING"], [12, 5, 1, "", "TASK_OPTIMIZATION"]], "optunaz.utils.enums.interface_enum": [[12, 1, 1, "", "InterfaceEnum"]], "optunaz.utils.enums.interface_enum.InterfaceEnum": [[12, 5, 1, "", "CALIBRATED_SET"], [12, 5, 1, "", "CHEMPROP_SET"], [12, 5, 1, "", "PRF_SET"], [12, 5, 1, "", "SKLEARN_SET"], [12, 5, 1, "", "XGBOOST_SET"]], "optunaz.utils.enums.model_runner_enum": [[12, 1, 1, "", "ModelRunnerDataframeEnum"]], "optunaz.utils.enums.model_runner_enum.ModelRunnerDataframeEnum": [[12, 5, 1, "", "SET"], [12, 5, 1, "", "SMILES"], [12, 5, 1, "", "TEST"], [12, 5, 1, "", "TRAIN"], [12, 5, 1, "", "Y_PRED"], [12, 5, 1, "", "Y_TRUE"]], "optunaz.utils.enums.objective_enum": [[12, 1, 1, "", "ObjectiveEnum"]], "optunaz.utils.enums.objective_enum.ObjectiveEnum": [[12, 5, 1, "", "ATTRIBUTE_TRIAL_TRAIN_SCORE"], [12, 5, 1, "", "EXTRA_COLUMN_BESTHIT"]], "optunaz.utils.enums.optimization_configuration_enum": [[12, 1, 1, "", "OptimizationConfigurationEnum"]], "optunaz.utils.enums.prediction_configuration_enum": [[12, 1, 1, "", "PredictionConfigurationEnum"]], "optunaz.utils.enums.prediction_configuration_enum.PredictionConfigurationEnum": [[12, 5, 1, "", "DATA_DATASET"]], "optunaz.utils.enums.return_values_enum": [[12, 1, 1, "", "SklearnReturnValueEnum"], [12, 1, 1, "", "XGBoostReturnValueEnum"]], "optunaz.utils.enums.return_values_enum.SklearnReturnValueEnum": [[12, 5, 1, "", "CROSS_VALIDATE_FIT_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_SCORE_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_TEST_SCORE"], [12, 5, 1, "", "CROSS_VALIDATE_TRAIN_SCORE"]], "optunaz.utils.enums.return_values_enum.XGBoostReturnValueEnum": [[12, 5, 1, "", "CROSS_VALIDATE_FIT_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_SCORE_TIME"], [12, 5, 1, "", "CROSS_VALIDATE_TEST_SCORE"], [12, 5, 1, "", "CROSS_VALIDATE_TRAIN_SCORE"]], "optunaz.utils.enums.visualization_enum": [[12, 1, 1, "", "VisualizationEnum"]], "optunaz.utils.enums.visualization_enum.VisualizationEnum": [[12, 5, 1, "", "OPTUNA_SYSTEM_ATTRS_INTERMEDIATE_VALUES"], [12, 5, 1, "", "OPTUNA_SYSTEM_ATTRS_NUMBER"], [12, 5, 1, "", "OPTUNA_SYSTEM_ATTRS_TRIAL_ID"], [12, 5, 1, "", "VISUALIZATION"], [12, 5, 1, "", "VISUALIZATION_CLASSIFIER"], [12, 5, 1, "", "VISUALIZATION_FILE_FORMAT"], [12, 5, 1, "", "VISUALIZATION_OUTPUT_FOLDER"], [12, 5, 1, "", "VISUALIZATION_PLOTS"], [12, 5, 1, "", "VISUALIZATION_PLOTS_CONTOUR"], [12, 5, 1, "", "VISUALIZATION_PLOTS_HISTORY"], [12, 5, 1, "", "VISUALIZATION_PLOTS_PARALLEL_COORDINATE"], [12, 5, 1, "", "VISUALIZATION_PLOTS_SLICE"], [12, 5, 1, "", "VISUALIZATION_REGRESSOR"], [12, 5, 1, "", "VISUALIZATION_USE_XVFB"]], "optunaz.utils.files_paths": [[11, 4, 1, "", "attach_root_path"], [11, 4, 1, "", "move_up_directory"]], "optunaz.utils.load_json": [[11, 4, 1, "", "loadJSON"]], "optunaz.utils.mlflow": [[11, 1, 1, "", "MLflowCallback"], [11, 4, 1, "", "add_ellipsis"], [11, 4, 1, "", "shorten_names"]], "optunaz.utils.mlflow.MLflowCallback": [[11, 5, 1, "", "optconfig"], [11, 3, 1, "", "prepare_tags"], [11, 3, 1, "", "tmp_buildconfig"], [11, 5, 1, "", "tracking_uri"], [11, 5, 1, "", "trial_number_offset"]], "optunaz.utils.preprocessing": [[13, 0, 0, "-", "deduplicator"], [13, 0, 0, "-", "splitter"], [13, 0, 0, "-", "transform"]], "optunaz.utils.preprocessing.deduplicator": [[13, 1, 1, "", "Deduplicator"], [13, 1, 1, "", "KeepAllNoDeduplication"], [13, 1, 1, "", "KeepAvg"], [13, 1, 1, "", "KeepFirst"], [13, 1, 1, "", "KeepLast"], [13, 1, 1, "", "KeepMax"], [13, 1, 1, "", "KeepMedian"], [13, 1, 1, "", "KeepMin"], [13, 1, 1, "", "KeepRandom"]], "optunaz.utils.preprocessing.deduplicator.Deduplicator": [[13, 3, 1, "", "dedup"]], "optunaz.utils.preprocessing.deduplicator.KeepAllNoDeduplication": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepAvg": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepFirst": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepLast": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepMax": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepMedian": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepMin": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"]], "optunaz.utils.preprocessing.deduplicator.KeepRandom": [[13, 3, 1, "", "dedup"], [13, 5, 1, "", "name"], [13, 5, 1, "", "seed"]], "optunaz.utils.preprocessing.splitter": [[13, 1, 1, "", "GroupingSplitter"], [13, 1, 1, "", "HistogramStratifiedShuffleSplit"], [13, 1, 1, "", "KFold"], [13, 1, 1, "", "NoSplitting"], [14, 1, 1, "", "Predefined"], [14, 1, 1, "", "Random"], [14, 1, 1, "", "ScaffoldSplit"], [13, 1, 1, "", "SklearnSplitter"], [13, 1, 1, "", "Splitter"], [14, 1, 1, "", "Stratified"], [14, 1, 1, "", "Temporal"], [13, 4, 1, "", "butina_cluster"], [13, 4, 1, "", "fd_bin"], [13, 4, 1, "", "stratify"]], "optunaz.utils.preprocessing.splitter.GroupingSplitter": [[13, 3, 1, "", "groups"]], "optunaz.utils.preprocessing.splitter.HistogramStratifiedShuffleSplit": [[13, 5, 1, "", "bins"], [13, 3, 1, "", "get_n_splits"], [13, 5, 1, "", "n_splits"], [13, 5, 1, "", "random_state"], [13, 3, 1, "", "split"], [13, 5, 1, "", "test_fraction"]], "optunaz.utils.preprocessing.splitter.KFold": [[13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 5, 1, "", "random_state"], [13, 5, 1, "", "shuffle"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.NoSplitting": [[13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Predefined": [[13, 5, 1, "", "column_name"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 3, 1, "", "groups"], [13, 5, 1, "", "name"], [14, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Random": [[13, 5, 1, "", "fraction"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 5, 1, "", "seed"]], "optunaz.utils.preprocessing.splitter.ScaffoldSplit": [[13, 5, 1, "", "bins"], [13, 5, 1, "", "butina_cluster"], [13, 3, 1, "", "get_n_splits"], [13, 3, 1, "", "get_sklearn_splitter"], [14, 3, 1, "", "groups"], [13, 5, 1, "", "make_scaffold_generic"], [13, 5, 1, "", "name"], [13, 5, 1, "", "random_state"], [14, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.SklearnSplitter": [[13, 3, 1, "", "get_n_splits"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Splitter": [[13, 3, 1, "", "get_sklearn_splitter"], [13, 3, 1, "", "split"]], "optunaz.utils.preprocessing.splitter.Stratified": [[13, 5, 1, "", "bins"], [13, 5, 1, "", "fraction"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [13, 5, 1, "", "seed"]], "optunaz.utils.preprocessing.splitter.Temporal": [[13, 5, 1, "", "fraction"], [13, 3, 1, "", "get_sklearn_splitter"], [13, 5, 1, "", "name"], [14, 3, 1, "", "split"]], "optunaz.utils.preprocessing.transform": [[13, 1, 1, "", "AmorProt"], [13, 1, 1, "", "AuxTransformer"], [13, 1, 1, "", "DataTransform"], [13, 6, 1, "", "DataTransformError"], [13, 1, 1, "", "LogBase"], [13, 1, 1, "", "LogNegative"], [15, 1, 1, "", "ModelDataTransform"], [15, 1, 1, "", "PTRTransform"], [15, 1, 1, "", "VectorFromColumn"], [15, 1, 1, "", "ZScales"]], "optunaz.utils.preprocessing.transform.AmorProt": [[13, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.AuxTransformer": [[13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.DataTransform": [[13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.LogBase": [[13, 5, 1, "", "LOG"], [13, 5, 1, "", "LOG10"], [13, 5, 1, "", "LOG2"]], "optunaz.utils.preprocessing.transform.LogNegative": [[13, 5, 1, "", "FALSE"], [13, 5, 1, "", "TRUE"]], "optunaz.utils.preprocessing.transform.ModelDataTransform": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "base_dict"], [13, 5, 1, "", "base_negation"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 5, 1, "", "reverse_dict"], [13, 3, 1, "", "reverse_transform"], [13, 3, 1, "", "reverse_transform_df"], [13, 3, 1, "", "reverse_transform_one"], [13, 3, 1, "", "transform"], [13, 3, 1, "", "transform_df"], [13, 3, 1, "", "transform_one"]], "optunaz.utils.preprocessing.transform.ModelDataTransform.Parameters": [[13, 5, 1, "", "base"], [13, 5, 1, "", "conversion"], [13, 5, 1, "", "negation"]], "optunaz.utils.preprocessing.transform.PTRTransform": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "reverse_transform"], [13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.PTRTransform.Parameters": [[13, 5, 1, "", "std"], [13, 5, 1, "", "threshold"]], "optunaz.utils.preprocessing.transform.VectorFromColumn": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "transform"]], "optunaz.utils.preprocessing.transform.VectorFromColumn.Parameters": [[13, 5, 1, "", "delimiter"]], "optunaz.utils.preprocessing.transform.ZScales": [[15, 1, 1, "", "Parameters"], [13, 5, 1, "", "name"], [13, 5, 1, "", "parameters"], [13, 3, 1, "", "transform"]], "optunaz.utils.retraining": [[11, 6, 1, "", "NoDifferingRetrainingData"], [11, 6, 1, "", "NoNewRetrainingData"], [11, 6, 1, "", "NoPreviousModel"], [11, 6, 1, "", "NoRetrainingDataConvention"], [11, 6, 1, "", "RetrainingHeadersIssue"], [11, 6, 1, "", "RetrainingIsAlreadyProcessed"], [11, 6, 1, "", "RetrainingIsLocked"], [11, 6, 1, "", "SamePreviousModel"], [11, 6, 1, "", "SlurmJobSkip"], [11, 6, 1, "", "SlurmMemoryExceeded"], [11, 6, 1, "", "SlurmNoLog"], [11, 6, 1, "", "SlurmParseError"], [11, 6, 1, "", "SlurmTimeLimitExceeded"], [11, 6, 1, "", "TemporalPredsPredicted"], [11, 6, 1, "", "TimepointSkipped"]], "optunaz.utils.schema": [[11, 4, 1, "", "add_boolean_guards_for_schema_properties"], [11, 4, 1, "", "addsibling"], [11, 4, 1, "", "addtitles"], [11, 4, 1, "", "copytitle"], [11, 4, 1, "", "create_dependency"], [11, 4, 1, "", "delsibling"], [11, 4, 1, "", "getref"], [11, 4, 1, "", "remove_schema_properties"], [11, 4, 1, "", "replaceenum"], [11, 4, 1, "", "replacekey"], [11, 4, 1, "", "replacevalue"]], "optunaz.utils.tracking": [[11, 1, 1, "", "BuildTrackingData"], [11, 1, 1, "", "Datapoint"], [11, 1, 1, "", "InternalTrackingCallback"], [11, 1, 1, "", "TrackingData"], [11, 4, 1, "", "get_authorization_header"], [11, 4, 1, "", "removeprefix"], [11, 4, 1, "", "round_scores"], [11, 4, 1, "", "track_build"]], "optunaz.utils.tracking.BuildTrackingData": [[11, 5, 1, "", "response_column_name"], [11, 5, 1, "", "test_points"], [11, 5, 1, "", "test_scores"]], "optunaz.utils.tracking.Datapoint": [[11, 5, 1, "", "expected"], [11, 5, 1, "", "predicted"], [11, 5, 1, "", "smiles"]], "optunaz.utils.tracking.InternalTrackingCallback": [[11, 5, 1, "", "optconfig"], [11, 5, 1, "", "trial_number_offset"]], "optunaz.utils.tracking.TrackingData": [[11, 5, 1, "", "all_cv_test_scores"], [11, 5, 1, "", "buildconfig"], [11, 5, 1, "", "scoring"], [11, 5, 1, "", "trial_number"], [11, 5, 1, "", "trial_state"], [11, 5, 1, "", "trial_value"]], "optunaz.visualizer": [[9, 1, 1, "", "Visualizer"]], "optunaz.visualizer.Visualizer": [[9, 3, 1, "", "plot_by_configuration"], [9, 3, 1, "", "plot_contour"], [9, 3, 1, "", "plot_history"], [9, 3, 1, "", "plot_parallel_coordinate"], [9, 3, 1, "", "plot_slice"]]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:property", "3": "py:method", "4": "py:function", "5": "py:attribute", "6": "py:exception"}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "property", "Python property"], "3": ["py", "method", "Python method"], "4": ["py", "function", "Python function"], "5": ["py", "attribute", "Python attribute"], "6": ["py", "exception", "Python exception"]}, "titleterms": {"qsartuna": [0, 4, 7, 8], "\ud80c\udd9b": 0, "qsar": 0, "us": 0, "optim": [0, 6, 7], "hyperparamet": 0, "tune": 0, "formerli": 0, "optuna": 0, "az": 0, "qptuna": [0, 6], "background": [0, 6, 7], "The": [0, 6, 7], "three": [0, 6, 7], "step": [0, 6, 7], "process": [0, 6, 7], "json": 0, "base": [0, 8], "command": 0, "line": 0, "interfac": 0, "configur": [0, 6, 7], "file": [0, 6, 7], "run": [0, 6, 7], "from": [0, 6, 7, 8], "python": 0, "jupyt": 0, "notebook": 0, "via": 0, "cli": [0, 6, 7], "submit": 0, "slurm": 0, "model": [0, 6, 7], "option": [0, 6, 7], "inspect": 0, "automl": [0, 6, 7, 9], "automat": 0, "machin": 0, "learn": [0, 6, 7], "ad": 0, "descriptor": [0, 3, 6, 7, 9], "algorithm": [0, 1, 6, 7], "avail": [1, 2, 3, 14, 15], "adaboostclassifi": 1, "lasso": 1, "kneighborsclassifi": 1, "kneighborsregressor": 1, "logisticregress": 1, "plsregress": 1, "randomforestclassifi": 1, "randomforestregressor": 1, "ridg": 1, "svc": 1, "svr": 1, "xgbregressor": 1, "prfclassifi": 1, "chempropregressor": 1, "chempropclassifi": 1, "chemprophyperoptclassifi": 1, "chemprophyperoptregressor": 1, "chempropregressorpretrain": 1, "calibratedclassifiercvwithva": 1, "mapi": [1, 6, 7], "dedupl": [2, 8, 13], "keepfirst": 2, "keeplast": 2, "keeprandom": 2, "keepmin": 2, "keepmax": 2, "keepavg": 2, "keepmedian": 2, "keepkeepallnodedupl": 2, "avalon": 3, "ecfp": 3, "ecfp_count": 3, "pathfp": 3, "maccs_kei": 3, "unscaledphyschemdescriptor": 3, "unscaledjazzydescriptor": 3, "unscaledzscalesdescriptor": 3, "physchemdescriptor": 3, "jazzydescriptor": 3, "precomputeddescriptorfromfil": 3, "zscale": [3, 15], "smilesfromfil": 3, "smilesandsideinfofromfil": 3, "scaleddescriptor": 3, "compositedescriptor": 3, "welcom": 4, "document": 4, "develop": 4, "optunaz": [5, 9, 10, 11, 12, 13], "tutori": [6, 7], "thi": [6, 7], "prepar": [6, 7], "regress": [6, 7], "exampl": [6, 7], "creat": [6, 7], "visual": [6, 7, 9], "progress": [6, 7], "pick": [6, 7], "best": [6, 7, 8], "trial": [6, 7], "build": [6, 7], "merg": [6, 7], "preprocess": [6, 7, 8, 13], "split": [6, 7, 8], "data": [6, 7, 8], "train": [6, 7], "test": [6, 7], "set": [6, 7], "remov": [6, 7], "duplic": [6, 7, 8], "dataset": [6, 7], "choos": [6, 7], "score": [6, 7], "function": [6, 7], "advanc": [6, 7], "functoinail": [6, 7], "probabilist": [6, 7, 8], "random": [6, 7, 8, 14], "forest": [6, 7], "prf": [6, 7], "interlud": [6, 7, 8], "cautionari": [6, 7], "advic": [6, 7], "y": [6, 7], "respons": [6, 7], "column": [6, 7], "valid": [6, 7], "chemprop": [6, 7], "simpl": [6, 7], "separ": [6, 7], "shallow": [6, 7], "method": [6, 7], "default": [6, 7], "behavior": [6, 7], "turn": [6, 7], "hyperopt": [6, 7], "within": [6, 7, 8], "functionail": [6, 7], "veri": [6, 7], "larg": [6, 7], "comput": [6, 7], "cost": [6, 7], "A": [6, 7], "note": [6, 7], "mpnn": [6, 7], "search": [6, 7], "space": [6, 7], "side": [6, 7], "inform": [6, 7], "multi": [6, 7], "task": [6, 7], "mtl": [6, 7], "combin": [6, 7], "onli": [6, 7], "recommend": [6, 7], "long": [6, 7], "time": [6, 7], "pre": [6, 7], "adapt": [6, 7], "transfer": [6, 7], "fingerprint": [6, 7], "encod": [6, 7], "latent": [6, 7], "represent": [6, 7, 8], "probabl": [6, 7], "calibr": [6, 7], "classif": [6, 7], "uncertainti": [6, 7], "estim": [6, 7], "vennab": [6, 7], "ensembl": [6, 7], "dropout": [6, 7], "explain": [6, 7, 9], "shap": [6, 7], "interpret": [6, 7], "log": [6, 7, 8], "transform": [6, 7, 8, 13, 15], "covari": [6, 7], "one": [6, 7], "e": [6, 7], "g": [6, 7], "dose": [6, 7], "point": [6, 7], "co": [6, 7], "variat": [6, 7], "proteochemometr": [6, 7], "pcm": [6, 7], "more": [6, 7], "vectorfromsmil": [6, 7], "z": [6, 7], "scale": [6, 7], "object": [6, 7, 9], "priorit": [6, 7], "perform": [6, 7, 8], "standard": [6, 7], "deviat": [6, 7], "further": [6, 7], "precomput": [6, 7], "autom": [6, 7], "retrain": [6, 7, 11], "overview": [6, 7], "high": [6, 7], "hpc": [6, 7], "setup": [6, 7], "extract": [6, 7], "walkthough": [6, 7], "an": [6, 7], "pipelin": 7, "schedul": 7, "daemon": 7, "up": 7, "date": 7, "introduct": 8, "translat": 8, "sdf": 8, "csv": 8, "need": 8, "deal": 8, "compar": 8, "differ": 8, "strategi": 8, "tempor": [8, 14], "stratifi": [8, 14], "scaffold": 8, "input": 8, "user": 8, "import": 8, "logarithm": 8, "dataread": [8, 9], "threshold": 8, "ptr": [8, 15], "experiment": 8, "error": 8, "definit": 8, "implement": 8, "conclus": 8, "calcul": 8, "evalu": [8, 9], "reproduc": 8, "practic": 8, "packag": [9, 10, 11, 12, 13], "subpackag": [9, 11], "submodul": [9, 10, 11, 12, 13], "modul": [9, 10, 11, 12, 13], "builder": 9, "metirc": 9, "model_writ": 9, "optbuild": 9, "predict": 9, "schemagen": 9, "three_step_opt_build_merg": 9, "content": [9, 10, 11, 12, 13], "config": 10, "build_from_opt": 10, "buildconfig": 10, "optconfig": 10, "util": [11, 12, 13], "files_path": 11, "load_json": 11, "mlflow": 11, "schema": 11, "track": 11, "enum": 12, "building_configuration_enum": 12, "configuration_enum": 12, "interface_enum": 12, "model_runner_enum": 12, "objective_enum": 12, "optimization_configuration_enum": 12, "prediction_configuration_enum": 12, "return_values_enum": 12, "visualization_enum": 12, "splitter": [13, 14], "predefin": 14, "scaffoldsplit": 14, "modeldatatransform": 15, "vectorfromcolumn": 15}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "nbsphinx": 4, "sphinx.ext.todo": 2, "sphinx.ext.viewcode": 1, "sphinx": 56}}) \ No newline at end of file diff --git a/notebooks/QSARtuna_Tutorial.ipynb b/notebooks/QSARtuna_Tutorial.ipynb index 3968fe6..030a871 100644 --- a/notebooks/QSARtuna_Tutorial.ipynb +++ b/notebooks/QSARtuna_Tutorial.ipynb @@ -893,7 +893,7 @@ "text": [ "[I 2024-08-27 14:01:27,262] A new study created in memory with name: my_study_stratified_split\n", "[I 2024-08-27 14:01:27,303] A new study created in memory with name: study_name_0\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 14:01:27,408] Trial 0 finished with value: -3999.9364276424735 and parameters: {'algorithm_name': 'SVR', 'SVR_algorithm_hash': 'ea7ccc7ef4a9329af0d4e39eb6184933', 'gamma__ea7ccc7ef4a9329af0d4e39eb6184933': 0.11270803112210707, 'C__ea7ccc7ef4a9329af0d4e39eb6184933': 43.81076443656638, 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3999.9364276424735.\n", "[I 2024-08-27 14:01:27,485] Trial 1 finished with value: -1856.4459752935309 and parameters: {'algorithm_name': 'PLSRegression', 'PLSRegression_algorithm_hash': '9f2f76e479633c0bf18cf2912fed9eda', 'n_components__9f2f76e479633c0bf18cf2912fed9eda': 4, 'descriptor': '{\"name\": \"MACCS_keys\", \"parameters\": {}}'}. Best is trial 1 with value: -1856.4459752935309.\n", @@ -1726,9 +1726,9 @@ "Traceback (most recent call last):\n", " File \"/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/optuna/study/_optimize.py\", line 196, in _run_trial\n", " value_or_values = func(trial)\n", - " File \"/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/objective.py\", line 128, in __call__\n", + " File \"/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/objective.py\", line 128, in __call__\n", " self._validate_algos()\n", - " File \"/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/objective.py\", line 270, in _validate_algos\n", + " File \"/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/objective.py\", line 270, in _validate_algos\n", " raise ValueError(\n", "ValueError: PRFClassifier supplied but response column outside [0.0-1.0] acceptable range. Response max: 9.7, response min: 5.3 \n", "[W 2024-08-27 14:02:47,253] Trial 0 failed with value None.\n" @@ -3388,7 +3388,7 @@ "[I 2024-08-27 14:09:24,367] A new study created in memory with name: my_study\n", "[I 2024-08-27 14:09:24,410] A new study created in memory with name: study_name_0\n", "INFO:root:Enqueued ChemProp manual trial with sensible defaults: {'activation__fd833c2dde0b7147e6516ea5eebb2657': 'ReLU', 'aggregation__fd833c2dde0b7147e6516ea5eebb2657': 'mean', 'aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657': 100, 'batch_size__fd833c2dde0b7147e6516ea5eebb2657': 50, 'depth__fd833c2dde0b7147e6516ea5eebb2657': 3, 'dropout__fd833c2dde0b7147e6516ea5eebb2657': 0.0, 'features_generator__fd833c2dde0b7147e6516ea5eebb2657': 'none', 'ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300, 'ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657': 2, 'final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300, 'init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657': -3, 'warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657': 0.1, 'algorithm_name': 'ChemPropClassifier', 'ChemPropClassifier_algorithm_hash': 'fd833c2dde0b7147e6516ea5eebb2657'}\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:859)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:859)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 14:16:18,484] Trial 0 finished with value: 0.65625 and parameters: {'algorithm_name': 'ChemPropClassifier', 'ChemPropClassifier_algorithm_hash': 'fd833c2dde0b7147e6516ea5eebb2657', 'activation__fd833c2dde0b7147e6516ea5eebb2657': , 'aggregation__fd833c2dde0b7147e6516ea5eebb2657': , 'aggregation_norm__fd833c2dde0b7147e6516ea5eebb2657': 100.0, 'batch_size__fd833c2dde0b7147e6516ea5eebb2657': 50.0, 'depth__fd833c2dde0b7147e6516ea5eebb2657': 3.0, 'dropout__fd833c2dde0b7147e6516ea5eebb2657': 0.0, 'ensemble_size__fd833c2dde0b7147e6516ea5eebb2657': 5, 'epochs__fd833c2dde0b7147e6516ea5eebb2657': 4, 'features_generator__fd833c2dde0b7147e6516ea5eebb2657': , 'ffn_hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'ffn_num_layers__fd833c2dde0b7147e6516ea5eebb2657': 2.0, 'final_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'hidden_size__fd833c2dde0b7147e6516ea5eebb2657': 300.0, 'init_lr_ratio_exp__fd833c2dde0b7147e6516ea5eebb2657': -4, 'max_lr_exp__fd833c2dde0b7147e6516ea5eebb2657': -3, 'warmup_epochs_ratio__fd833c2dde0b7147e6516ea5eebb2657': 0.1, 'descriptor': '{\"name\": \"SmilesFromFile\", \"parameters\": {}}'}. Best is trial 0 with value: 0.65625.\n", " \r" @@ -4745,7 +4745,7 @@ "text": [ "[I 2024-08-27 15:09:26,977] A new study created in memory with name: non-transform_example\n", "[I 2024-08-27 15:09:26,979] A new study created in memory with name: study_name_0\n", - "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_Qptuna/D/QSARtuna/optunaz/descriptors.py:180)\n", + "/Users/kljk345/Library/Caches/pypoetry/virtualenvs/qsartuna-9ZyW8GtC-py3.10/lib/python3.10/site-packages/joblib/memory.py:577: JobLibCollisionWarning: Possible name collisions between functions 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:-1) and 'calculate_from_smi' (/Users/kljk345/PycharmProjects/Public_QSARtuna/D/QSARtuna/optunaz/descriptors.py:180)\n", " return self._cached_call(args, kwargs, shelving=False)[0]\n", "[I 2024-08-27 15:09:27,144] Trial 0 finished with value: -3501.942111261296 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 5, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", "[I 2024-08-27 15:09:27,220] Trial 1 finished with value: -5451.207265576796 and parameters: {'algorithm_name': 'RandomForestRegressor', 'RandomForestRegressor_algorithm_hash': 'f1ac01e1bba332215ccbd0c29c9ac3c3', 'max_depth__f1ac01e1bba332215ccbd0c29c9ac3c3': 7, 'n_estimators__f1ac01e1bba332215ccbd0c29c9ac3c3': 6, 'max_features__f1ac01e1bba332215ccbd0c29c9ac3c3': , 'descriptor': '{\"name\": \"ECFP\", \"parameters\": {\"radius\": 3, \"nBits\": 2048, \"returnRdkit\": false}}'}. Best is trial 0 with value: -3501.942111261296.\n", @@ -11399,7 +11399,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "The AutoML daemon functionaility in Qptuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", + "The AutoML daemon functionaility in QSARtuna automates the process of preparing data for model training, including data cleaning, feature extraction, and data formatting, streamlining the data preprocessing stage. The main aspects of this workflow are the following:\n", "\n", "* __Automated Data Preparation__: Automated process of preparing data for model training, including cleaning, feature extraction, formatting and quorum checks, streamlining data preprocessing\n", "\n", @@ -11407,9 +11407,9 @@ "\n", "* __Scalable and Efficient with Dynamic Resource Allocation__: Workflow designed to handle large datasets (with multiple prediction tasks) and dynamically utilize CPU/GPU/memory HPC resources\n", "\n", - "* __Customizable SLURM and Qptuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining Qptuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", + "* __Customizable SLURM and QSARtuna Templates__: SLURM templates can be tailored for different use cases. Both initial training and retraining QSARtuna JSON configurations are used, allowing users customise which algorithms and descriptors should be trialed. The default configuration will for e.g. train an initial ChemProp model, and subsequent models will automatically trial Transfer Learning (TL) from previous models for new data, when appropriate\n", "\n", - "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported Qptuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", + "* __Metadata, Prediction and Model Tracking__: The code includes functionality for tracking temporal performance, raw test predictions, active learning predictions and exported QSARtuna models, aiding monitoring and evaluating pseudo-prospective model performance over time\n", "\n", "* __Automatic Job Resubmission__: In case of SLURM job failures, the code provides functionality to automatically resubmit failed jobs with modified resource allocations, enhancing the robustness of the model training process\n", "\n", @@ -11417,7 +11417,7 @@ "\n", "* __Dry Run Mode__: Dry run mode option enables users to simulate the process without actually submitting jobs, useful for verifying configurations and testing the workflow\n", "\n", - "The following is an example from the Qptuna unit tests:" + "The following is an example from the QSARtuna unit tests:" ] }, { @@ -11534,7 +11534,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "Qptuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", + "QSARtuna AutoML expects temporal data (`--input-data`) to have been exported from warehouses/databases in a flat file structure in CSV format (which can also be gz compressed), containing SMILES, activity and task (which denotes each distinct property to be modelled) CSV columns. \n", "\n", "Exports are expected to be temporal in nature, with the naming convention `%Y-%m-%d` (see [here](https://docs.python.org/3/library/datetime.html#strftime-and-strptime-behavior) for details). Data can be exported in two ways:\n", "\n", @@ -11605,7 +11605,7 @@ "Then our configuration would be:\n", "\n", "```\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"../tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\ # username should be accurate to monitor jobs\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n", @@ -11690,7 +11690,7 @@ " \"--n-cores\",\n", " \"1\",\n", " \"--dry-run\", # The dry-run option is enabled, so the AutoML pipeline does not submit to SLURM\n", - " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe Qptuna AutoML behaviour \n", + " \"-vv\", # Use this CLI option to enable detailed debugging logging to observe QSARtuna AutoML behaviour \n", " \"--slurm-al-pool\",\n", " \"../tests/data/DRD2/subset-1000/train.csv\",\n", " \"--slurm-al-smiles-csv-column\",\n", @@ -11733,11 +11733,11 @@ "* resulting folder `data/TID1` comprises the following processed data:\n", " * `TID1.csv` : molecular property data set ready for modelling\n", " * `TID1.json`: config for an initial round of model training\n", - " * `TID1.sh`: used to run run Qptuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", + " * `TID1.sh`: used to run run QSARtuna AutoML via an `sbatch` command, though `-- dry-run` prevented this happening\n", " * `.24_01_01` lock file initiated to track the status of the training at this timepoint\n", "* `processed_timepoints.json` is created to track which timepoints are processed\n", "\n", - "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the Qptuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", + "The script stopped at this point, to allow for HPC resources to submit the initial optimisation job. Subsequent runs of the QSARtuna AutoML are required to progress past the initial optimisation run, and so could be scheduled (e.g. using `cron` or similar).\n", "\n", "Running the AutoML workflow does a dry-run check of the status of the run:" ] @@ -11817,7 +11817,7 @@ "ml Miniconda3\n", "conda activate my_env_with_qsartuna\n", "\n", - "qptuna-automl \n", + "qsartuna-automl \n", " --input-data \"/tests/data/automl/*\" \\\n", " --email @astrazeneca.com --user_name \\\n", " --input-smiles-csv-column canonical --input-activity-csv-column molwt \\\n",