Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@

# DATA -- Glob paths must be relative to the root of the repository: REPO / features
PARQUET_FILES = [
"ligand-only-graph-subsample/_output/ligand__SmilesToLigandFeaturizer__GraphLigandFeaturizer/ChEMBLDatasetProvider/*.parquet",
"ligand-only-graph-EGFR-subsample/_output/ligand__SmilesToLigandFeaturizer__GraphLigandFeaturizer/ChEMBLDatasetProvider/*.parquet",
]

# Model -- specified with the full import path to the class object
Expand Down Expand Up @@ -38,4 +38,4 @@
BOOTSTRAP_SAMPLE_RATIO = 1

# Output
VERBOSE = False
VERBOSE = False
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@

DATASET_CLS = "kinoml.datasets.chembl.ChEMBLDatasetProvider"
DATASET_KWARGS = {
"path_or_url": "https://github.com/openkinome/kinodata/releases/download/v0.2/activities-chembl28-sample100_v0.2.zip",
"path_or_url": "https://github.com/openkinome/kinodata/releases/download/v0.3/EGFR-activities-chembl29-sample.zip",
}

PIPELINES = {
Expand All @@ -24,14 +24,10 @@
FEATURIZE_KWARGS = {"keep": False}

GROUPS = [
[
"kinoml.datasets.groups.CallableGrouper",
{"function": "lambda measurement: measurement.system.protein.name"},
], # by kinase
[
"kinoml.datasets.groups.CallableGrouper",
{"function": "lambda measurement: type(measurement).__name__"},
], # by measurement type
]

TRAIN_TEST_VAL_KWARGS = {"idx_train": 0.8, "idx_test": 0.1, "idx_val": 0.1}
TRAIN_TEST_VAL_KWARGS = {"idx_train": 0.8, "idx_test": 0.1, "idx_val": 0.1}
9 changes: 6 additions & 3 deletions tests/experiments/test_model_ligand_only.sh
Original file line number Diff line number Diff line change
Expand Up @@ -6,8 +6,11 @@ echo "Models"

echo "Ligand only"

echo "Running model for '001_example-ligand-only-morgan1024-EGFR-subset'"
python run_notebook.py experiments/torch-train-test-debug-template.ipynb experiments/001_example-ligand-only-morgan1024-EGFR-subset.py --overwrite
echo "Running model for '001_example-ligand-only-graph-EGFR-subset'"
python run_notebook.py experiments/torch-train-test-debug-template.ipynb experiments/001_example-ligand-only-graph-EGFR-subset.py --overwrite

# echo "Running model for '001_example-ligand-only-morgan1024-EGFR-subset'"
# python run_notebook.py experiments/torch-train-test-debug-template.ipynb experiments/001_example-ligand-only-morgan1024-EGFR-subset.py --overwrite

# These won't run because there are not enough data points for each kinase on the sample data.

Expand All @@ -18,4 +21,4 @@ python run_notebook.py experiments/torch-train-test-debug-template.ipynb experim
# python run_notebook.py experiments/torch-train-test-debug-template.ipynb experiments/001_example-ligand-only-smiles-subset.py --overwrite

# echo "Running model for '001_example-ligand-only-graph-subset'"
# python run_notebook.py experiments/torch-train-test-debug-template.ipynb experiments/001_example-ligand-only-graph-subset.py --overwrite
# python run_notebook.py experiments/torch-train-test-debug-template.ipynb experiments/001_example-ligand-only-graph-subset.py --overwrite
11 changes: 5 additions & 6 deletions tests/features/test_featurization_ligand_only.sh
Original file line number Diff line number Diff line change
Expand Up @@ -7,14 +7,13 @@ echo "Featurization"
echo "Ligand only"

echo "Running featurization for 'ligand-only-morgan1024-EGFR-subsample'"
python run_notebook.py features/featurize-template.ipynb features/ligand-only-morgan1024-EGFR-subsample.py --overwrite
# python run_notebook.py features/featurize-template.ipynb features/ligand-only-morgan1024-EGFR-subsample.py --overwrite

echo "Running featurization for 'ligand-only-morgan1024-subsample'"
python run_notebook.py features/featurize-template.ipynb features/ligand-only-morgan1024-subsample.py --overwrite
# python run_notebook.py features/featurize-template.ipynb features/ligand-only-morgan1024-subsample.py --overwrite

echo "Running featurization for 'ligand-only-onehotsmiles-subsample'"
python run_notebook.py features/featurize-template.ipynb features/ligand-only-onehotsmiles-subsample.py --overwrite

echo "Running featurization for 'ligand-only-graph-subsample'"
python run_notebook.py features/featurize-template.ipynb features/ligand-only-graph-subsample.py --overwrite
# python run_notebook.py features/featurize-template.ipynb features/ligand-only-onehotsmiles-subsample.py --overwrite

echo "Running featurization for 'ligand-only-graph-EGFR-subsample'"
python run_notebook.py features/featurize-template.ipynb features/ligand-only-graph-EGFR-subsample.py --overwrite