Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
37 changes: 37 additions & 0 deletions configs/dataset/pointcloud/atlas_top_tagging.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
# Dataset loader config
# `parameters` is nested under `loader`: `data_dir` below resolves
# `dataset.loader.parameters.data_domain` and `.data_name`.
loader:
  _target_: topobench.data.loaders.pointcloud.atlas_top_tagging_loader.ATLASTopTaggingDatasetLoader
  parameters:
    data_domain: pointcloud
    data_name: atlas_top_tagging
    split: train  # Options: 'train' or 'test'
    subset: 0.01  # Fraction of dataset to use (0.01 = 1% due to large size)
    max_constituents: 80  # Maximum number of constituents per jet
    use_high_level: true  # Include high-level features
    verbose: false  # Print detailed processing information
    # Resolves to <paths.data_dir>/<data_domain>/<data_name>
    data_dir: ${paths.data_dir}/${dataset.loader.parameters.data_domain}/${dataset.loader.parameters.data_name}

# Dataset parameters
# Top-level mapping describing the learning task; kept separate from the
# loader's own nested `parameters` mapping.
parameters:
  num_features: 4  # Constituent features: pt, eta, phi, energy
  num_classes: 2  # Binary classification: signal (1) vs background (0)
  task: classification
  loss_type: cross_entropy
  monitor_metric: accuracy
  task_level: graph

# Splits
# `k` applies only to the 'k-fold' split type and `train_prop` only to the
# 'random' split type; with `split_type: random`, `k` is unused.
split_params:
  learning_setting: inductive
  data_split_dir: ${paths.data_dir}/data_splits/${dataset.loader.parameters.data_name}
  data_seed: 0
  split_type: random  # Options: 'k-fold' or 'random'
  k: 10  # For "k-fold" Cross-Validation
  train_prop: 0.5  # For "random" strategy splitting
  standardize: false  # Whether to standardize features

# Dataloader parameters
dataloader_params:
  batch_size: 64  # Batch size (can be adjusted based on memory)
  num_workers: 3  # Number of workers for data loading
  pin_memory: false  # Pin memory for faster GPU transfer
31 changes: 31 additions & 0 deletions configs/experiment/atlas_top_tagging/mlp.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,31 @@
# @package _global_

# Usage:
#   python -m topobench experiment=atlas_top_tagging/mlp

# Config groups overridden by this experiment.
defaults:
  - override /dataset: pointcloud/atlas_top_tagging
  - override /model: graph/graph_mlp
  - override /callbacks: default
  - override /trainer: default
  - override /transforms: null

# Labels attached to runs of this experiment.
tags:
  - "mlp"
  - "atlas_top_tagging"

# Random seed for the run.
seed: 42

# Trainer settings layered on top of the `default` trainer config selected
# in the defaults list.
trainer:
  min_epochs: 0
  max_epochs: 100
  gradient_clip_val: 0.5
  check_val_every_n_epoch: 1  # Run validation after every training epoch

# Model settings layered on top of the `graph/graph_mlp` model config
# selected in the defaults list.
model:
  feature_encoder:
    out_channels: 32
  backbone:
    num_layers: 2
  # NOTE(review): `compile` is placed at the model level (sibling of
  # `backbone`) — confirm against the graph_mlp model config.
  compile: false

# Metrics reported by the evaluator for this experiment.
evaluator:
  metrics: ['accuracy', 'precision', 'recall', 'auroc', 'f1']
1 change: 1 addition & 0 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,7 @@ dependencies=[
"ipykernel",
"notebook",
"jupyterlab",
"h5py",
"rich",
"ogb",
"rootutils",
Expand Down
1 change: 1 addition & 0 deletions requirements.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
h5py>=3.0.0 # Required for ATLAS Top Tagging dataset
Loading
Loading