From e8cf94741a1e9dd372080b69eb54842c5686c898 Mon Sep 17 00:00:00 2001 From: <> Date: Thu, 24 Oct 2024 15:54:36 +0000 Subject: [PATCH] Deployed 28c1166 with MkDocs version: 1.6.1 --- .nojekyll | 0 404.html | 2332 ++++ CNAME | 1 + README_backup/index.html | 2668 ++++ assets/_mkdocstrings.css | 143 + assets/images/favicon.png | Bin 0 -> 1870 bytes assets/javascripts/bundle.83f73b43.min.js | 16 + assets/javascripts/bundle.83f73b43.min.js.map | 7 + assets/javascripts/lunr/min/lunr.ar.min.js | 1 + assets/javascripts/lunr/min/lunr.da.min.js | 18 + assets/javascripts/lunr/min/lunr.de.min.js | 18 + assets/javascripts/lunr/min/lunr.du.min.js | 18 + assets/javascripts/lunr/min/lunr.el.min.js | 1 + assets/javascripts/lunr/min/lunr.es.min.js | 18 + assets/javascripts/lunr/min/lunr.fi.min.js | 18 + assets/javascripts/lunr/min/lunr.fr.min.js | 18 + assets/javascripts/lunr/min/lunr.he.min.js | 1 + assets/javascripts/lunr/min/lunr.hi.min.js | 1 + assets/javascripts/lunr/min/lunr.hu.min.js | 18 + assets/javascripts/lunr/min/lunr.hy.min.js | 1 + assets/javascripts/lunr/min/lunr.it.min.js | 18 + assets/javascripts/lunr/min/lunr.ja.min.js | 1 + assets/javascripts/lunr/min/lunr.jp.min.js | 1 + assets/javascripts/lunr/min/lunr.kn.min.js | 1 + assets/javascripts/lunr/min/lunr.ko.min.js | 1 + assets/javascripts/lunr/min/lunr.multi.min.js | 1 + assets/javascripts/lunr/min/lunr.nl.min.js | 18 + assets/javascripts/lunr/min/lunr.no.min.js | 18 + assets/javascripts/lunr/min/lunr.pt.min.js | 18 + assets/javascripts/lunr/min/lunr.ro.min.js | 18 + assets/javascripts/lunr/min/lunr.ru.min.js | 18 + assets/javascripts/lunr/min/lunr.sa.min.js | 1 + .../lunr/min/lunr.stemmer.support.min.js | 1 + assets/javascripts/lunr/min/lunr.sv.min.js | 18 + assets/javascripts/lunr/min/lunr.ta.min.js | 1 + assets/javascripts/lunr/min/lunr.te.min.js | 1 + assets/javascripts/lunr/min/lunr.th.min.js | 1 + assets/javascripts/lunr/min/lunr.tr.min.js | 18 + assets/javascripts/lunr/min/lunr.vi.min.js | 1 + 
assets/javascripts/lunr/min/lunr.zh.min.js | 1 + assets/javascripts/lunr/tinyseg.js | 206 + assets/javascripts/lunr/wordcut.js | 6708 ++++++++++ .../workers/search.6ce7567c.min.js | 42 + .../workers/search.6ce7567c.min.js.map | 7 + assets/stylesheets/main.0253249f.min.css | 1 + assets/stylesheets/main.0253249f.min.css.map | 1 + assets/stylesheets/palette.06af60db.min.css | 1 + .../stylesheets/palette.06af60db.min.css.map | 1 + configs/__init__.py | 1 + configs/callbacks/default.yaml | 19 + configs/callbacks/early_stopping.yaml | 17 + configs/callbacks/learning_rate_monitor.yaml | 3 + configs/callbacks/model_checkpoint.yaml | 19 + configs/callbacks/model_summary.yaml | 7 + configs/callbacks/rich_progress_bar.yaml | 6 + configs/callbacks/speed_monitor.yaml | 7 + configs/debug/default.yaml | 45 + configs/debug/fdr.yaml | 9 + configs/debug/limit.yaml | 12 + configs/debug/overfit.yaml | 13 + configs/debug/profiler.yaml | 12 + configs/env/cvrp.yaml | 10 + configs/env/cvrptw.yaml | 10 + configs/env/default.yaml | 6 + configs/env/dpp.yaml | 10 + configs/env/ffsp.yaml | 10 + configs/env/fjsp/10j-5m.yaml | 13 + configs/env/fjsp/15j-10m.yaml | 13 + configs/env/fjsp/20j-10m.yaml | 13 + configs/env/fjsp/20j-5m.yaml | 13 + configs/env/jssp/10j-10m.yaml | 11 + configs/env/jssp/15j-15m.yaml | 11 + configs/env/jssp/20j-20m.yaml | 11 + configs/env/jssp/6j-6m.yaml | 11 + configs/env/mdcpdp.yaml | 13 + configs/env/mdpp.yaml | 11 + configs/env/mtsp.yaml | 11 + configs/env/op.yaml | 10 + configs/env/pctsp.yaml | 9 + configs/env/pdp.yaml | 12 + configs/env/sdvrp.yaml | 10 + configs/env/spctsp.yaml | 10 + configs/env/svrp.yaml | 10 + configs/env/tsp.yaml | 10 + configs/experiment/base.yaml | 48 + configs/experiment/eda/am-a2c.yaml | 35 + configs/experiment/eda/am-ppo.yaml | 42 + configs/experiment/eda/am.yaml | 30 + configs/experiment/graph/am.yaml | 30 + configs/experiment/routing/am-a2c.yaml | 22 + configs/experiment/routing/am-ppo.yaml | 52 + configs/experiment/routing/am-svrp.yaml | 
40 + configs/experiment/routing/am-xl.yaml | 45 + configs/experiment/routing/am.yaml | 42 + configs/experiment/routing/ar-gnn.yaml | 47 + configs/experiment/routing/deepaco.yaml | 55 + configs/experiment/routing/mdpomo.yaml | 41 + configs/experiment/routing/polynet.yaml | 44 + configs/experiment/routing/pomo.yaml | 40 + configs/experiment/routing/ptrnet.yaml | 45 + configs/experiment/routing/symnco.yaml | 43 + .../experiment/routing/tsp-stepwise-ppo.yaml | 57 + configs/experiment/scheduling/am-pomo.yaml | 24 + configs/experiment/scheduling/am-ppo.yaml | 50 + configs/experiment/scheduling/base.yaml | 40 + .../experiment/scheduling/ffsp-matnet.yaml | 46 + configs/experiment/scheduling/gnn-ppo.yaml | 33 + configs/experiment/scheduling/hgnn-pomo.yaml | 28 + configs/experiment/scheduling/hgnn-ppo.yaml | 27 + .../experiment/scheduling/matnet-pomo.yaml | 38 + configs/experiment/scheduling/matnet-ppo.yaml | 42 + configs/extras/default.yaml | 8 + configs/hydra/default.yaml | 14 + configs/logger/aim.yaml | 28 + configs/logger/comet.yaml | 12 + configs/logger/csv.yaml | 7 + configs/logger/many_loggers.yaml | 9 + configs/logger/mlflow.yaml | 12 + configs/logger/neptune.yaml | 9 + configs/logger/none.yaml | 1 + configs/logger/tensorboard.yaml | 10 + configs/logger/wandb.yaml | 25 + configs/main.yaml | 65 + configs/model/am-ppo.yaml | 4 + configs/model/am.yaml | 3 + configs/model/deepaco.yaml | 3 + configs/model/default.yaml | 2 + configs/model/ham.yaml | 1 + configs/model/l2d.yaml | 1 + configs/model/matnet.yaml | 7 + configs/model/mdam.yaml | 1 + configs/model/polynet.yaml | 11 + configs/model/pomo.yaml | 10 + configs/model/ptrnet.yaml | 1 + configs/model/symnco.yaml | 10 + configs/paths/default.yaml | 18 + configs/trainer/default.yaml | 15 + docs/__pycache__/hooks.cpython-312.pyc | Bin 0 -> 3625 bytes docs/assets/figs/MIT_logo.svg | 9 + docs/assets/figs/embeddings.png | Bin 0 -> 39019 bytes docs/assets/figs/framework.png | Bin 0 -> 28745 bytes docs/assets/figs/policies.png | 
Bin 0 -> 78113 bytes docs/assets/figs/rl4co-logo.svg | 38 + docs/assets/rl4co_animated_full_tricks.svg | 77 + docs/content/api/data/index.html | 4924 ++++++++ docs/content/api/decoding/index.html | 4813 +++++++ docs/content/api/envs/base/index.html | 4258 +++++++ docs/content/api/envs/eda/index.html | 3433 +++++ docs/content/api/envs/graph/index.html | 3220 +++++ docs/content/api/envs/routing/index.html | 8716 +++++++++++++ docs/content/api/envs/scheduling/index.html | 4077 ++++++ .../api/networks/base_policies/index.html | 5525 ++++++++ .../api/networks/env_embeddings/index.html | 5568 +++++++++ .../networks/improvement_policies/index.html | 3154 +++++ docs/content/api/networks/nn/index.html | 6238 +++++++++ docs/content/api/rl/a2c/index.html | 2706 ++++ docs/content/api/rl/base/index.html | 4374 +++++++ docs/content/api/rl/ppo/index.html | 2739 ++++ docs/content/api/rl/reinforce/index.html | 5239 ++++++++ docs/content/api/tasks/index.html | 3634 ++++++ docs/content/api/train_and_eval/index.html | 2357 ++++ .../api/zoo/constructive_ar/index.html | 10435 ++++++++++++++++ .../api/zoo/constructive_nar/index.html | 5456 ++++++++ docs/content/api/zoo/improvement/index.html | 7472 +++++++++++ docs/content/api/zoo/transductive/index.html | 5314 ++++++++ docs/content/general/ai4co/index.html | 2447 ++++ docs/content/general/contribute/index.html | 2447 ++++ docs/content/general/faq/index.html | 2448 ++++ docs/content/general/licensing/index.html | 2390 ++++ docs/content/general/paper/index.html | 2445 ++++ docs/content/intro/environments/index.html | 2944 +++++ docs/content/intro/intro/index.html | 2555 ++++ docs/content/intro/policies/index.html | 2556 ++++ docs/content/intro/rl/index.html | 2498 ++++ docs/content/start/hydra/index.html | 2726 ++++ docs/content/start/installation/index.html | 2491 ++++ docs/hooks.py | 61 + docs/index.html | 2410 ++++ docs/js/autolink.js | 34 + docs/js/katex.js | 10 + docs/js/tsparticles.js | 2 + docs/overrides/fancylogo.txt | 257 + 
docs/overrides/main.html | 12 + docs/stylesheets/extra.css | 30 + docs/stylesheets/mkdocstrings.css | 54 + examples/1-quickstart/1-quickstart.ipynb | 455 + examples/1-quickstart/index.html | 3735 ++++++ .../2-full-training/2-full-training.ipynb | 937 ++ examples/2-full-training/index.html | 4469 +++++++ examples/2b-train-simple.py | 67 + examples/2d-meta_train.py | 80 + .../3-creating-new-env-model.ipynb | 941 ++ examples/3-creating-new-env-model/index.html | 4916 ++++++++ .../1-hydra-config/1-hydra-config.ipynb | 430 + examples/advanced/1-hydra-config/index.html | 3592 ++++++ .../2-flash-attention-2.ipynb | 410 + .../advanced/2-flash-attention-2/index.html | 3541 ++++++ .../3-local-search/3-local-search.ipynb | 185 + examples/advanced/3-local-search/index.html | 3235 +++++ examples/advanced/index.html | 2385 ++++ .../1-test-on-tsplib/1-test-on-tsplib.ipynb | 660 + examples/datasets/1-test-on-tsplib/index.html | 4011 ++++++ .../2-test-on-cvrplib/2-test-on-cvrplib.ipynb | 643 + .../datasets/2-test-on-cvrplib/index.html | 3958 ++++++ examples/datasets/index.html | 2385 ++++ examples/index.html | 2449 ++++ .../1-decoding-strategies.ipynb | 679 + .../modeling/1-decoding-strategies/index.html | 4269 +++++++ .../2-transductive-methods.ipynb | 436 + .../2-transductive-methods/index.html | 3625 ++++++ .../3-change-encoder/3-change-encoder.ipynb | 520 + examples/modeling/3-change-encoder/index.html | 3669 ++++++ examples/modeling/index.html | 2386 ++++ examples/other/1-mtvrp/1-mtvrp.ipynb | 647 + examples/other/1-mtvrp/index.html | 3996 ++++++ .../other/2-scheduling/2-scheduling.ipynb | 829 ++ examples/other/2-scheduling/index.html | 4336 +++++++ .../3-data-generator-distributions.ipynb | 372 + .../3-data-generator-distributions/index.html | 3483 ++++++ examples/other/index.html | 2386 ++++ index.html | 3069 +++++ objects.inv | Bin 0 -> 3291 bytes rl4co/__init__.py | 4 + rl4co/data/__init__.py | 0 rl4co/data/dataset.py | 134 + rl4co/data/generate_data.py | 397 + 
rl4co/data/transforms.py | 150 + rl4co/data/utils.py | 71 + rl4co/envs/__init__.py | 77 + rl4co/envs/common/__init__.py | 2 + rl4co/envs/common/base.py | 403 + rl4co/envs/common/distribution_utils.py | 292 + rl4co/envs/common/utils.py | 109 + rl4co/envs/eda/__init__.py | 2 + rl4co/envs/eda/dpp/__init__.py | 0 rl4co/envs/eda/dpp/env.py | 251 + rl4co/envs/eda/dpp/generator.py | 169 + rl4co/envs/eda/dpp/render.py | 84 + rl4co/envs/eda/mdpp/__init__.py | 0 rl4co/envs/eda/mdpp/env.py | 154 + rl4co/envs/eda/mdpp/generator.py | 178 + rl4co/envs/eda/mdpp/render.py | 161 + rl4co/envs/graph/__init__.py | 4 + rl4co/envs/graph/flp/__init__.py | 0 rl4co/envs/graph/flp/env.py | 169 + rl4co/envs/graph/flp/generator.py | 74 + rl4co/envs/graph/mcp/__init__.py | 0 rl4co/envs/graph/mcp/env.py | 193 + rl4co/envs/graph/mcp/generator.py | 138 + rl4co/envs/routing/__init__.py | 24 + rl4co/envs/routing/atsp/__init__.py | 0 rl4co/envs/routing/atsp/env.py | 168 + rl4co/envs/routing/atsp/generator.py | 66 + rl4co/envs/routing/atsp/render.py | 50 + rl4co/envs/routing/cvrp/__init__.py | 0 rl4co/envs/routing/cvrp/env.py | 265 + rl4co/envs/routing/cvrp/generator.py | 143 + rl4co/envs/routing/cvrp/local_search.py | 215 + rl4co/envs/routing/cvrp/render.py | 139 + rl4co/envs/routing/cvrptw/__init__.py | 0 rl4co/envs/routing/cvrptw/env.py | 287 + rl4co/envs/routing/cvrptw/generator.py | 162 + rl4co/envs/routing/cvrptw/render.py | 133 + rl4co/envs/routing/mdcpdp/__init__.py | 0 rl4co/envs/routing/mdcpdp/env.py | 400 + rl4co/envs/routing/mdcpdp/generator.py | 126 + rl4co/envs/routing/mdcpdp/render.py | 120 + rl4co/envs/routing/mpdp/__init__.py | 0 rl4co/envs/routing/mpdp/env.py | 394 + rl4co/envs/routing/mpdp/generator.py | 95 + rl4co/envs/routing/mpdp/render.py | 114 + rl4co/envs/routing/mtsp/__init__.py | 0 rl4co/envs/routing/mtsp/env.py | 240 + rl4co/envs/routing/mtsp/generator.py | 72 + rl4co/envs/routing/mtsp/render.py | 95 + rl4co/envs/routing/mtvrp/__init__.py | 0 
.../envs/routing/mtvrp/baselines/__init__.py | 0 .../envs/routing/mtvrp/baselines/constants.py | 42 + rl4co/envs/routing/mtvrp/baselines/lkh.py | 214 + rl4co/envs/routing/mtvrp/baselines/ortools.py | 248 + rl4co/envs/routing/mtvrp/baselines/pyvrp.py | 109 + rl4co/envs/routing/mtvrp/baselines/solve.py | 83 + rl4co/envs/routing/mtvrp/baselines/utils.py | 36 + rl4co/envs/routing/mtvrp/env.py | 494 + rl4co/envs/routing/mtvrp/generator.py | 436 + rl4co/envs/routing/mtvrp/render.py | 145 + rl4co/envs/routing/op/__init__.py | 0 rl4co/envs/routing/op/env.py | 257 + rl4co/envs/routing/op/generator.py | 149 + rl4co/envs/routing/op/render.py | 86 + rl4co/envs/routing/pctsp/__init__.py | 0 rl4co/envs/routing/pctsp/env.py | 279 + rl4co/envs/routing/pctsp/generator.py | 143 + rl4co/envs/routing/pctsp/render.py | 93 + rl4co/envs/routing/pdp/__init__.py | 0 rl4co/envs/routing/pdp/env.py | 530 + rl4co/envs/routing/pdp/generator.py | 152 + rl4co/envs/routing/pdp/render.py | 142 + rl4co/envs/routing/sdvrp/__init__.py | 0 rl4co/envs/routing/sdvrp/env.py | 205 + rl4co/envs/routing/spctsp/__init__.py | 0 rl4co/envs/routing/spctsp/env.py | 31 + rl4co/envs/routing/svrp/__init__.py | 0 rl4co/envs/routing/svrp/env.py | 248 + rl4co/envs/routing/svrp/generator.py | 107 + rl4co/envs/routing/svrp/render.py | 103 + rl4co/envs/routing/tsp/__init__.py | 0 rl4co/envs/routing/tsp/env.py | 601 + rl4co/envs/routing/tsp/generator.py | 99 + rl4co/envs/routing/tsp/local_search.py | 74 + rl4co/envs/routing/tsp/render.py | 110 + rl4co/envs/scheduling/__init__.py | 4 + rl4co/envs/scheduling/ffsp/__init__.py | 0 rl4co/envs/scheduling/ffsp/env.py | 453 + rl4co/envs/scheduling/ffsp/generator.py | 65 + rl4co/envs/scheduling/ffsp/render.py | 72 + rl4co/envs/scheduling/fjsp/__init__.py | 2 + rl4co/envs/scheduling/fjsp/env.py | 503 + rl4co/envs/scheduling/fjsp/generator.py | 238 + rl4co/envs/scheduling/fjsp/parser.py | 180 + rl4co/envs/scheduling/fjsp/render.py | 72 + rl4co/envs/scheduling/fjsp/utils.py | 334 + 
rl4co/envs/scheduling/jssp/__init__.py | 0 rl4co/envs/scheduling/jssp/env.py | 123 + rl4co/envs/scheduling/jssp/generator.py | 208 + rl4co/envs/scheduling/jssp/parser.py | 110 + rl4co/envs/scheduling/smtwtp/__init__.py | 0 rl4co/envs/scheduling/smtwtp/env.py | 198 + rl4co/envs/scheduling/smtwtp/generator.py | 88 + rl4co/envs/scheduling/smtwtp/render.py | 15 + rl4co/models/__init__.py | 49 + rl4co/models/common/__init__.py | 21 + rl4co/models/common/constructive/__init__.py | 15 + .../constructive/autoregressive/__init__.py | 3 + .../constructive/autoregressive/decoder.py | 13 + .../constructive/autoregressive/encoder.py | 13 + .../constructive/autoregressive/policy.py | 46 + rl4co/models/common/constructive/base.py | 268 + .../nonautoregressive/__init__.py | 9 + .../constructive/nonautoregressive/decoder.py | 40 + .../constructive/nonautoregressive/encoder.py | 13 + .../constructive/nonautoregressive/policy.py | 40 + rl4co/models/common/improvement/__init__.py | 1 + rl4co/models/common/improvement/base.py | 146 + rl4co/models/common/transductive/__init__.py | 1 + rl4co/models/common/transductive/base.py | 93 + rl4co/models/nn/__init__.py | 0 rl4co/models/nn/attention.py | 538 + rl4co/models/nn/env_embeddings/__init__.py | 4 + rl4co/models/nn/env_embeddings/context.py | 372 + rl4co/models/nn/env_embeddings/dynamic.py | 121 + rl4co/models/nn/env_embeddings/edge.py | 153 + rl4co/models/nn/env_embeddings/init.py | 512 + rl4co/models/nn/flash_attention.py | 64 + rl4co/models/nn/graph/__init__.py | 0 rl4co/models/nn/graph/attnnet.py | 103 + rl4co/models/nn/graph/gcn.py | 114 + rl4co/models/nn/graph/gnn.py | 99 + rl4co/models/nn/graph/hgnn.py | 133 + rl4co/models/nn/graph/mpnn.py | 173 + rl4co/models/nn/mlp.py | 80 + rl4co/models/nn/moe.py | 277 + rl4co/models/nn/ops.py | 137 + rl4co/models/nn/pos_embeddings.py | 159 + rl4co/models/rl/__init__.py | 6 + rl4co/models/rl/a2c/__init__.py | 0 rl4co/models/rl/a2c/a2c.py | 58 + rl4co/models/rl/common/__init__.py | 0 
rl4co/models/rl/common/base.py | 333 + rl4co/models/rl/common/critic.py | 77 + rl4co/models/rl/common/utils.py | 48 + rl4co/models/rl/ppo/__init__.py | 0 rl4co/models/rl/ppo/n_step_ppo.py | 280 + rl4co/models/rl/ppo/ppo.py | 235 + rl4co/models/rl/ppo/stepwise_ppo.py | 171 + rl4co/models/rl/reinforce/__init__.py | 0 rl4co/models/rl/reinforce/baselines.py | 311 + rl4co/models/rl/reinforce/reinforce.py | 210 + rl4co/models/zoo/__init__.py | 30 + rl4co/models/zoo/active_search/__init__.py | 1 + rl4co/models/zoo/active_search/search.py | 202 + rl4co/models/zoo/am/__init__.py | 2 + rl4co/models/zoo/am/decoder.py | 235 + rl4co/models/zoo/am/encoder.py | 91 + rl4co/models/zoo/am/model.py | 34 + rl4co/models/zoo/am/policy.py | 122 + rl4co/models/zoo/amppo/__init__.py | 1 + rl4co/models/zoo/amppo/model.py | 49 + rl4co/models/zoo/dact/__init__.py | 2 + rl4co/models/zoo/dact/decoder.py | 132 + rl4co/models/zoo/dact/encoder.py | 274 + rl4co/models/zoo/dact/model.py | 62 + rl4co/models/zoo/dact/policy.py | 188 + rl4co/models/zoo/deepaco/__init__.py | 2 + rl4co/models/zoo/deepaco/antsystem.py | 347 + rl4co/models/zoo/deepaco/model.py | 51 + rl4co/models/zoo/deepaco/policy.py | 147 + rl4co/models/zoo/eas/__init__.py | 1 + rl4co/models/zoo/eas/decoder.py | 128 + rl4co/models/zoo/eas/nn.py | 30 + rl4co/models/zoo/eas/search.py | 346 + rl4co/models/zoo/ham/__init__.py | 2 + rl4co/models/zoo/ham/attention.py | 488 + rl4co/models/zoo/ham/encoder.py | 73 + rl4co/models/zoo/ham/model.py | 37 + rl4co/models/zoo/ham/policy.py | 62 + rl4co/models/zoo/l2d/__init__.py | 2 + rl4co/models/zoo/l2d/decoder.py | 389 + rl4co/models/zoo/l2d/encoder.py | 26 + rl4co/models/zoo/l2d/model.py | 69 + rl4co/models/zoo/l2d/policy.py | 251 + rl4co/models/zoo/matnet/__init__.py | 2 + rl4co/models/zoo/matnet/decoder.py | 157 + rl4co/models/zoo/matnet/encoder.py | 224 + rl4co/models/zoo/matnet/matnet_w_sa.py | 202 + rl4co/models/zoo/matnet/model.py | 54 + rl4co/models/zoo/matnet/policy.py | 210 + 
rl4co/models/zoo/mdam/__init__.py | 2 + rl4co/models/zoo/mdam/decoder.py | 331 + rl4co/models/zoo/mdam/encoder.py | 101 + rl4co/models/zoo/mdam/mha.py | 87 + rl4co/models/zoo/mdam/model.py | 125 + rl4co/models/zoo/mdam/policy.py | 90 + rl4co/models/zoo/mvmoe/__init__.py | 2 + rl4co/models/zoo/mvmoe/model.py | 79 + rl4co/models/zoo/n2s/__init__.py | 2 + rl4co/models/zoo/n2s/decoder.py | 261 + rl4co/models/zoo/n2s/encoder.py | 217 + rl4co/models/zoo/n2s/model.py | 62 + rl4co/models/zoo/n2s/policy.py | 222 + rl4co/models/zoo/nargnn/__init__.py | 2 + rl4co/models/zoo/nargnn/encoder.py | 212 + rl4co/models/zoo/nargnn/policy.py | 107 + rl4co/models/zoo/neuopt/__init__.py | 2 + rl4co/models/zoo/neuopt/decoder.py | 77 + rl4co/models/zoo/neuopt/model.py | 62 + rl4co/models/zoo/neuopt/policy.py | 300 + rl4co/models/zoo/polynet/__init__.py | 1 + rl4co/models/zoo/polynet/decoder.py | 145 + rl4co/models/zoo/polynet/model.py | 240 + rl4co/models/zoo/polynet/policy.py | 101 + rl4co/models/zoo/pomo/__init__.py | 1 + rl4co/models/zoo/pomo/model.py | 148 + rl4co/models/zoo/ptrnet/__init__.py | 2 + rl4co/models/zoo/ptrnet/critic.py | 58 + rl4co/models/zoo/ptrnet/decoder.py | 182 + rl4co/models/zoo/ptrnet/encoder.py | 29 + rl4co/models/zoo/ptrnet/model.py | 35 + rl4co/models/zoo/ptrnet/policy.py | 107 + rl4co/models/zoo/symnco/__init__.py | 2 + rl4co/models/zoo/symnco/losses.py | 39 + rl4co/models/zoo/symnco/model.py | 142 + rl4co/models/zoo/symnco/policy.py | 91 + rl4co/tasks/__init__.py | 0 rl4co/tasks/eval.py | 591 + rl4co/tasks/index.html | 2454 ++++ rl4co/tasks/train.py | 117 + rl4co/utils/__init__.py | 11 + rl4co/utils/callbacks/__init__.py | 0 rl4co/utils/callbacks/speed_monitor.py | 123 + rl4co/utils/decoding.py | 606 + rl4co/utils/instantiators.py | 61 + rl4co/utils/lightning.py | 76 + rl4co/utils/meta_trainer.py | 170 + rl4co/utils/ops.py | 262 + rl4co/utils/optim_helpers.py | 38 + rl4co/utils/pylogger.py | 25 + rl4co/utils/rich_utils.py | 97 + rl4co/utils/test_utils.py | 71 
+ rl4co/utils/trainer.py | 152 + rl4co/utils/utils.py | 285 + search/search_index.json | 1 + sitemap.xml | 223 + sitemap.xml.gz | Bin 0 -> 678 bytes tests/__init__.py | 0 tests/test_envs.py | 157 + tests/test_policy.py | 88 + tests/test_tasks.py | 78 + tests/test_training.py | 312 + tests/test_utils.py | 52 + 480 files changed, 261376 insertions(+) create mode 100644 .nojekyll create mode 100644 404.html create mode 100644 CNAME create mode 100644 README_backup/index.html create mode 100644 assets/_mkdocstrings.css create mode 100644 assets/images/favicon.png create mode 100644 assets/javascripts/bundle.83f73b43.min.js create mode 100644 assets/javascripts/bundle.83f73b43.min.js.map create mode 100644 assets/javascripts/lunr/min/lunr.ar.min.js create mode 100644 assets/javascripts/lunr/min/lunr.da.min.js create mode 100644 assets/javascripts/lunr/min/lunr.de.min.js create mode 100644 assets/javascripts/lunr/min/lunr.du.min.js create mode 100644 assets/javascripts/lunr/min/lunr.el.min.js create mode 100644 assets/javascripts/lunr/min/lunr.es.min.js create mode 100644 assets/javascripts/lunr/min/lunr.fi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.fr.min.js create mode 100644 assets/javascripts/lunr/min/lunr.he.min.js create mode 100644 assets/javascripts/lunr/min/lunr.hi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.hu.min.js create mode 100644 assets/javascripts/lunr/min/lunr.hy.min.js create mode 100644 assets/javascripts/lunr/min/lunr.it.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ja.min.js create mode 100644 assets/javascripts/lunr/min/lunr.jp.min.js create mode 100644 assets/javascripts/lunr/min/lunr.kn.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ko.min.js create mode 100644 assets/javascripts/lunr/min/lunr.multi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.nl.min.js create mode 100644 assets/javascripts/lunr/min/lunr.no.min.js create mode 100644 assets/javascripts/lunr/min/lunr.pt.min.js 
create mode 100644 assets/javascripts/lunr/min/lunr.ro.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ru.min.js create mode 100644 assets/javascripts/lunr/min/lunr.sa.min.js create mode 100644 assets/javascripts/lunr/min/lunr.stemmer.support.min.js create mode 100644 assets/javascripts/lunr/min/lunr.sv.min.js create mode 100644 assets/javascripts/lunr/min/lunr.ta.min.js create mode 100644 assets/javascripts/lunr/min/lunr.te.min.js create mode 100644 assets/javascripts/lunr/min/lunr.th.min.js create mode 100644 assets/javascripts/lunr/min/lunr.tr.min.js create mode 100644 assets/javascripts/lunr/min/lunr.vi.min.js create mode 100644 assets/javascripts/lunr/min/lunr.zh.min.js create mode 100644 assets/javascripts/lunr/tinyseg.js create mode 100644 assets/javascripts/lunr/wordcut.js create mode 100644 assets/javascripts/workers/search.6ce7567c.min.js create mode 100644 assets/javascripts/workers/search.6ce7567c.min.js.map create mode 100644 assets/stylesheets/main.0253249f.min.css create mode 100644 assets/stylesheets/main.0253249f.min.css.map create mode 100644 assets/stylesheets/palette.06af60db.min.css create mode 100644 assets/stylesheets/palette.06af60db.min.css.map create mode 100644 configs/__init__.py create mode 100644 configs/callbacks/default.yaml create mode 100644 configs/callbacks/early_stopping.yaml create mode 100644 configs/callbacks/learning_rate_monitor.yaml create mode 100644 configs/callbacks/model_checkpoint.yaml create mode 100644 configs/callbacks/model_summary.yaml create mode 100644 configs/callbacks/rich_progress_bar.yaml create mode 100644 configs/callbacks/speed_monitor.yaml create mode 100644 configs/debug/default.yaml create mode 100644 configs/debug/fdr.yaml create mode 100644 configs/debug/limit.yaml create mode 100644 configs/debug/overfit.yaml create mode 100644 configs/debug/profiler.yaml create mode 100644 configs/env/cvrp.yaml create mode 100644 configs/env/cvrptw.yaml create mode 100644 configs/env/default.yaml create 
mode 100644 configs/env/dpp.yaml create mode 100644 configs/env/ffsp.yaml create mode 100644 configs/env/fjsp/10j-5m.yaml create mode 100644 configs/env/fjsp/15j-10m.yaml create mode 100644 configs/env/fjsp/20j-10m.yaml create mode 100644 configs/env/fjsp/20j-5m.yaml create mode 100644 configs/env/jssp/10j-10m.yaml create mode 100644 configs/env/jssp/15j-15m.yaml create mode 100644 configs/env/jssp/20j-20m.yaml create mode 100644 configs/env/jssp/6j-6m.yaml create mode 100644 configs/env/mdcpdp.yaml create mode 100644 configs/env/mdpp.yaml create mode 100644 configs/env/mtsp.yaml create mode 100644 configs/env/op.yaml create mode 100644 configs/env/pctsp.yaml create mode 100644 configs/env/pdp.yaml create mode 100644 configs/env/sdvrp.yaml create mode 100644 configs/env/spctsp.yaml create mode 100644 configs/env/svrp.yaml create mode 100644 configs/env/tsp.yaml create mode 100644 configs/experiment/base.yaml create mode 100644 configs/experiment/eda/am-a2c.yaml create mode 100644 configs/experiment/eda/am-ppo.yaml create mode 100644 configs/experiment/eda/am.yaml create mode 100644 configs/experiment/graph/am.yaml create mode 100644 configs/experiment/routing/am-a2c.yaml create mode 100644 configs/experiment/routing/am-ppo.yaml create mode 100644 configs/experiment/routing/am-svrp.yaml create mode 100644 configs/experiment/routing/am-xl.yaml create mode 100644 configs/experiment/routing/am.yaml create mode 100644 configs/experiment/routing/ar-gnn.yaml create mode 100644 configs/experiment/routing/deepaco.yaml create mode 100644 configs/experiment/routing/mdpomo.yaml create mode 100644 configs/experiment/routing/polynet.yaml create mode 100644 configs/experiment/routing/pomo.yaml create mode 100644 configs/experiment/routing/ptrnet.yaml create mode 100644 configs/experiment/routing/symnco.yaml create mode 100644 configs/experiment/routing/tsp-stepwise-ppo.yaml create mode 100644 configs/experiment/scheduling/am-pomo.yaml create mode 100644 
configs/experiment/scheduling/am-ppo.yaml create mode 100644 configs/experiment/scheduling/base.yaml create mode 100644 configs/experiment/scheduling/ffsp-matnet.yaml create mode 100644 configs/experiment/scheduling/gnn-ppo.yaml create mode 100644 configs/experiment/scheduling/hgnn-pomo.yaml create mode 100644 configs/experiment/scheduling/hgnn-ppo.yaml create mode 100644 configs/experiment/scheduling/matnet-pomo.yaml create mode 100644 configs/experiment/scheduling/matnet-ppo.yaml create mode 100644 configs/extras/default.yaml create mode 100644 configs/hydra/default.yaml create mode 100644 configs/logger/aim.yaml create mode 100644 configs/logger/comet.yaml create mode 100644 configs/logger/csv.yaml create mode 100644 configs/logger/many_loggers.yaml create mode 100644 configs/logger/mlflow.yaml create mode 100644 configs/logger/neptune.yaml create mode 100644 configs/logger/none.yaml create mode 100644 configs/logger/tensorboard.yaml create mode 100644 configs/logger/wandb.yaml create mode 100644 configs/main.yaml create mode 100644 configs/model/am-ppo.yaml create mode 100644 configs/model/am.yaml create mode 100644 configs/model/deepaco.yaml create mode 100644 configs/model/default.yaml create mode 100644 configs/model/ham.yaml create mode 100644 configs/model/l2d.yaml create mode 100644 configs/model/matnet.yaml create mode 100644 configs/model/mdam.yaml create mode 100644 configs/model/polynet.yaml create mode 100644 configs/model/pomo.yaml create mode 100644 configs/model/ptrnet.yaml create mode 100644 configs/model/symnco.yaml create mode 100644 configs/paths/default.yaml create mode 100644 configs/trainer/default.yaml create mode 100644 docs/__pycache__/hooks.cpython-312.pyc create mode 100644 docs/assets/figs/MIT_logo.svg create mode 100644 docs/assets/figs/embeddings.png create mode 100644 docs/assets/figs/framework.png create mode 100644 docs/assets/figs/policies.png create mode 100644 docs/assets/figs/rl4co-logo.svg create mode 100644 
docs/assets/rl4co_animated_full_tricks.svg create mode 100644 docs/content/api/data/index.html create mode 100644 docs/content/api/decoding/index.html create mode 100644 docs/content/api/envs/base/index.html create mode 100644 docs/content/api/envs/eda/index.html create mode 100644 docs/content/api/envs/graph/index.html create mode 100644 docs/content/api/envs/routing/index.html create mode 100644 docs/content/api/envs/scheduling/index.html create mode 100644 docs/content/api/networks/base_policies/index.html create mode 100644 docs/content/api/networks/env_embeddings/index.html create mode 100644 docs/content/api/networks/improvement_policies/index.html create mode 100644 docs/content/api/networks/nn/index.html create mode 100644 docs/content/api/rl/a2c/index.html create mode 100644 docs/content/api/rl/base/index.html create mode 100644 docs/content/api/rl/ppo/index.html create mode 100644 docs/content/api/rl/reinforce/index.html create mode 100644 docs/content/api/tasks/index.html create mode 100644 docs/content/api/train_and_eval/index.html create mode 100644 docs/content/api/zoo/constructive_ar/index.html create mode 100644 docs/content/api/zoo/constructive_nar/index.html create mode 100644 docs/content/api/zoo/improvement/index.html create mode 100644 docs/content/api/zoo/transductive/index.html create mode 100644 docs/content/general/ai4co/index.html create mode 100644 docs/content/general/contribute/index.html create mode 100644 docs/content/general/faq/index.html create mode 100644 docs/content/general/licensing/index.html create mode 100644 docs/content/general/paper/index.html create mode 100644 docs/content/intro/environments/index.html create mode 100644 docs/content/intro/intro/index.html create mode 100644 docs/content/intro/policies/index.html create mode 100644 docs/content/intro/rl/index.html create mode 100644 docs/content/start/hydra/index.html create mode 100644 docs/content/start/installation/index.html create mode 100644 docs/hooks.py create 
mode 100644 docs/index.html create mode 100644 docs/js/autolink.js create mode 100644 docs/js/katex.js create mode 100644 docs/js/tsparticles.js create mode 100644 docs/overrides/fancylogo.txt create mode 100644 docs/overrides/main.html create mode 100644 docs/stylesheets/extra.css create mode 100644 docs/stylesheets/mkdocstrings.css create mode 100644 examples/1-quickstart/1-quickstart.ipynb create mode 100644 examples/1-quickstart/index.html create mode 100644 examples/2-full-training/2-full-training.ipynb create mode 100644 examples/2-full-training/index.html create mode 100644 examples/2b-train-simple.py create mode 100644 examples/2d-meta_train.py create mode 100644 examples/3-creating-new-env-model/3-creating-new-env-model.ipynb create mode 100644 examples/3-creating-new-env-model/index.html create mode 100644 examples/advanced/1-hydra-config/1-hydra-config.ipynb create mode 100644 examples/advanced/1-hydra-config/index.html create mode 100644 examples/advanced/2-flash-attention-2/2-flash-attention-2.ipynb create mode 100644 examples/advanced/2-flash-attention-2/index.html create mode 100644 examples/advanced/3-local-search/3-local-search.ipynb create mode 100644 examples/advanced/3-local-search/index.html create mode 100644 examples/advanced/index.html create mode 100644 examples/datasets/1-test-on-tsplib/1-test-on-tsplib.ipynb create mode 100644 examples/datasets/1-test-on-tsplib/index.html create mode 100644 examples/datasets/2-test-on-cvrplib/2-test-on-cvrplib.ipynb create mode 100644 examples/datasets/2-test-on-cvrplib/index.html create mode 100644 examples/datasets/index.html create mode 100644 examples/index.html create mode 100644 examples/modeling/1-decoding-strategies/1-decoding-strategies.ipynb create mode 100644 examples/modeling/1-decoding-strategies/index.html create mode 100644 examples/modeling/2-transductive-methods/2-transductive-methods.ipynb create mode 100644 examples/modeling/2-transductive-methods/index.html create mode 100644 
examples/modeling/3-change-encoder/3-change-encoder.ipynb create mode 100644 examples/modeling/3-change-encoder/index.html create mode 100644 examples/modeling/index.html create mode 100644 examples/other/1-mtvrp/1-mtvrp.ipynb create mode 100644 examples/other/1-mtvrp/index.html create mode 100644 examples/other/2-scheduling/2-scheduling.ipynb create mode 100644 examples/other/2-scheduling/index.html create mode 100644 examples/other/3-data-generator-distributions/3-data-generator-distributions.ipynb create mode 100644 examples/other/3-data-generator-distributions/index.html create mode 100644 examples/other/index.html create mode 100644 index.html create mode 100644 objects.inv create mode 100644 rl4co/__init__.py create mode 100644 rl4co/data/__init__.py create mode 100644 rl4co/data/dataset.py create mode 100644 rl4co/data/generate_data.py create mode 100644 rl4co/data/transforms.py create mode 100644 rl4co/data/utils.py create mode 100644 rl4co/envs/__init__.py create mode 100644 rl4co/envs/common/__init__.py create mode 100644 rl4co/envs/common/base.py create mode 100644 rl4co/envs/common/distribution_utils.py create mode 100644 rl4co/envs/common/utils.py create mode 100644 rl4co/envs/eda/__init__.py create mode 100644 rl4co/envs/eda/dpp/__init__.py create mode 100644 rl4co/envs/eda/dpp/env.py create mode 100644 rl4co/envs/eda/dpp/generator.py create mode 100644 rl4co/envs/eda/dpp/render.py create mode 100644 rl4co/envs/eda/mdpp/__init__.py create mode 100644 rl4co/envs/eda/mdpp/env.py create mode 100644 rl4co/envs/eda/mdpp/generator.py create mode 100644 rl4co/envs/eda/mdpp/render.py create mode 100644 rl4co/envs/graph/__init__.py create mode 100644 rl4co/envs/graph/flp/__init__.py create mode 100644 rl4co/envs/graph/flp/env.py create mode 100644 rl4co/envs/graph/flp/generator.py create mode 100644 rl4co/envs/graph/mcp/__init__.py create mode 100644 rl4co/envs/graph/mcp/env.py create mode 100644 rl4co/envs/graph/mcp/generator.py create mode 100644 
rl4co/envs/routing/__init__.py create mode 100644 rl4co/envs/routing/atsp/__init__.py create mode 100644 rl4co/envs/routing/atsp/env.py create mode 100644 rl4co/envs/routing/atsp/generator.py create mode 100644 rl4co/envs/routing/atsp/render.py create mode 100644 rl4co/envs/routing/cvrp/__init__.py create mode 100644 rl4co/envs/routing/cvrp/env.py create mode 100644 rl4co/envs/routing/cvrp/generator.py create mode 100644 rl4co/envs/routing/cvrp/local_search.py create mode 100644 rl4co/envs/routing/cvrp/render.py create mode 100644 rl4co/envs/routing/cvrptw/__init__.py create mode 100644 rl4co/envs/routing/cvrptw/env.py create mode 100644 rl4co/envs/routing/cvrptw/generator.py create mode 100644 rl4co/envs/routing/cvrptw/render.py create mode 100644 rl4co/envs/routing/mdcpdp/__init__.py create mode 100644 rl4co/envs/routing/mdcpdp/env.py create mode 100644 rl4co/envs/routing/mdcpdp/generator.py create mode 100644 rl4co/envs/routing/mdcpdp/render.py create mode 100644 rl4co/envs/routing/mpdp/__init__.py create mode 100644 rl4co/envs/routing/mpdp/env.py create mode 100644 rl4co/envs/routing/mpdp/generator.py create mode 100644 rl4co/envs/routing/mpdp/render.py create mode 100644 rl4co/envs/routing/mtsp/__init__.py create mode 100644 rl4co/envs/routing/mtsp/env.py create mode 100644 rl4co/envs/routing/mtsp/generator.py create mode 100644 rl4co/envs/routing/mtsp/render.py create mode 100644 rl4co/envs/routing/mtvrp/__init__.py create mode 100644 rl4co/envs/routing/mtvrp/baselines/__init__.py create mode 100644 rl4co/envs/routing/mtvrp/baselines/constants.py create mode 100644 rl4co/envs/routing/mtvrp/baselines/lkh.py create mode 100644 rl4co/envs/routing/mtvrp/baselines/ortools.py create mode 100644 rl4co/envs/routing/mtvrp/baselines/pyvrp.py create mode 100644 rl4co/envs/routing/mtvrp/baselines/solve.py create mode 100644 rl4co/envs/routing/mtvrp/baselines/utils.py create mode 100644 rl4co/envs/routing/mtvrp/env.py create mode 100644 
rl4co/envs/routing/mtvrp/generator.py create mode 100644 rl4co/envs/routing/mtvrp/render.py create mode 100644 rl4co/envs/routing/op/__init__.py create mode 100644 rl4co/envs/routing/op/env.py create mode 100644 rl4co/envs/routing/op/generator.py create mode 100644 rl4co/envs/routing/op/render.py create mode 100644 rl4co/envs/routing/pctsp/__init__.py create mode 100644 rl4co/envs/routing/pctsp/env.py create mode 100644 rl4co/envs/routing/pctsp/generator.py create mode 100644 rl4co/envs/routing/pctsp/render.py create mode 100644 rl4co/envs/routing/pdp/__init__.py create mode 100644 rl4co/envs/routing/pdp/env.py create mode 100644 rl4co/envs/routing/pdp/generator.py create mode 100644 rl4co/envs/routing/pdp/render.py create mode 100644 rl4co/envs/routing/sdvrp/__init__.py create mode 100644 rl4co/envs/routing/sdvrp/env.py create mode 100644 rl4co/envs/routing/spctsp/__init__.py create mode 100644 rl4co/envs/routing/spctsp/env.py create mode 100644 rl4co/envs/routing/svrp/__init__.py create mode 100644 rl4co/envs/routing/svrp/env.py create mode 100644 rl4co/envs/routing/svrp/generator.py create mode 100644 rl4co/envs/routing/svrp/render.py create mode 100644 rl4co/envs/routing/tsp/__init__.py create mode 100644 rl4co/envs/routing/tsp/env.py create mode 100644 rl4co/envs/routing/tsp/generator.py create mode 100644 rl4co/envs/routing/tsp/local_search.py create mode 100644 rl4co/envs/routing/tsp/render.py create mode 100644 rl4co/envs/scheduling/__init__.py create mode 100644 rl4co/envs/scheduling/ffsp/__init__.py create mode 100644 rl4co/envs/scheduling/ffsp/env.py create mode 100644 rl4co/envs/scheduling/ffsp/generator.py create mode 100644 rl4co/envs/scheduling/ffsp/render.py create mode 100644 rl4co/envs/scheduling/fjsp/__init__.py create mode 100644 rl4co/envs/scheduling/fjsp/env.py create mode 100644 rl4co/envs/scheduling/fjsp/generator.py create mode 100644 rl4co/envs/scheduling/fjsp/parser.py create mode 100644 rl4co/envs/scheduling/fjsp/render.py create mode 
100644 rl4co/envs/scheduling/fjsp/utils.py create mode 100644 rl4co/envs/scheduling/jssp/__init__.py create mode 100644 rl4co/envs/scheduling/jssp/env.py create mode 100644 rl4co/envs/scheduling/jssp/generator.py create mode 100644 rl4co/envs/scheduling/jssp/parser.py create mode 100644 rl4co/envs/scheduling/smtwtp/__init__.py create mode 100644 rl4co/envs/scheduling/smtwtp/env.py create mode 100644 rl4co/envs/scheduling/smtwtp/generator.py create mode 100644 rl4co/envs/scheduling/smtwtp/render.py create mode 100644 rl4co/models/__init__.py create mode 100644 rl4co/models/common/__init__.py create mode 100644 rl4co/models/common/constructive/__init__.py create mode 100644 rl4co/models/common/constructive/autoregressive/__init__.py create mode 100644 rl4co/models/common/constructive/autoregressive/decoder.py create mode 100644 rl4co/models/common/constructive/autoregressive/encoder.py create mode 100644 rl4co/models/common/constructive/autoregressive/policy.py create mode 100644 rl4co/models/common/constructive/base.py create mode 100644 rl4co/models/common/constructive/nonautoregressive/__init__.py create mode 100644 rl4co/models/common/constructive/nonautoregressive/decoder.py create mode 100644 rl4co/models/common/constructive/nonautoregressive/encoder.py create mode 100644 rl4co/models/common/constructive/nonautoregressive/policy.py create mode 100644 rl4co/models/common/improvement/__init__.py create mode 100644 rl4co/models/common/improvement/base.py create mode 100644 rl4co/models/common/transductive/__init__.py create mode 100644 rl4co/models/common/transductive/base.py create mode 100644 rl4co/models/nn/__init__.py create mode 100644 rl4co/models/nn/attention.py create mode 100644 rl4co/models/nn/env_embeddings/__init__.py create mode 100644 rl4co/models/nn/env_embeddings/context.py create mode 100644 rl4co/models/nn/env_embeddings/dynamic.py create mode 100644 rl4co/models/nn/env_embeddings/edge.py create mode 100644 rl4co/models/nn/env_embeddings/init.py 
create mode 100644 rl4co/models/nn/flash_attention.py create mode 100644 rl4co/models/nn/graph/__init__.py create mode 100644 rl4co/models/nn/graph/attnnet.py create mode 100644 rl4co/models/nn/graph/gcn.py create mode 100644 rl4co/models/nn/graph/gnn.py create mode 100644 rl4co/models/nn/graph/hgnn.py create mode 100644 rl4co/models/nn/graph/mpnn.py create mode 100644 rl4co/models/nn/mlp.py create mode 100644 rl4co/models/nn/moe.py create mode 100644 rl4co/models/nn/ops.py create mode 100644 rl4co/models/nn/pos_embeddings.py create mode 100644 rl4co/models/rl/__init__.py create mode 100644 rl4co/models/rl/a2c/__init__.py create mode 100644 rl4co/models/rl/a2c/a2c.py create mode 100644 rl4co/models/rl/common/__init__.py create mode 100644 rl4co/models/rl/common/base.py create mode 100644 rl4co/models/rl/common/critic.py create mode 100644 rl4co/models/rl/common/utils.py create mode 100644 rl4co/models/rl/ppo/__init__.py create mode 100644 rl4co/models/rl/ppo/n_step_ppo.py create mode 100644 rl4co/models/rl/ppo/ppo.py create mode 100644 rl4co/models/rl/ppo/stepwise_ppo.py create mode 100644 rl4co/models/rl/reinforce/__init__.py create mode 100644 rl4co/models/rl/reinforce/baselines.py create mode 100644 rl4co/models/rl/reinforce/reinforce.py create mode 100644 rl4co/models/zoo/__init__.py create mode 100644 rl4co/models/zoo/active_search/__init__.py create mode 100644 rl4co/models/zoo/active_search/search.py create mode 100644 rl4co/models/zoo/am/__init__.py create mode 100644 rl4co/models/zoo/am/decoder.py create mode 100644 rl4co/models/zoo/am/encoder.py create mode 100644 rl4co/models/zoo/am/model.py create mode 100644 rl4co/models/zoo/am/policy.py create mode 100644 rl4co/models/zoo/amppo/__init__.py create mode 100644 rl4co/models/zoo/amppo/model.py create mode 100644 rl4co/models/zoo/dact/__init__.py create mode 100644 rl4co/models/zoo/dact/decoder.py create mode 100644 rl4co/models/zoo/dact/encoder.py create mode 100644 rl4co/models/zoo/dact/model.py create 
mode 100644 rl4co/models/zoo/dact/policy.py create mode 100644 rl4co/models/zoo/deepaco/__init__.py create mode 100644 rl4co/models/zoo/deepaco/antsystem.py create mode 100644 rl4co/models/zoo/deepaco/model.py create mode 100644 rl4co/models/zoo/deepaco/policy.py create mode 100644 rl4co/models/zoo/eas/__init__.py create mode 100644 rl4co/models/zoo/eas/decoder.py create mode 100644 rl4co/models/zoo/eas/nn.py create mode 100644 rl4co/models/zoo/eas/search.py create mode 100644 rl4co/models/zoo/ham/__init__.py create mode 100644 rl4co/models/zoo/ham/attention.py create mode 100644 rl4co/models/zoo/ham/encoder.py create mode 100644 rl4co/models/zoo/ham/model.py create mode 100644 rl4co/models/zoo/ham/policy.py create mode 100644 rl4co/models/zoo/l2d/__init__.py create mode 100644 rl4co/models/zoo/l2d/decoder.py create mode 100644 rl4co/models/zoo/l2d/encoder.py create mode 100644 rl4co/models/zoo/l2d/model.py create mode 100644 rl4co/models/zoo/l2d/policy.py create mode 100644 rl4co/models/zoo/matnet/__init__.py create mode 100644 rl4co/models/zoo/matnet/decoder.py create mode 100644 rl4co/models/zoo/matnet/encoder.py create mode 100644 rl4co/models/zoo/matnet/matnet_w_sa.py create mode 100644 rl4co/models/zoo/matnet/model.py create mode 100644 rl4co/models/zoo/matnet/policy.py create mode 100644 rl4co/models/zoo/mdam/__init__.py create mode 100644 rl4co/models/zoo/mdam/decoder.py create mode 100644 rl4co/models/zoo/mdam/encoder.py create mode 100644 rl4co/models/zoo/mdam/mha.py create mode 100644 rl4co/models/zoo/mdam/model.py create mode 100644 rl4co/models/zoo/mdam/policy.py create mode 100644 rl4co/models/zoo/mvmoe/__init__.py create mode 100644 rl4co/models/zoo/mvmoe/model.py create mode 100644 rl4co/models/zoo/n2s/__init__.py create mode 100644 rl4co/models/zoo/n2s/decoder.py create mode 100644 rl4co/models/zoo/n2s/encoder.py create mode 100644 rl4co/models/zoo/n2s/model.py create mode 100644 rl4co/models/zoo/n2s/policy.py create mode 100644 
rl4co/models/zoo/nargnn/__init__.py create mode 100644 rl4co/models/zoo/nargnn/encoder.py create mode 100644 rl4co/models/zoo/nargnn/policy.py create mode 100644 rl4co/models/zoo/neuopt/__init__.py create mode 100644 rl4co/models/zoo/neuopt/decoder.py create mode 100644 rl4co/models/zoo/neuopt/model.py create mode 100644 rl4co/models/zoo/neuopt/policy.py create mode 100644 rl4co/models/zoo/polynet/__init__.py create mode 100644 rl4co/models/zoo/polynet/decoder.py create mode 100644 rl4co/models/zoo/polynet/model.py create mode 100644 rl4co/models/zoo/polynet/policy.py create mode 100644 rl4co/models/zoo/pomo/__init__.py create mode 100644 rl4co/models/zoo/pomo/model.py create mode 100644 rl4co/models/zoo/ptrnet/__init__.py create mode 100644 rl4co/models/zoo/ptrnet/critic.py create mode 100644 rl4co/models/zoo/ptrnet/decoder.py create mode 100644 rl4co/models/zoo/ptrnet/encoder.py create mode 100644 rl4co/models/zoo/ptrnet/model.py create mode 100644 rl4co/models/zoo/ptrnet/policy.py create mode 100644 rl4co/models/zoo/symnco/__init__.py create mode 100644 rl4co/models/zoo/symnco/losses.py create mode 100644 rl4co/models/zoo/symnco/model.py create mode 100644 rl4co/models/zoo/symnco/policy.py create mode 100644 rl4co/tasks/__init__.py create mode 100644 rl4co/tasks/eval.py create mode 100644 rl4co/tasks/index.html create mode 100644 rl4co/tasks/train.py create mode 100644 rl4co/utils/__init__.py create mode 100644 rl4co/utils/callbacks/__init__.py create mode 100644 rl4co/utils/callbacks/speed_monitor.py create mode 100644 rl4co/utils/decoding.py create mode 100644 rl4co/utils/instantiators.py create mode 100644 rl4co/utils/lightning.py create mode 100644 rl4co/utils/meta_trainer.py create mode 100644 rl4co/utils/ops.py create mode 100644 rl4co/utils/optim_helpers.py create mode 100644 rl4co/utils/pylogger.py create mode 100644 rl4co/utils/rich_utils.py create mode 100644 rl4co/utils/test_utils.py create mode 100644 rl4co/utils/trainer.py create mode 100644 
rl4co/utils/utils.py create mode 100644 search/search_index.json create mode 100644 sitemap.xml create mode 100644 sitemap.xml.gz create mode 100644 tests/__init__.py create mode 100644 tests/test_envs.py create mode 100644 tests/test_policy.py create mode 100644 tests/test_tasks.py create mode 100644 tests/test_training.py create mode 100644 tests/test_utils.py diff --git a/.nojekyll b/.nojekyll new file mode 100644 index 00000000..e69de29b diff --git a/404.html b/404.html new file mode 100644 index 00000000..4afa6a36 --- /dev/null +++ b/404.html @@ -0,0 +1,2332 @@ + + + + + + + + + + + + + + + + + + + + + RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ +

404 - Not found

+ +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/CNAME b/CNAME new file mode 100644 index 00000000..f5e8dcc0 --- /dev/null +++ b/CNAME @@ -0,0 +1 @@ +rl4.co \ No newline at end of file diff --git a/README_backup/index.html b/README_backup/index.html new file mode 100644 index 00000000..5a0f0124 --- /dev/null +++ b/README_backup/index.html @@ -0,0 +1,2668 @@ + + + + + + + + + + + + + + + + + + + + + + + README backup - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + Skip to content + + +
+
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + +

README backup

+ +


+
+ +AI4CO Logo + +

+ + +PyTorch +Lightning +base: TorchRL +config: Hydra +Code style: black +Slack +License: MIT +Open In Colab +PyPI +Codecov +Test + +

+ Documentation | + Getting Started | + Usage | + Contributing | + Paper | + Join Us +

+ + + +
+ +

An extensive Reinforcement Learning (RL) for Combinatorial Optimization (CO) benchmark. Our goal is to provide a unified framework for RL-based CO algorithms, and to facilitate reproducible research in this field, decoupling the science from the engineering.

+

RL4CO is built upon:

+
    +
  • TorchRL: official PyTorch framework for RL algorithms and vectorized environments on GPUs
  • +
  • TensorDict: a library to easily handle heterogeneous data such as states, actions and rewards
  • +
  • PyTorch Lightning: a lightweight PyTorch wrapper for high-performance AI research
  • +
  • Hydra: a framework for elegantly configuring complex applications
  • +
+
+ RL4CO-Overview +
+ +

We offer flexible and efficient implementations of the following policies:

+
    +
  • Constructive: learn to construct a solution from scratch
      +
    • Autoregressive (AR): construct solutions one step at a time via a decoder
    • +
    • NonAutoregressive (NAR): learn to predict a heuristic, such as a heatmap, to then construct a solution
    • +
    +
  • +
  • Improvement: learn to improve a pre-existing solution
  • +
+
+ RL4CO-Policy-Overview +
+ +

We provide several utilities and a modular design. For example, we modularize reusable components such as environment embeddings, which can easily be swapped to solve new problems.

+
+ RL4CO-Env-Embedding +
+ +

Getting started

+

Open In Colab

+

RL4CO is now available for installation on pip! +

pip install rl4co
+

+

To get started, we recommend checking out our quickstart notebook or the minimalistic example below.

+

Install from source

+

The following command installs the bleeding-edge main version, useful for staying up-to-date with the latest developments - for instance, if a bug has been fixed since the last official release but a new release hasn’t been rolled out yet:

+
pip install -U git+https://github.com/ai4co/rl4co.git
+
+

Local install and development

+

If you want to develop RL4CO, we recommend installing it locally with pip in editable mode:

+
git clone https://github.com/ai4co/rl4co && cd rl4co
+pip install -e .
+
+

We recommend using a virtual environment such as conda to install rl4co locally.

+

Usage

+

Train model with default configuration (AM on TSP environment): +

python run.py
+

+
+

Tip

+

You may check out this notebook to get started with Hydra!

+
+
+ Change experiment settings + +Train model with chosen experiment configuration from [configs/experiment/](configs/experiment/) +
python run.py experiment=routing/am env=tsp env.num_loc=50 model.optimizer_kwargs.lr=2e-4
+
+Here you may change the environment, e.g. with `env=cvrp` by command line or by modifying the corresponding experiment e.g. [configs/experiment/routing/am.yaml](configs/experiment/routing/am.yaml). + +
+ +
+ Disable logging + +
python run.py experiment=routing/am logger=none '~callbacks.learning_rate_monitor'
+
+Note that `~` is used to disable a callback that would need a logger. + +
+ +
+ Create a sweep over hyperparameters (-m for multirun) + +
python run.py -m experiment=routing/am model.optimizer_kwargs.lr=1e-3,1e-4,1e-5
+
+
+ +

Minimalistic Example

+

Here is a minimalistic example training the Attention Model policy with POMO on TSP in fewer than 30 lines of code:

+
from rl4co.envs.routing import TSPEnv, TSPGenerator
+from rl4co.models import AttentionModelPolicy, POMO
+from rl4co.utils import RL4COTrainer
+
+# Instantiate generator and environment
+generator = TSPGenerator(num_loc=50, loc_distribution="uniform")
+env = TSPEnv(generator)
+
+# Create policy and RL model
+policy = AttentionModelPolicy(env_name=env.name, num_encoder_layers=6)
+model = POMO(env, policy, batch_size=64, optimizer_kwargs={"lr": 1e-4})
+
+# Instantiate Trainer and fit
+trainer = RL4COTrainer(max_epochs=10, accelerator="gpu", precision="16-mixed")
+trainer.fit(model)
+
+

Other examples can be found on our documentation!

+

Testing

+

Run tests with pytest from the root directory:

+
pytest tests
+
+

Known Bugs

+

Bugs installing PyTorch Geometric (PyG)

+

Installing PyG via Conda seems to update Torch itself. We have found that this update introduces some bugs with torchrl. At this moment, we recommend installing PyG with Pip: +

pip install torch_geometric
+

+

Contributing

+

Have a suggestion, request, or found a bug? Feel free to open an issue or submit a pull request. +If you would like to contribute, please check out our contribution guidelines here. We welcome and look forward to all contributions to RL4CO!

+

We are also on Slack if you have any questions or would like to discuss RL4CO with us. We are open to collaborations and would love to hear from you 🚀

+

Contributors

+

+ +

+

Citation

+

If you find RL4CO valuable for your research or applied projects:

+
@article{berto2024rl4co,
+    title={{RL4CO: an Extensive Reinforcement Learning for Combinatorial Optimization Benchmark}},
+    author={Federico Berto and Chuanbo Hua and Junyoung Park and Laurin Luttmann and Yining Ma and Fanchen Bu and Jiarui Wang and Haoran Ye and Minsu Kim and Sanghyeok Choi and Nayeli Gast Zepeda and Andr\'e Hottung and Jianan Zhou and Jieyi Bi and Yu Hu and Fei Liu and Hyeonah Kim and Jiwoo Son and Haeyeon Kim and Davide Angioni and Wouter Kool and Zhiguang Cao and Jie Zhang and Kijung Shin and Cathy Wu and Sungsoo Ahn and Guojie Song and Changhyun Kwon and Lin Xie and Jinkyoo Park},
+    year={2024},
+    journal={arXiv preprint arXiv:2306.17100},
+    note={\url{https://github.com/ai4co/rl4co}}
+}
+
+

Note that a previous version of RL4CO was accepted as an oral presentation at the NeurIPS 2023 GLFrontiers Workshop. Since then, the library has greatly evolved and improved!

+
+

Join us

+

Slack

+

We invite you to join our AI4CO community, an open research group in Artificial Intelligence (AI) for Combinatorial Optimization (CO)!

+
+ AI4CO Logo +
+ + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/assets/_mkdocstrings.css b/assets/_mkdocstrings.css new file mode 100644 index 00000000..b500381b --- /dev/null +++ b/assets/_mkdocstrings.css @@ -0,0 +1,143 @@ + +/* Avoid breaking parameter names, etc. in table cells. */ +.doc-contents td code { + word-break: normal !important; +} + +/* No line break before first paragraph of descriptions. */ +.doc-md-description, +.doc-md-description>p:first-child { + display: inline; +} + +/* Max width for docstring sections tables. */ +.doc .md-typeset__table, +.doc .md-typeset__table table { + display: table !important; + width: 100%; +} + +.doc .md-typeset__table tr { + display: table-row; +} + +/* Defaults in Spacy table style. */ +.doc-param-default { + float: right; +} + +/* Parameter headings must be inline, not blocks. */ +.doc-heading-parameter { + display: inline; +} + +/* Prefer space on the right, not the left of parameter permalinks. */ +.doc-heading-parameter .headerlink { + margin-left: 0 !important; + margin-right: 0.2rem; +} + +/* Backward-compatibility: docstring section titles in bold. */ +.doc-section-title { + font-weight: bold; +} + +/* Symbols in Navigation and ToC. 
*/ +:root, :host, +[data-md-color-scheme="default"] { + --doc-symbol-parameter-fg-color: #df50af; + --doc-symbol-attribute-fg-color: #953800; + --doc-symbol-function-fg-color: #8250df; + --doc-symbol-method-fg-color: #8250df; + --doc-symbol-class-fg-color: #0550ae; + --doc-symbol-module-fg-color: #5cad0f; + + --doc-symbol-parameter-bg-color: #df50af1a; + --doc-symbol-attribute-bg-color: #9538001a; + --doc-symbol-function-bg-color: #8250df1a; + --doc-symbol-method-bg-color: #8250df1a; + --doc-symbol-class-bg-color: #0550ae1a; + --doc-symbol-module-bg-color: #5cad0f1a; +} + +[data-md-color-scheme="slate"] { + --doc-symbol-parameter-fg-color: #ffa8cc; + --doc-symbol-attribute-fg-color: #ffa657; + --doc-symbol-function-fg-color: #d2a8ff; + --doc-symbol-method-fg-color: #d2a8ff; + --doc-symbol-class-fg-color: #79c0ff; + --doc-symbol-module-fg-color: #baff79; + + --doc-symbol-parameter-bg-color: #ffa8cc1a; + --doc-symbol-attribute-bg-color: #ffa6571a; + --doc-symbol-function-bg-color: #d2a8ff1a; + --doc-symbol-method-bg-color: #d2a8ff1a; + --doc-symbol-class-bg-color: #79c0ff1a; + --doc-symbol-module-bg-color: #baff791a; +} + +code.doc-symbol { + border-radius: .1rem; + font-size: .85em; + padding: 0 .3em; + font-weight: bold; +} + +code.doc-symbol-parameter { + color: var(--doc-symbol-parameter-fg-color); + background-color: var(--doc-symbol-parameter-bg-color); +} + +code.doc-symbol-parameter::after { + content: "param"; +} + +code.doc-symbol-attribute { + color: var(--doc-symbol-attribute-fg-color); + background-color: var(--doc-symbol-attribute-bg-color); +} + +code.doc-symbol-attribute::after { + content: "attr"; +} + +code.doc-symbol-function { + color: var(--doc-symbol-function-fg-color); + background-color: var(--doc-symbol-function-bg-color); +} + +code.doc-symbol-function::after { + content: "func"; +} + +code.doc-symbol-method { + color: var(--doc-symbol-method-fg-color); + background-color: var(--doc-symbol-method-bg-color); +} + 
+code.doc-symbol-method::after { + content: "meth"; +} + +code.doc-symbol-class { + color: var(--doc-symbol-class-fg-color); + background-color: var(--doc-symbol-class-bg-color); +} + +code.doc-symbol-class::after { + content: "class"; +} + +code.doc-symbol-module { + color: var(--doc-symbol-module-fg-color); + background-color: var(--doc-symbol-module-bg-color); +} + +code.doc-symbol-module::after { + content: "mod"; +} + +.doc-signature .autorefs { + color: inherit; + border-bottom: 1px dotted currentcolor; +} diff --git a/assets/images/favicon.png b/assets/images/favicon.png new file mode 100644 index 0000000000000000000000000000000000000000..1cf13b9f9d978896599290a74f77d5dbe7d1655c GIT binary patch literal 1870 zcmV-U2eJ5xP)Gc)JR9QMau)O=X#!i9;T z37kk-upj^(fsR36MHs_+1RCI)NNu9}lD0S{B^g8PN?Ww(5|~L#Ng*g{WsqleV}|#l zz8@ri&cTzw_h33bHI+12+kK6WN$h#n5cD8OQt`5kw6p~9H3()bUQ8OS4Q4HTQ=1Ol z_JAocz`fLbT2^{`8n~UAo=#AUOf=SOq4pYkt;XbC&f#7lb$*7=$na!mWCQ`dBQsO0 zLFBSPj*N?#u5&pf2t4XjEGH|=pPQ8xh7tpx;US5Cx_Ju;!O`ya-yF`)b%TEt5>eP1ZX~}sjjA%FJF?h7cX8=b!DZl<6%Cv z*G0uvvU+vmnpLZ2paivG-(cd*y3$hCIcsZcYOGh{$&)A6*XX&kXZd3G8m)G$Zz-LV z^GF3VAW^Mdv!)4OM8EgqRiz~*Cji;uzl2uC9^=8I84vNp;ltJ|q-*uQwGp2ma6cY7 z;`%`!9UXO@fr&Ebapfs34OmS9^u6$)bJxrucutf>`dKPKT%%*d3XlFVKunp9 zasduxjrjs>f8V=D|J=XNZp;_Zy^WgQ$9WDjgY=z@stwiEBm9u5*|34&1Na8BMjjgf3+SHcr`5~>oz1Y?SW^=K z^bTyO6>Gar#P_W2gEMwq)ot3; zREHn~U&Dp0l6YT0&k-wLwYjb?5zGK`W6S2v+K>AM(95m2C20L|3m~rN8dprPr@t)5lsk9Hu*W z?pS990s;Ez=+Rj{x7p``4>+c0G5^pYnB1^!TL=(?HLHZ+HicG{~4F1d^5Awl_2!1jICM-!9eoLhbbT^;yHcefyTAaqRcY zmuctDopPT!%k+}x%lZRKnzykr2}}XfG_ne?nRQO~?%hkzo;@RN{P6o`&mMUWBYMTe z6i8ChtjX&gXl`nvrU>jah)2iNM%JdjqoaeaU%yVn!^70x-flljp6Q5tK}5}&X8&&G zX3fpb3E(!rH=zVI_9Gjl45w@{(ITqngWFe7@9{mX;tO25Z_8 zQHEpI+FkTU#4xu>RkN>b3Tnc3UpWzPXWm#o55GKF09j^Mh~)K7{QqbO_~(@CVq! 
zS<8954|P8mXN2MRs86xZ&Q4EfM@JB94b=(YGuk)s&^jiSF=t3*oNK3`rD{H`yQ?d; ztE=laAUoZx5?RC8*WKOj`%LXEkgDd>&^Q4M^z`%u0rg-It=hLCVsq!Z%^6eB-OvOT zFZ28TN&cRmgU}Elrnk43)!>Z1FCPL2K$7}gwzIc48NX}#!A1BpJP?#v5wkNprhV** z?Cpalt1oH&{r!o3eSKc&ap)iz2BTn_VV`4>9M^b3;(YY}4>#ML6{~(4mH+?%07*qo IM6N<$f(jP3KmY&$ literal 0 HcmV?d00001 diff --git a/assets/javascripts/bundle.83f73b43.min.js b/assets/javascripts/bundle.83f73b43.min.js new file mode 100644 index 00000000..43d8b70f --- /dev/null +++ b/assets/javascripts/bundle.83f73b43.min.js @@ -0,0 +1,16 @@ +"use strict";(()=>{var Wi=Object.create;var gr=Object.defineProperty;var Di=Object.getOwnPropertyDescriptor;var Vi=Object.getOwnPropertyNames,Vt=Object.getOwnPropertySymbols,Ni=Object.getPrototypeOf,yr=Object.prototype.hasOwnProperty,ao=Object.prototype.propertyIsEnumerable;var io=(e,t,r)=>t in e?gr(e,t,{enumerable:!0,configurable:!0,writable:!0,value:r}):e[t]=r,$=(e,t)=>{for(var r in t||(t={}))yr.call(t,r)&&io(e,r,t[r]);if(Vt)for(var r of Vt(t))ao.call(t,r)&&io(e,r,t[r]);return e};var so=(e,t)=>{var r={};for(var o in e)yr.call(e,o)&&t.indexOf(o)<0&&(r[o]=e[o]);if(e!=null&&Vt)for(var o of Vt(e))t.indexOf(o)<0&&ao.call(e,o)&&(r[o]=e[o]);return r};var xr=(e,t)=>()=>(t||e((t={exports:{}}).exports,t),t.exports);var zi=(e,t,r,o)=>{if(t&&typeof t=="object"||typeof t=="function")for(let n of Vi(t))!yr.call(e,n)&&n!==r&&gr(e,n,{get:()=>t[n],enumerable:!(o=Di(t,n))||o.enumerable});return e};var Mt=(e,t,r)=>(r=e!=null?Wi(Ni(e)):{},zi(t||!e||!e.__esModule?gr(r,"default",{value:e,enumerable:!0}):r,e));var co=(e,t,r)=>new Promise((o,n)=>{var i=p=>{try{s(r.next(p))}catch(c){n(c)}},a=p=>{try{s(r.throw(p))}catch(c){n(c)}},s=p=>p.done?o(p.value):Promise.resolve(p.value).then(i,a);s((r=r.apply(e,t)).next())});var lo=xr((Er,po)=>{(function(e,t){typeof Er=="object"&&typeof po!="undefined"?t():typeof define=="function"&&define.amd?define(t):t()})(Er,function(){"use strict";function e(r){var 
o=!0,n=!1,i=null,a={text:!0,search:!0,url:!0,tel:!0,email:!0,password:!0,number:!0,date:!0,month:!0,week:!0,time:!0,datetime:!0,"datetime-local":!0};function s(k){return!!(k&&k!==document&&k.nodeName!=="HTML"&&k.nodeName!=="BODY"&&"classList"in k&&"contains"in k.classList)}function p(k){var ft=k.type,qe=k.tagName;return!!(qe==="INPUT"&&a[ft]&&!k.readOnly||qe==="TEXTAREA"&&!k.readOnly||k.isContentEditable)}function c(k){k.classList.contains("focus-visible")||(k.classList.add("focus-visible"),k.setAttribute("data-focus-visible-added",""))}function l(k){k.hasAttribute("data-focus-visible-added")&&(k.classList.remove("focus-visible"),k.removeAttribute("data-focus-visible-added"))}function f(k){k.metaKey||k.altKey||k.ctrlKey||(s(r.activeElement)&&c(r.activeElement),o=!0)}function u(k){o=!1}function d(k){s(k.target)&&(o||p(k.target))&&c(k.target)}function y(k){s(k.target)&&(k.target.classList.contains("focus-visible")||k.target.hasAttribute("data-focus-visible-added"))&&(n=!0,window.clearTimeout(i),i=window.setTimeout(function(){n=!1},100),l(k.target))}function L(k){document.visibilityState==="hidden"&&(n&&(o=!0),X())}function X(){document.addEventListener("mousemove",J),document.addEventListener("mousedown",J),document.addEventListener("mouseup",J),document.addEventListener("pointermove",J),document.addEventListener("pointerdown",J),document.addEventListener("pointerup",J),document.addEventListener("touchmove",J),document.addEventListener("touchstart",J),document.addEventListener("touchend",J)}function te(){document.removeEventListener("mousemove",J),document.removeEventListener("mousedown",J),document.removeEventListener("mouseup",J),document.removeEventListener("pointermove",J),document.removeEventListener("pointerdown",J),document.removeEventListener("pointerup",J),document.removeEventListener("touchmove",J),document.removeEventListener("touchstart",J),document.removeEventListener("touchend",J)}function 
J(k){k.target.nodeName&&k.target.nodeName.toLowerCase()==="html"||(o=!1,te())}document.addEventListener("keydown",f,!0),document.addEventListener("mousedown",u,!0),document.addEventListener("pointerdown",u,!0),document.addEventListener("touchstart",u,!0),document.addEventListener("visibilitychange",L,!0),X(),r.addEventListener("focus",d,!0),r.addEventListener("blur",y,!0),r.nodeType===Node.DOCUMENT_FRAGMENT_NODE&&r.host?r.host.setAttribute("data-js-focus-visible",""):r.nodeType===Node.DOCUMENT_NODE&&(document.documentElement.classList.add("js-focus-visible"),document.documentElement.setAttribute("data-js-focus-visible",""))}if(typeof window!="undefined"&&typeof document!="undefined"){window.applyFocusVisiblePolyfill=e;var t;try{t=new CustomEvent("focus-visible-polyfill-ready")}catch(r){t=document.createEvent("CustomEvent"),t.initCustomEvent("focus-visible-polyfill-ready",!1,!1,{})}window.dispatchEvent(t)}typeof document!="undefined"&&e(document)})});var qr=xr((hy,On)=>{"use strict";/*! + * escape-html + * Copyright(c) 2012-2013 TJ Holowaychuk + * Copyright(c) 2015 Andreas Lubbe + * Copyright(c) 2015 Tiancheng "Timothy" Gu + * MIT Licensed + */var $a=/["'&<>]/;On.exports=Pa;function Pa(e){var t=""+e,r=$a.exec(t);if(!r)return t;var o,n="",i=0,a=0;for(i=r.index;i{/*! 
+ * clipboard.js v2.0.11 + * https://clipboardjs.com/ + * + * Licensed MIT © Zeno Rocha + */(function(t,r){typeof It=="object"&&typeof Yr=="object"?Yr.exports=r():typeof define=="function"&&define.amd?define([],r):typeof It=="object"?It.ClipboardJS=r():t.ClipboardJS=r()})(It,function(){return function(){var e={686:function(o,n,i){"use strict";i.d(n,{default:function(){return Ui}});var a=i(279),s=i.n(a),p=i(370),c=i.n(p),l=i(817),f=i.n(l);function u(V){try{return document.execCommand(V)}catch(A){return!1}}var d=function(A){var M=f()(A);return u("cut"),M},y=d;function L(V){var A=document.documentElement.getAttribute("dir")==="rtl",M=document.createElement("textarea");M.style.fontSize="12pt",M.style.border="0",M.style.padding="0",M.style.margin="0",M.style.position="absolute",M.style[A?"right":"left"]="-9999px";var F=window.pageYOffset||document.documentElement.scrollTop;return M.style.top="".concat(F,"px"),M.setAttribute("readonly",""),M.value=V,M}var X=function(A,M){var F=L(A);M.container.appendChild(F);var D=f()(F);return u("copy"),F.remove(),D},te=function(A){var M=arguments.length>1&&arguments[1]!==void 0?arguments[1]:{container:document.body},F="";return typeof A=="string"?F=X(A,M):A instanceof HTMLInputElement&&!["text","search","url","tel","password"].includes(A==null?void 0:A.type)?F=X(A.value,M):(F=f()(A),u("copy")),F},J=te;function k(V){"@babel/helpers - typeof";return typeof Symbol=="function"&&typeof Symbol.iterator=="symbol"?k=function(M){return typeof M}:k=function(M){return M&&typeof Symbol=="function"&&M.constructor===Symbol&&M!==Symbol.prototype?"symbol":typeof M},k(V)}var ft=function(){var A=arguments.length>0&&arguments[0]!==void 0?arguments[0]:{},M=A.action,F=M===void 0?"copy":M,D=A.container,Y=A.target,$e=A.text;if(F!=="copy"&&F!=="cut")throw new Error('Invalid "action" value, use either "copy" or "cut"');if(Y!==void 0)if(Y&&k(Y)==="object"&&Y.nodeType===1){if(F==="copy"&&Y.hasAttribute("disabled"))throw new Error('Invalid "target" attribute. 
Please use "readonly" instead of "disabled" attribute');if(F==="cut"&&(Y.hasAttribute("readonly")||Y.hasAttribute("disabled")))throw new Error(`Invalid "target" attribute. You can't cut text from elements with "readonly" or "disabled" attributes`)}else throw new Error('Invalid "target" value, use a valid Element');if($e)return J($e,{container:D});if(Y)return F==="cut"?y(Y):J(Y,{container:D})},qe=ft;function Fe(V){"@babel/helpers - typeof";return typeof Symbol=="function"&&typeof Symbol.iterator=="symbol"?Fe=function(M){return typeof M}:Fe=function(M){return M&&typeof Symbol=="function"&&M.constructor===Symbol&&M!==Symbol.prototype?"symbol":typeof M},Fe(V)}function ki(V,A){if(!(V instanceof A))throw new TypeError("Cannot call a class as a function")}function no(V,A){for(var M=0;M0&&arguments[0]!==void 0?arguments[0]:{};this.action=typeof D.action=="function"?D.action:this.defaultAction,this.target=typeof D.target=="function"?D.target:this.defaultTarget,this.text=typeof D.text=="function"?D.text:this.defaultText,this.container=Fe(D.container)==="object"?D.container:document.body}},{key:"listenClick",value:function(D){var Y=this;this.listener=c()(D,"click",function($e){return Y.onClick($e)})}},{key:"onClick",value:function(D){var Y=D.delegateTarget||D.currentTarget,$e=this.action(Y)||"copy",Dt=qe({action:$e,container:this.container,target:this.target(Y),text:this.text(Y)});this.emit(Dt?"success":"error",{action:$e,text:Dt,trigger:Y,clearSelection:function(){Y&&Y.focus(),window.getSelection().removeAllRanges()}})}},{key:"defaultAction",value:function(D){return vr("action",D)}},{key:"defaultTarget",value:function(D){var Y=vr("target",D);if(Y)return document.querySelector(Y)}},{key:"defaultText",value:function(D){return vr("text",D)}},{key:"destroy",value:function(){this.listener.destroy()}}],[{key:"copy",value:function(D){var Y=arguments.length>1&&arguments[1]!==void 0?arguments[1]:{container:document.body};return J(D,Y)}},{key:"cut",value:function(D){return 
y(D)}},{key:"isSupported",value:function(){var D=arguments.length>0&&arguments[0]!==void 0?arguments[0]:["copy","cut"],Y=typeof D=="string"?[D]:D,$e=!!document.queryCommandSupported;return Y.forEach(function(Dt){$e=$e&&!!document.queryCommandSupported(Dt)}),$e}}]),M}(s()),Ui=Fi},828:function(o){var n=9;if(typeof Element!="undefined"&&!Element.prototype.matches){var i=Element.prototype;i.matches=i.matchesSelector||i.mozMatchesSelector||i.msMatchesSelector||i.oMatchesSelector||i.webkitMatchesSelector}function a(s,p){for(;s&&s.nodeType!==n;){if(typeof s.matches=="function"&&s.matches(p))return s;s=s.parentNode}}o.exports=a},438:function(o,n,i){var a=i(828);function s(l,f,u,d,y){var L=c.apply(this,arguments);return l.addEventListener(u,L,y),{destroy:function(){l.removeEventListener(u,L,y)}}}function p(l,f,u,d,y){return typeof l.addEventListener=="function"?s.apply(null,arguments):typeof u=="function"?s.bind(null,document).apply(null,arguments):(typeof l=="string"&&(l=document.querySelectorAll(l)),Array.prototype.map.call(l,function(L){return s(L,f,u,d,y)}))}function c(l,f,u,d){return function(y){y.delegateTarget=a(y.target,f),y.delegateTarget&&d.call(l,y)}}o.exports=p},879:function(o,n){n.node=function(i){return i!==void 0&&i instanceof HTMLElement&&i.nodeType===1},n.nodeList=function(i){var a=Object.prototype.toString.call(i);return i!==void 0&&(a==="[object NodeList]"||a==="[object HTMLCollection]")&&"length"in i&&(i.length===0||n.node(i[0]))},n.string=function(i){return typeof i=="string"||i instanceof String},n.fn=function(i){var a=Object.prototype.toString.call(i);return a==="[object Function]"}},370:function(o,n,i){var a=i(879),s=i(438);function p(u,d,y){if(!u&&!d&&!y)throw new Error("Missing required arguments");if(!a.string(d))throw new TypeError("Second argument must be a String");if(!a.fn(y))throw new TypeError("Third argument must be a Function");if(a.node(u))return c(u,d,y);if(a.nodeList(u))return l(u,d,y);if(a.string(u))return f(u,d,y);throw new 
TypeError("First argument must be a String, HTMLElement, HTMLCollection, or NodeList")}function c(u,d,y){return u.addEventListener(d,y),{destroy:function(){u.removeEventListener(d,y)}}}function l(u,d,y){return Array.prototype.forEach.call(u,function(L){L.addEventListener(d,y)}),{destroy:function(){Array.prototype.forEach.call(u,function(L){L.removeEventListener(d,y)})}}}function f(u,d,y){return s(document.body,u,d,y)}o.exports=p},817:function(o){function n(i){var a;if(i.nodeName==="SELECT")i.focus(),a=i.value;else if(i.nodeName==="INPUT"||i.nodeName==="TEXTAREA"){var s=i.hasAttribute("readonly");s||i.setAttribute("readonly",""),i.select(),i.setSelectionRange(0,i.value.length),s||i.removeAttribute("readonly"),a=i.value}else{i.hasAttribute("contenteditable")&&i.focus();var p=window.getSelection(),c=document.createRange();c.selectNodeContents(i),p.removeAllRanges(),p.addRange(c),a=p.toString()}return a}o.exports=n},279:function(o){function n(){}n.prototype={on:function(i,a,s){var p=this.e||(this.e={});return(p[i]||(p[i]=[])).push({fn:a,ctx:s}),this},once:function(i,a,s){var p=this;function c(){p.off(i,c),a.apply(s,arguments)}return c._=a,this.on(i,c,s)},emit:function(i){var a=[].slice.call(arguments,1),s=((this.e||(this.e={}))[i]||[]).slice(),p=0,c=s.length;for(p;p0&&i[i.length-1])&&(c[0]===6||c[0]===2)){r=0;continue}if(c[0]===3&&(!i||c[1]>i[0]&&c[1]=e.length&&(e=void 0),{value:e&&e[o++],done:!e}}};throw new TypeError(t?"Object is not iterable.":"Symbol.iterator is not defined.")}function N(e,t){var r=typeof Symbol=="function"&&e[Symbol.iterator];if(!r)return e;var o=r.call(e),n,i=[],a;try{for(;(t===void 0||t-- >0)&&!(n=o.next()).done;)i.push(n.value)}catch(s){a={error:s}}finally{try{n&&!n.done&&(r=o.return)&&r.call(o)}finally{if(a)throw a.error}}return i}function q(e,t,r){if(r||arguments.length===2)for(var o=0,n=t.length,i;o1||p(d,L)})},y&&(n[d]=y(n[d])))}function p(d,y){try{c(o[d](y))}catch(L){u(i[0][3],L)}}function c(d){d.value instanceof 
nt?Promise.resolve(d.value.v).then(l,f):u(i[0][2],d)}function l(d){p("next",d)}function f(d){p("throw",d)}function u(d,y){d(y),i.shift(),i.length&&p(i[0][0],i[0][1])}}function uo(e){if(!Symbol.asyncIterator)throw new TypeError("Symbol.asyncIterator is not defined.");var t=e[Symbol.asyncIterator],r;return t?t.call(e):(e=typeof he=="function"?he(e):e[Symbol.iterator](),r={},o("next"),o("throw"),o("return"),r[Symbol.asyncIterator]=function(){return this},r);function o(i){r[i]=e[i]&&function(a){return new Promise(function(s,p){a=e[i](a),n(s,p,a.done,a.value)})}}function n(i,a,s,p){Promise.resolve(p).then(function(c){i({value:c,done:s})},a)}}function H(e){return typeof e=="function"}function ut(e){var t=function(o){Error.call(o),o.stack=new Error().stack},r=e(t);return r.prototype=Object.create(Error.prototype),r.prototype.constructor=r,r}var zt=ut(function(e){return function(r){e(this),this.message=r?r.length+` errors occurred during unsubscription: +`+r.map(function(o,n){return n+1+") "+o.toString()}).join(` + `):"",this.name="UnsubscriptionError",this.errors=r}});function Qe(e,t){if(e){var r=e.indexOf(t);0<=r&&e.splice(r,1)}}var Ue=function(){function e(t){this.initialTeardown=t,this.closed=!1,this._parentage=null,this._finalizers=null}return e.prototype.unsubscribe=function(){var t,r,o,n,i;if(!this.closed){this.closed=!0;var a=this._parentage;if(a)if(this._parentage=null,Array.isArray(a))try{for(var s=he(a),p=s.next();!p.done;p=s.next()){var c=p.value;c.remove(this)}}catch(L){t={error:L}}finally{try{p&&!p.done&&(r=s.return)&&r.call(s)}finally{if(t)throw t.error}}else a.remove(this);var l=this.initialTeardown;if(H(l))try{l()}catch(L){i=L instanceof zt?L.errors:[L]}var f=this._finalizers;if(f){this._finalizers=null;try{for(var u=he(f),d=u.next();!d.done;d=u.next()){var y=d.value;try{ho(y)}catch(L){i=i!=null?i:[],L instanceof zt?i=q(q([],N(i)),N(L.errors)):i.push(L)}}}catch(L){o={error:L}}finally{try{d&&!d.done&&(n=u.return)&&n.call(u)}finally{if(o)throw 
o.error}}}if(i)throw new zt(i)}},e.prototype.add=function(t){var r;if(t&&t!==this)if(this.closed)ho(t);else{if(t instanceof e){if(t.closed||t._hasParent(this))return;t._addParent(this)}(this._finalizers=(r=this._finalizers)!==null&&r!==void 0?r:[]).push(t)}},e.prototype._hasParent=function(t){var r=this._parentage;return r===t||Array.isArray(r)&&r.includes(t)},e.prototype._addParent=function(t){var r=this._parentage;this._parentage=Array.isArray(r)?(r.push(t),r):r?[r,t]:t},e.prototype._removeParent=function(t){var r=this._parentage;r===t?this._parentage=null:Array.isArray(r)&&Qe(r,t)},e.prototype.remove=function(t){var r=this._finalizers;r&&Qe(r,t),t instanceof e&&t._removeParent(this)},e.EMPTY=function(){var t=new e;return t.closed=!0,t}(),e}();var Tr=Ue.EMPTY;function qt(e){return e instanceof Ue||e&&"closed"in e&&H(e.remove)&&H(e.add)&&H(e.unsubscribe)}function ho(e){H(e)?e():e.unsubscribe()}var Pe={onUnhandledError:null,onStoppedNotification:null,Promise:void 0,useDeprecatedSynchronousErrorHandling:!1,useDeprecatedNextContext:!1};var dt={setTimeout:function(e,t){for(var r=[],o=2;o0},enumerable:!1,configurable:!0}),t.prototype._trySubscribe=function(r){return this._throwIfClosed(),e.prototype._trySubscribe.call(this,r)},t.prototype._subscribe=function(r){return this._throwIfClosed(),this._checkFinalizedStatuses(r),this._innerSubscribe(r)},t.prototype._innerSubscribe=function(r){var o=this,n=this,i=n.hasError,a=n.isStopped,s=n.observers;return i||a?Tr:(this.currentObservers=null,s.push(r),new Ue(function(){o.currentObservers=null,Qe(s,r)}))},t.prototype._checkFinalizedStatuses=function(r){var o=this,n=o.hasError,i=o.thrownError,a=o.isStopped;n?r.error(i):a&&r.complete()},t.prototype.asObservable=function(){var r=new j;return r.source=this,r},t.create=function(r,o){return new To(r,o)},t}(j);var To=function(e){oe(t,e);function t(r,o){var n=e.call(this)||this;return n.destination=r,n.source=o,n}return t.prototype.next=function(r){var 
o,n;(n=(o=this.destination)===null||o===void 0?void 0:o.next)===null||n===void 0||n.call(o,r)},t.prototype.error=function(r){var o,n;(n=(o=this.destination)===null||o===void 0?void 0:o.error)===null||n===void 0||n.call(o,r)},t.prototype.complete=function(){var r,o;(o=(r=this.destination)===null||r===void 0?void 0:r.complete)===null||o===void 0||o.call(r)},t.prototype._subscribe=function(r){var o,n;return(n=(o=this.source)===null||o===void 0?void 0:o.subscribe(r))!==null&&n!==void 0?n:Tr},t}(g);var _r=function(e){oe(t,e);function t(r){var o=e.call(this)||this;return o._value=r,o}return Object.defineProperty(t.prototype,"value",{get:function(){return this.getValue()},enumerable:!1,configurable:!0}),t.prototype._subscribe=function(r){var o=e.prototype._subscribe.call(this,r);return!o.closed&&r.next(this._value),o},t.prototype.getValue=function(){var r=this,o=r.hasError,n=r.thrownError,i=r._value;if(o)throw n;return this._throwIfClosed(),i},t.prototype.next=function(r){e.prototype.next.call(this,this._value=r)},t}(g);var At={now:function(){return(At.delegate||Date).now()},delegate:void 0};var Ct=function(e){oe(t,e);function t(r,o,n){r===void 0&&(r=1/0),o===void 0&&(o=1/0),n===void 0&&(n=At);var i=e.call(this)||this;return i._bufferSize=r,i._windowTime=o,i._timestampProvider=n,i._buffer=[],i._infiniteTimeWindow=!0,i._infiniteTimeWindow=o===1/0,i._bufferSize=Math.max(1,r),i._windowTime=Math.max(1,o),i}return t.prototype.next=function(r){var o=this,n=o.isStopped,i=o._buffer,a=o._infiniteTimeWindow,s=o._timestampProvider,p=o._windowTime;n||(i.push(r),!a&&i.push(s.now()+p)),this._trimBuffer(),e.prototype.next.call(this,r)},t.prototype._subscribe=function(r){this._throwIfClosed(),this._trimBuffer();for(var o=this._innerSubscribe(r),n=this,i=n._infiniteTimeWindow,a=n._buffer,s=a.slice(),p=0;p0?e.prototype.schedule.call(this,r,o):(this.delay=o,this.state=r,this.scheduler.flush(this),this)},t.prototype.execute=function(r,o){return 
o>0||this.closed?e.prototype.execute.call(this,r,o):this._execute(r,o)},t.prototype.requestAsyncId=function(r,o,n){return n===void 0&&(n=0),n!=null&&n>0||n==null&&this.delay>0?e.prototype.requestAsyncId.call(this,r,o,n):(r.flush(this),0)},t}(gt);var Lo=function(e){oe(t,e);function t(){return e!==null&&e.apply(this,arguments)||this}return t}(yt);var kr=new Lo(Oo);var Mo=function(e){oe(t,e);function t(r,o){var n=e.call(this,r,o)||this;return n.scheduler=r,n.work=o,n}return t.prototype.requestAsyncId=function(r,o,n){return n===void 0&&(n=0),n!==null&&n>0?e.prototype.requestAsyncId.call(this,r,o,n):(r.actions.push(this),r._scheduled||(r._scheduled=vt.requestAnimationFrame(function(){return r.flush(void 0)})))},t.prototype.recycleAsyncId=function(r,o,n){var i;if(n===void 0&&(n=0),n!=null?n>0:this.delay>0)return e.prototype.recycleAsyncId.call(this,r,o,n);var a=r.actions;o!=null&&((i=a[a.length-1])===null||i===void 0?void 0:i.id)!==o&&(vt.cancelAnimationFrame(o),r._scheduled=void 0)},t}(gt);var _o=function(e){oe(t,e);function t(){return e!==null&&e.apply(this,arguments)||this}return t.prototype.flush=function(r){this._active=!0;var o=this._scheduled;this._scheduled=void 0;var n=this.actions,i;r=r||n.shift();do if(i=r.execute(r.state,r.delay))break;while((r=n[0])&&r.id===o&&n.shift());if(this._active=!1,i){for(;(r=n[0])&&r.id===o&&n.shift();)r.unsubscribe();throw i}},t}(yt);var me=new _o(Mo);var S=new j(function(e){return e.complete()});function Yt(e){return e&&H(e.schedule)}function Hr(e){return e[e.length-1]}function Xe(e){return H(Hr(e))?e.pop():void 0}function ke(e){return Yt(Hr(e))?e.pop():void 0}function Bt(e,t){return typeof Hr(e)=="number"?e.pop():t}var xt=function(e){return e&&typeof e.length=="number"&&typeof e!="function"};function Gt(e){return H(e==null?void 0:e.then)}function Jt(e){return H(e[bt])}function Xt(e){return Symbol.asyncIterator&&H(e==null?void 0:e[Symbol.asyncIterator])}function Zt(e){return new TypeError("You provided "+(e!==null&&typeof 
e=="object"?"an invalid object":"'"+e+"'")+" where a stream was expected. You can provide an Observable, Promise, ReadableStream, Array, AsyncIterable, or Iterable.")}function Zi(){return typeof Symbol!="function"||!Symbol.iterator?"@@iterator":Symbol.iterator}var er=Zi();function tr(e){return H(e==null?void 0:e[er])}function rr(e){return fo(this,arguments,function(){var r,o,n,i;return Nt(this,function(a){switch(a.label){case 0:r=e.getReader(),a.label=1;case 1:a.trys.push([1,,9,10]),a.label=2;case 2:return[4,nt(r.read())];case 3:return o=a.sent(),n=o.value,i=o.done,i?[4,nt(void 0)]:[3,5];case 4:return[2,a.sent()];case 5:return[4,nt(n)];case 6:return[4,a.sent()];case 7:return a.sent(),[3,2];case 8:return[3,10];case 9:return r.releaseLock(),[7];case 10:return[2]}})})}function or(e){return H(e==null?void 0:e.getReader)}function U(e){if(e instanceof j)return e;if(e!=null){if(Jt(e))return ea(e);if(xt(e))return ta(e);if(Gt(e))return ra(e);if(Xt(e))return Ao(e);if(tr(e))return oa(e);if(or(e))return na(e)}throw Zt(e)}function ea(e){return new j(function(t){var r=e[bt]();if(H(r.subscribe))return r.subscribe(t);throw new TypeError("Provided object does not correctly implement Symbol.observable")})}function ta(e){return new j(function(t){for(var r=0;r=2;return function(o){return o.pipe(e?b(function(n,i){return e(n,i,o)}):le,Te(1),r?De(t):Qo(function(){return new ir}))}}function jr(e){return e<=0?function(){return S}:E(function(t,r){var o=[];t.subscribe(T(r,function(n){o.push(n),e=2,!0))}function pe(e){e===void 0&&(e={});var t=e.connector,r=t===void 0?function(){return new g}:t,o=e.resetOnError,n=o===void 0?!0:o,i=e.resetOnComplete,a=i===void 0?!0:i,s=e.resetOnRefCountZero,p=s===void 0?!0:s;return function(c){var l,f,u,d=0,y=!1,L=!1,X=function(){f==null||f.unsubscribe(),f=void 0},te=function(){X(),l=u=void 0,y=L=!1},J=function(){var k=l;te(),k==null||k.unsubscribe()};return E(function(k,ft){d++,!L&&!y&&X();var 
qe=u=u!=null?u:r();ft.add(function(){d--,d===0&&!L&&!y&&(f=Ur(J,p))}),qe.subscribe(ft),!l&&d>0&&(l=new at({next:function(Fe){return qe.next(Fe)},error:function(Fe){L=!0,X(),f=Ur(te,n,Fe),qe.error(Fe)},complete:function(){y=!0,X(),f=Ur(te,a),qe.complete()}}),U(k).subscribe(l))})(c)}}function Ur(e,t){for(var r=[],o=2;oe.next(document)),e}function P(e,t=document){return Array.from(t.querySelectorAll(e))}function R(e,t=document){let r=fe(e,t);if(typeof r=="undefined")throw new ReferenceError(`Missing element: expected "${e}" to be present`);return r}function fe(e,t=document){return t.querySelector(e)||void 0}function Ie(){var e,t,r,o;return(o=(r=(t=(e=document.activeElement)==null?void 0:e.shadowRoot)==null?void 0:t.activeElement)!=null?r:document.activeElement)!=null?o:void 0}var wa=O(h(document.body,"focusin"),h(document.body,"focusout")).pipe(_e(1),Q(void 0),m(()=>Ie()||document.body),G(1));function et(e){return wa.pipe(m(t=>e.contains(t)),K())}function $t(e,t){return C(()=>O(h(e,"mouseenter").pipe(m(()=>!0)),h(e,"mouseleave").pipe(m(()=>!1))).pipe(t?Ht(r=>Le(+!r*t)):le,Q(e.matches(":hover"))))}function Jo(e,t){if(typeof t=="string"||typeof t=="number")e.innerHTML+=t.toString();else if(t instanceof Node)e.appendChild(t);else if(Array.isArray(t))for(let r of t)Jo(e,r)}function x(e,t,...r){let o=document.createElement(e);if(t)for(let n of Object.keys(t))typeof t[n]!="undefined"&&(typeof t[n]!="boolean"?o.setAttribute(n,t[n]):o.setAttribute(n,""));for(let n of r)Jo(o,n);return o}function sr(e){if(e>999){let t=+((e-950)%1e3>99);return`${((e+1e-6)/1e3).toFixed(t)}k`}else return e.toString()}function Tt(e){let t=x("script",{src:e});return C(()=>(document.head.appendChild(t),O(h(t,"load"),h(t,"error").pipe(v(()=>$r(()=>new ReferenceError(`Invalid script: ${e}`))))).pipe(m(()=>{}),_(()=>document.head.removeChild(t)),Te(1))))}var Xo=new g,Ta=C(()=>typeof ResizeObserver=="undefined"?Tt("https://unpkg.com/resize-observer-polyfill"):I(void 0)).pipe(m(()=>new 
ResizeObserver(e=>e.forEach(t=>Xo.next(t)))),v(e=>O(Ye,I(e)).pipe(_(()=>e.disconnect()))),G(1));function ce(e){return{width:e.offsetWidth,height:e.offsetHeight}}function ge(e){let t=e;for(;t.clientWidth===0&&t.parentElement;)t=t.parentElement;return Ta.pipe(w(r=>r.observe(t)),v(r=>Xo.pipe(b(o=>o.target===t),_(()=>r.unobserve(t)))),m(()=>ce(e)),Q(ce(e)))}function St(e){return{width:e.scrollWidth,height:e.scrollHeight}}function cr(e){let t=e.parentElement;for(;t&&(e.scrollWidth<=t.scrollWidth&&e.scrollHeight<=t.scrollHeight);)t=(e=t).parentElement;return t?e:void 0}function Zo(e){let t=[],r=e.parentElement;for(;r;)(e.clientWidth>r.clientWidth||e.clientHeight>r.clientHeight)&&t.push(r),r=(e=r).parentElement;return t.length===0&&t.push(document.documentElement),t}function Ve(e){return{x:e.offsetLeft,y:e.offsetTop}}function en(e){let t=e.getBoundingClientRect();return{x:t.x+window.scrollX,y:t.y+window.scrollY}}function tn(e){return O(h(window,"load"),h(window,"resize")).pipe(Me(0,me),m(()=>Ve(e)),Q(Ve(e)))}function pr(e){return{x:e.scrollLeft,y:e.scrollTop}}function Ne(e){return O(h(e,"scroll"),h(window,"scroll"),h(window,"resize")).pipe(Me(0,me),m(()=>pr(e)),Q(pr(e)))}var rn=new g,Sa=C(()=>I(new IntersectionObserver(e=>{for(let t of e)rn.next(t)},{threshold:0}))).pipe(v(e=>O(Ye,I(e)).pipe(_(()=>e.disconnect()))),G(1));function tt(e){return Sa.pipe(w(t=>t.observe(e)),v(t=>rn.pipe(b(({target:r})=>r===e),_(()=>t.unobserve(e)),m(({isIntersecting:r})=>r))))}function on(e,t=16){return Ne(e).pipe(m(({y:r})=>{let o=ce(e),n=St(e);return r>=n.height-o.height-t}),K())}var lr={drawer:R("[data-md-toggle=drawer]"),search:R("[data-md-toggle=search]")};function nn(e){return lr[e].checked}function Je(e,t){lr[e].checked!==t&&lr[e].click()}function ze(e){let t=lr[e];return h(t,"change").pipe(m(()=>t.checked),Q(t.checked))}function Oa(e,t){switch(e.constructor){case HTMLInputElement:return e.type==="radio"?/^Arrow/.test(t):!0;case HTMLSelectElement:case 
HTMLTextAreaElement:return!0;default:return e.isContentEditable}}function La(){return O(h(window,"compositionstart").pipe(m(()=>!0)),h(window,"compositionend").pipe(m(()=>!1))).pipe(Q(!1))}function an(){let e=h(window,"keydown").pipe(b(t=>!(t.metaKey||t.ctrlKey)),m(t=>({mode:nn("search")?"search":"global",type:t.key,claim(){t.preventDefault(),t.stopPropagation()}})),b(({mode:t,type:r})=>{if(t==="global"){let o=Ie();if(typeof o!="undefined")return!Oa(o,r)}return!0}),pe());return La().pipe(v(t=>t?S:e))}function ye(){return new URL(location.href)}function lt(e,t=!1){if(B("navigation.instant")&&!t){let r=x("a",{href:e.href});document.body.appendChild(r),r.click(),r.remove()}else location.href=e.href}function sn(){return new g}function cn(){return location.hash.slice(1)}function pn(e){let t=x("a",{href:e});t.addEventListener("click",r=>r.stopPropagation()),t.click()}function Ma(e){return O(h(window,"hashchange"),e).pipe(m(cn),Q(cn()),b(t=>t.length>0),G(1))}function ln(e){return Ma(e).pipe(m(t=>fe(`[id="${t}"]`)),b(t=>typeof t!="undefined"))}function Pt(e){let t=matchMedia(e);return ar(r=>t.addListener(()=>r(t.matches))).pipe(Q(t.matches))}function mn(){let e=matchMedia("print");return O(h(window,"beforeprint").pipe(m(()=>!0)),h(window,"afterprint").pipe(m(()=>!1))).pipe(Q(e.matches))}function Nr(e,t){return e.pipe(v(r=>r?t():S))}function zr(e,t){return new j(r=>{let o=new XMLHttpRequest;return o.open("GET",`${e}`),o.responseType="blob",o.addEventListener("load",()=>{o.status>=200&&o.status<300?(r.next(o.response),r.complete()):r.error(new Error(o.statusText))}),o.addEventListener("error",()=>{r.error(new Error("Network error"))}),o.addEventListener("abort",()=>{r.complete()}),typeof(t==null?void 0:t.progress$)!="undefined"&&(o.addEventListener("progress",n=>{var i;if(n.lengthComputable)t.progress$.next(n.loaded/n.total*100);else{let 
a=(i=o.getResponseHeader("Content-Length"))!=null?i:0;t.progress$.next(n.loaded/+a*100)}}),t.progress$.next(5)),o.send(),()=>o.abort()})}function je(e,t){return zr(e,t).pipe(v(r=>r.text()),m(r=>JSON.parse(r)),G(1))}function fn(e,t){let r=new DOMParser;return zr(e,t).pipe(v(o=>o.text()),m(o=>r.parseFromString(o,"text/html")),G(1))}function un(e,t){let r=new DOMParser;return zr(e,t).pipe(v(o=>o.text()),m(o=>r.parseFromString(o,"text/xml")),G(1))}function dn(){return{x:Math.max(0,scrollX),y:Math.max(0,scrollY)}}function hn(){return O(h(window,"scroll",{passive:!0}),h(window,"resize",{passive:!0})).pipe(m(dn),Q(dn()))}function bn(){return{width:innerWidth,height:innerHeight}}function vn(){return h(window,"resize",{passive:!0}).pipe(m(bn),Q(bn()))}function gn(){return z([hn(),vn()]).pipe(m(([e,t])=>({offset:e,size:t})),G(1))}function mr(e,{viewport$:t,header$:r}){let o=t.pipe(ee("size")),n=z([o,r]).pipe(m(()=>Ve(e)));return z([r,t,n]).pipe(m(([{height:i},{offset:a,size:s},{x:p,y:c}])=>({offset:{x:a.x-p,y:a.y-c+i},size:s})))}function _a(e){return h(e,"message",t=>t.data)}function Aa(e){let t=new g;return t.subscribe(r=>e.postMessage(r)),t}function yn(e,t=new Worker(e)){let r=_a(t),o=Aa(t),n=new g;n.subscribe(o);let i=o.pipe(Z(),ie(!0));return n.pipe(Z(),Re(r.pipe(W(i))),pe())}var Ca=R("#__config"),Ot=JSON.parse(Ca.textContent);Ot.base=`${new URL(Ot.base,ye())}`;function xe(){return Ot}function B(e){return Ot.features.includes(e)}function Ee(e,t){return typeof t!="undefined"?Ot.translations[e].replace("#",t.toString()):Ot.translations[e]}function Se(e,t=document){return R(`[data-md-component=${e}]`,t)}function ae(e,t=document){return P(`[data-md-component=${e}]`,t)}function ka(e){let t=R(".md-typeset > :first-child",e);return h(t,"click",{once:!0}).pipe(m(()=>R(".md-typeset",e)),m(r=>({hash:__md_hash(r.innerHTML)})))}function xn(e){if(!B("announce.dismiss")||!e.childElementCount)return S;if(!e.hidden){let 
t=R(".md-typeset",e);__md_hash(t.innerHTML)===__md_get("__announce")&&(e.hidden=!0)}return C(()=>{let t=new g;return t.subscribe(({hash:r})=>{e.hidden=!0,__md_set("__announce",r)}),ka(e).pipe(w(r=>t.next(r)),_(()=>t.complete()),m(r=>$({ref:e},r)))})}function Ha(e,{target$:t}){return t.pipe(m(r=>({hidden:r!==e})))}function En(e,t){let r=new g;return r.subscribe(({hidden:o})=>{e.hidden=o}),Ha(e,t).pipe(w(o=>r.next(o)),_(()=>r.complete()),m(o=>$({ref:e},o)))}function Rt(e,t){return t==="inline"?x("div",{class:"md-tooltip md-tooltip--inline",id:e,role:"tooltip"},x("div",{class:"md-tooltip__inner md-typeset"})):x("div",{class:"md-tooltip",id:e,role:"tooltip"},x("div",{class:"md-tooltip__inner md-typeset"}))}function wn(...e){return x("div",{class:"md-tooltip2",role:"tooltip"},x("div",{class:"md-tooltip2__inner md-typeset"},e))}function Tn(e,t){if(t=t?`${t}_annotation_${e}`:void 0,t){let r=t?`#${t}`:void 0;return x("aside",{class:"md-annotation",tabIndex:0},Rt(t),x("a",{href:r,class:"md-annotation__index",tabIndex:-1},x("span",{"data-md-annotation-id":e})))}else return x("aside",{class:"md-annotation",tabIndex:0},Rt(t),x("span",{class:"md-annotation__index",tabIndex:-1},x("span",{"data-md-annotation-id":e})))}function Sn(e){return x("button",{class:"md-clipboard md-icon",title:Ee("clipboard.copy"),"data-clipboard-target":`#${e} > code`})}var Ln=Mt(qr());function Qr(e,t){let r=t&2,o=t&1,n=Object.keys(e.terms).filter(p=>!e.terms[p]).reduce((p,c)=>[...p,x("del",null,(0,Ln.default)(c))," "],[]).slice(0,-1),i=xe(),a=new URL(e.location,i.base);B("search.highlight")&&a.searchParams.set("h",Object.entries(e.terms).filter(([,p])=>p).reduce((p,[c])=>`${p} ${c}`.trim(),""));let{tags:s}=xe();return x("a",{href:`${a}`,class:"md-search-result__link",tabIndex:-1},x("article",{class:"md-search-result__article md-typeset","data-md-score":e.score.toFixed(2)},r>0&&x("div",{class:"md-search-result__icon 
md-icon"}),r>0&&x("h1",null,e.title),r<=0&&x("h2",null,e.title),o>0&&e.text.length>0&&e.text,e.tags&&x("nav",{class:"md-tags"},e.tags.map(p=>{let c=s?p in s?`md-tag-icon md-tag--${s[p]}`:"md-tag-icon":"";return x("span",{class:`md-tag ${c}`},p)})),o>0&&n.length>0&&x("p",{class:"md-search-result__terms"},Ee("search.result.term.missing"),": ",...n)))}function Mn(e){let t=e[0].score,r=[...e],o=xe(),n=r.findIndex(l=>!`${new URL(l.location,o.base)}`.includes("#")),[i]=r.splice(n,1),a=r.findIndex(l=>l.scoreQr(l,1)),...p.length?[x("details",{class:"md-search-result__more"},x("summary",{tabIndex:-1},x("div",null,p.length>0&&p.length===1?Ee("search.result.more.one"):Ee("search.result.more.other",p.length))),...p.map(l=>Qr(l,1)))]:[]];return x("li",{class:"md-search-result__item"},c)}function _n(e){return x("ul",{class:"md-source__facts"},Object.entries(e).map(([t,r])=>x("li",{class:`md-source__fact md-source__fact--${t}`},typeof r=="number"?sr(r):r)))}function Kr(e){let t=`tabbed-control tabbed-control--${e}`;return x("div",{class:t,hidden:!0},x("button",{class:"tabbed-button",tabIndex:-1,"aria-hidden":"true"}))}function An(e){return x("div",{class:"md-typeset__scrollwrap"},x("div",{class:"md-typeset__table"},e))}function Ra(e){var o;let t=xe(),r=new URL(`../${e.version}/`,t.base);return x("li",{class:"md-version__item"},x("a",{href:`${r}`,class:"md-version__link"},e.title,((o=t.version)==null?void 0:o.alias)&&e.aliases.length>0&&x("span",{class:"md-version__alias"},e.aliases[0])))}function Cn(e,t){var o;let r=xe();return e=e.filter(n=>{var i;return!((i=n.properties)!=null&&i.hidden)}),x("div",{class:"md-version"},x("button",{class:"md-version__current","aria-label":Ee("select.version")},t.title,((o=r.version)==null?void 0:o.alias)&&t.aliases.length>0&&x("span",{class:"md-version__alias"},t.aliases[0])),x("ul",{class:"md-version__list"},e.map(Ra)))}var Ia=0;function ja(e){let 
t=z([et(e),$t(e)]).pipe(m(([o,n])=>o||n),K()),r=C(()=>Zo(e)).pipe(ne(Ne),pt(1),He(t),m(()=>en(e)));return t.pipe(Ae(o=>o),v(()=>z([t,r])),m(([o,n])=>({active:o,offset:n})),pe())}function Fa(e,t){let{content$:r,viewport$:o}=t,n=`__tooltip2_${Ia++}`;return C(()=>{let i=new g,a=new _r(!1);i.pipe(Z(),ie(!1)).subscribe(a);let s=a.pipe(Ht(c=>Le(+!c*250,kr)),K(),v(c=>c?r:S),w(c=>c.id=n),pe());z([i.pipe(m(({active:c})=>c)),s.pipe(v(c=>$t(c,250)),Q(!1))]).pipe(m(c=>c.some(l=>l))).subscribe(a);let p=a.pipe(b(c=>c),re(s,o),m(([c,l,{size:f}])=>{let u=e.getBoundingClientRect(),d=u.width/2;if(l.role==="tooltip")return{x:d,y:8+u.height};if(u.y>=f.height/2){let{height:y}=ce(l);return{x:d,y:-16-y}}else return{x:d,y:16+u.height}}));return z([s,i,p]).subscribe(([c,{offset:l},f])=>{c.style.setProperty("--md-tooltip-host-x",`${l.x}px`),c.style.setProperty("--md-tooltip-host-y",`${l.y}px`),c.style.setProperty("--md-tooltip-x",`${f.x}px`),c.style.setProperty("--md-tooltip-y",`${f.y}px`),c.classList.toggle("md-tooltip2--top",f.y<0),c.classList.toggle("md-tooltip2--bottom",f.y>=0)}),a.pipe(b(c=>c),re(s,(c,l)=>l),b(c=>c.role==="tooltip")).subscribe(c=>{let l=ce(R(":scope > *",c));c.style.setProperty("--md-tooltip-width",`${l.width}px`),c.style.setProperty("--md-tooltip-tail","0px")}),a.pipe(K(),ve(me),re(s)).subscribe(([c,l])=>{l.classList.toggle("md-tooltip2--active",c)}),z([a.pipe(b(c=>c)),s]).subscribe(([c,l])=>{l.role==="dialog"?(e.setAttribute("aria-controls",n),e.setAttribute("aria-haspopup","dialog")):e.setAttribute("aria-describedby",n)}),a.pipe(b(c=>!c)).subscribe(()=>{e.removeAttribute("aria-controls"),e.removeAttribute("aria-describedby"),e.removeAttribute("aria-haspopup")}),ja(e).pipe(w(c=>i.next(c)),_(()=>i.complete()),m(c=>$({ref:e},c)))})}function mt(e,{viewport$:t},r=document.body){return Fa(e,{content$:new j(o=>{let n=e.title,i=wn(n);return o.next(i),e.removeAttribute("title"),r.append(i),()=>{i.remove(),e.setAttribute("title",n)}}),viewport$:t})}function Ua(e,t){let 
r=C(()=>z([tn(e),Ne(t)])).pipe(m(([{x:o,y:n},i])=>{let{width:a,height:s}=ce(e);return{x:o-i.x+a/2,y:n-i.y+s/2}}));return et(e).pipe(v(o=>r.pipe(m(n=>({active:o,offset:n})),Te(+!o||1/0))))}function kn(e,t,{target$:r}){let[o,n]=Array.from(e.children);return C(()=>{let i=new g,a=i.pipe(Z(),ie(!0));return i.subscribe({next({offset:s}){e.style.setProperty("--md-tooltip-x",`${s.x}px`),e.style.setProperty("--md-tooltip-y",`${s.y}px`)},complete(){e.style.removeProperty("--md-tooltip-x"),e.style.removeProperty("--md-tooltip-y")}}),tt(e).pipe(W(a)).subscribe(s=>{e.toggleAttribute("data-md-visible",s)}),O(i.pipe(b(({active:s})=>s)),i.pipe(_e(250),b(({active:s})=>!s))).subscribe({next({active:s}){s?e.prepend(o):o.remove()},complete(){e.prepend(o)}}),i.pipe(Me(16,me)).subscribe(({active:s})=>{o.classList.toggle("md-tooltip--active",s)}),i.pipe(pt(125,me),b(()=>!!e.offsetParent),m(()=>e.offsetParent.getBoundingClientRect()),m(({x:s})=>s)).subscribe({next(s){s?e.style.setProperty("--md-tooltip-0",`${-s}px`):e.style.removeProperty("--md-tooltip-0")},complete(){e.style.removeProperty("--md-tooltip-0")}}),h(n,"click").pipe(W(a),b(s=>!(s.metaKey||s.ctrlKey))).subscribe(s=>{s.stopPropagation(),s.preventDefault()}),h(n,"mousedown").pipe(W(a),re(i)).subscribe(([s,{active:p}])=>{var c;if(s.button!==0||s.metaKey||s.ctrlKey)s.preventDefault();else if(p){s.preventDefault();let l=e.parentElement.closest(".md-annotation");l instanceof HTMLElement?l.focus():(c=Ie())==null||c.blur()}}),r.pipe(W(a),b(s=>s===o),Ge(125)).subscribe(()=>e.focus()),Ua(e,t).pipe(w(s=>i.next(s)),_(()=>i.complete()),m(s=>$({ref:e},s)))})}function Wa(e){return e.tagName==="CODE"?P(".c, .c1, .cm",e):[e]}function Da(e){let t=[];for(let r of Wa(e)){let o=[],n=document.createNodeIterator(r,NodeFilter.SHOW_TEXT);for(let i=n.nextNode();i;i=n.nextNode())o.push(i);for(let i of o){let a;for(;a=/(\(\d+\))(!)?/.exec(i.textContent);){let[,s,p]=a;if(typeof p=="undefined"){let 
c=i.splitText(a.index);i=c.splitText(s.length),t.push(c)}else{i.textContent=s,t.push(i);break}}}}return t}function Hn(e,t){t.append(...Array.from(e.childNodes))}function fr(e,t,{target$:r,print$:o}){let n=t.closest("[id]"),i=n==null?void 0:n.id,a=new Map;for(let s of Da(t)){let[,p]=s.textContent.match(/\((\d+)\)/);fe(`:scope > li:nth-child(${p})`,e)&&(a.set(p,Tn(p,i)),s.replaceWith(a.get(p)))}return a.size===0?S:C(()=>{let s=new g,p=s.pipe(Z(),ie(!0)),c=[];for(let[l,f]of a)c.push([R(".md-typeset",f),R(`:scope > li:nth-child(${l})`,e)]);return o.pipe(W(p)).subscribe(l=>{e.hidden=!l,e.classList.toggle("md-annotation-list",l);for(let[f,u]of c)l?Hn(f,u):Hn(u,f)}),O(...[...a].map(([,l])=>kn(l,t,{target$:r}))).pipe(_(()=>s.complete()),pe())})}function $n(e){if(e.nextElementSibling){let t=e.nextElementSibling;if(t.tagName==="OL")return t;if(t.tagName==="P"&&!t.children.length)return $n(t)}}function Pn(e,t){return C(()=>{let r=$n(e);return typeof r!="undefined"?fr(r,e,t):S})}var Rn=Mt(Br());var Va=0;function In(e){if(e.nextElementSibling){let t=e.nextElementSibling;if(t.tagName==="OL")return t;if(t.tagName==="P"&&!t.children.length)return In(t)}}function Na(e){return ge(e).pipe(m(({width:t})=>({scrollable:St(e).width>t})),ee("scrollable"))}function jn(e,t){let{matches:r}=matchMedia("(hover)"),o=C(()=>{let n=new g,i=n.pipe(jr(1));n.subscribe(({scrollable:c})=>{c&&r?e.setAttribute("tabindex","0"):e.removeAttribute("tabindex")});let a=[];if(Rn.default.isSupported()&&(e.closest(".copy")||B("content.code.copy")&&!e.closest(".no-copy"))){let c=e.closest("pre");c.id=`__code_${Va++}`;let l=Sn(c.id);c.insertBefore(l,e),B("content.tooltips")&&a.push(mt(l,{viewport$}))}let s=e.closest(".highlight");if(s instanceof HTMLElement){let c=In(s);if(typeof c!="undefined"&&(s.classList.contains("annotate")||B("content.code.annotate"))){let l=fr(c,e,t);a.push(ge(s).pipe(W(i),m(({width:f,height:u})=>f&&u),K(),v(f=>f?l:S)))}}return P(":scope > 
span[id]",e).length&&e.classList.add("md-code__content"),Na(e).pipe(w(c=>n.next(c)),_(()=>n.complete()),m(c=>$({ref:e},c)),Re(...a))});return B("content.lazy")?tt(e).pipe(b(n=>n),Te(1),v(()=>o)):o}function za(e,{target$:t,print$:r}){let o=!0;return O(t.pipe(m(n=>n.closest("details:not([open])")),b(n=>e===n),m(()=>({action:"open",reveal:!0}))),r.pipe(b(n=>n||!o),w(()=>o=e.open),m(n=>({action:n?"open":"close"}))))}function Fn(e,t){return C(()=>{let r=new g;return r.subscribe(({action:o,reveal:n})=>{e.toggleAttribute("open",o==="open"),n&&e.scrollIntoView()}),za(e,t).pipe(w(o=>r.next(o)),_(()=>r.complete()),m(o=>$({ref:e},o)))})}var Un=".node circle,.node ellipse,.node path,.node polygon,.node rect{fill:var(--md-mermaid-node-bg-color);stroke:var(--md-mermaid-node-fg-color)}marker{fill:var(--md-mermaid-edge-color)!important}.edgeLabel .label rect{fill:#0000}.label{color:var(--md-mermaid-label-fg-color);font-family:var(--md-mermaid-font-family)}.label foreignObject{line-height:normal;overflow:visible}.label div .edgeLabel{color:var(--md-mermaid-label-fg-color)}.edgeLabel,.edgeLabel p,.label div .edgeLabel{background-color:var(--md-mermaid-label-bg-color)}.edgeLabel,.edgeLabel p{fill:var(--md-mermaid-label-bg-color);color:var(--md-mermaid-edge-color)}.edgePath .path,.flowchart-link{stroke:var(--md-mermaid-edge-color);stroke-width:.05rem}.edgePath .arrowheadPath{fill:var(--md-mermaid-edge-color);stroke:none}.cluster rect{fill:var(--md-default-fg-color--lightest);stroke:var(--md-default-fg-color--lighter)}.cluster span{color:var(--md-mermaid-label-fg-color);font-family:var(--md-mermaid-font-family)}g #flowchart-circleEnd,g #flowchart-circleStart,g #flowchart-crossEnd,g #flowchart-crossStart,g #flowchart-pointEnd,g #flowchart-pointStart{stroke:none}g.classGroup line,g.classGroup rect{fill:var(--md-mermaid-node-bg-color);stroke:var(--md-mermaid-node-fg-color)}g.classGroup text{fill:var(--md-mermaid-label-fg-color);font-family:var(--md-mermaid-font-family)}.classLabel 
.box{fill:var(--md-mermaid-label-bg-color);background-color:var(--md-mermaid-label-bg-color);opacity:1}.classLabel .label{fill:var(--md-mermaid-label-fg-color);font-family:var(--md-mermaid-font-family)}.node .divider{stroke:var(--md-mermaid-node-fg-color)}.relation{stroke:var(--md-mermaid-edge-color)}.cardinality{fill:var(--md-mermaid-label-fg-color);font-family:var(--md-mermaid-font-family)}.cardinality text{fill:inherit!important}defs #classDiagram-compositionEnd,defs #classDiagram-compositionStart,defs #classDiagram-dependencyEnd,defs #classDiagram-dependencyStart,defs #classDiagram-extensionEnd,defs #classDiagram-extensionStart{fill:var(--md-mermaid-edge-color)!important;stroke:var(--md-mermaid-edge-color)!important}defs #classDiagram-aggregationEnd,defs #classDiagram-aggregationStart{fill:var(--md-mermaid-label-bg-color)!important;stroke:var(--md-mermaid-edge-color)!important}g.stateGroup rect{fill:var(--md-mermaid-node-bg-color);stroke:var(--md-mermaid-node-fg-color)}g.stateGroup .state-title{fill:var(--md-mermaid-label-fg-color)!important;font-family:var(--md-mermaid-font-family)}g.stateGroup .composit{fill:var(--md-mermaid-label-bg-color)}.nodeLabel,.nodeLabel p{color:var(--md-mermaid-label-fg-color);font-family:var(--md-mermaid-font-family)}a .nodeLabel{text-decoration:underline}.node circle.state-end,.node circle.state-start,.start-state{fill:var(--md-mermaid-edge-color);stroke:none}.end-state-inner,.end-state-outer{fill:var(--md-mermaid-edge-color)}.end-state-inner,.node circle.state-end{stroke:var(--md-mermaid-label-bg-color)}.transition{stroke:var(--md-mermaid-edge-color)}[id^=state-fork] rect,[id^=state-join] rect{fill:var(--md-mermaid-edge-color)!important;stroke:none!important}.statediagram-cluster.statediagram-cluster .inner{fill:var(--md-default-bg-color)}.statediagram-cluster rect{fill:var(--md-mermaid-node-bg-color);stroke:var(--md-mermaid-node-fg-color)}.statediagram-state 
rect.divider{fill:var(--md-default-fg-color--lightest);stroke:var(--md-default-fg-color--lighter)}defs #statediagram-barbEnd{stroke:var(--md-mermaid-edge-color)}.attributeBoxEven,.attributeBoxOdd{fill:var(--md-mermaid-node-bg-color);stroke:var(--md-mermaid-node-fg-color)}.entityBox{fill:var(--md-mermaid-label-bg-color);stroke:var(--md-mermaid-node-fg-color)}.entityLabel{fill:var(--md-mermaid-label-fg-color);font-family:var(--md-mermaid-font-family)}.relationshipLabelBox{fill:var(--md-mermaid-label-bg-color);fill-opacity:1;background-color:var(--md-mermaid-label-bg-color);opacity:1}.relationshipLabel{fill:var(--md-mermaid-label-fg-color)}.relationshipLine{stroke:var(--md-mermaid-edge-color)}defs #ONE_OR_MORE_END *,defs #ONE_OR_MORE_START *,defs #ONLY_ONE_END *,defs #ONLY_ONE_START *,defs #ZERO_OR_MORE_END *,defs #ZERO_OR_MORE_START *,defs #ZERO_OR_ONE_END *,defs #ZERO_OR_ONE_START *{stroke:var(--md-mermaid-edge-color)!important}defs #ZERO_OR_MORE_END circle,defs #ZERO_OR_MORE_START circle{fill:var(--md-mermaid-label-bg-color)}.actor{fill:var(--md-mermaid-sequence-actor-bg-color);stroke:var(--md-mermaid-sequence-actor-border-color)}text.actor>tspan{fill:var(--md-mermaid-sequence-actor-fg-color);font-family:var(--md-mermaid-font-family)}line{stroke:var(--md-mermaid-sequence-actor-line-color)}.actor-man circle,.actor-man line{fill:var(--md-mermaid-sequence-actorman-bg-color);stroke:var(--md-mermaid-sequence-actorman-line-color)}.messageLine0,.messageLine1{stroke:var(--md-mermaid-sequence-message-line-color)}.note{fill:var(--md-mermaid-sequence-note-bg-color);stroke:var(--md-mermaid-sequence-note-border-color)}.loopText,.loopText>tspan,.messageText,.noteText>tspan{stroke:none;font-family:var(--md-mermaid-font-family)!important}.messageText{fill:var(--md-mermaid-sequence-message-fg-color)}.loopText,.loopText>tspan{fill:var(--md-mermaid-sequence-loop-fg-color)}.noteText>tspan{fill:var(--md-mermaid-sequence-note-fg-color)}#arrowhead 
path{fill:var(--md-mermaid-sequence-message-line-color);stroke:none}.loopLine{fill:var(--md-mermaid-sequence-loop-bg-color);stroke:var(--md-mermaid-sequence-loop-border-color)}.labelBox{fill:var(--md-mermaid-sequence-label-bg-color);stroke:none}.labelText,.labelText>span{fill:var(--md-mermaid-sequence-label-fg-color);font-family:var(--md-mermaid-font-family)}.sequenceNumber{fill:var(--md-mermaid-sequence-number-fg-color)}rect.rect{fill:var(--md-mermaid-sequence-box-bg-color);stroke:none}rect.rect+text.text{fill:var(--md-mermaid-sequence-box-fg-color)}defs #sequencenumber{fill:var(--md-mermaid-sequence-number-bg-color)!important}";var Gr,Qa=0;function Ka(){return typeof mermaid=="undefined"||mermaid instanceof Element?Tt("https://unpkg.com/mermaid@11/dist/mermaid.min.js"):I(void 0)}function Wn(e){return e.classList.remove("mermaid"),Gr||(Gr=Ka().pipe(w(()=>mermaid.initialize({startOnLoad:!1,themeCSS:Un,sequence:{actorFontSize:"16px",messageFontSize:"16px",noteFontSize:"16px"}})),m(()=>{}),G(1))),Gr.subscribe(()=>co(this,null,function*(){e.classList.add("mermaid");let t=`__mermaid_${Qa++}`,r=x("div",{class:"mermaid"}),o=e.textContent,{svg:n,fn:i}=yield mermaid.render(t,o),a=r.attachShadow({mode:"closed"});a.innerHTML=n,e.replaceWith(r),i==null||i(a)})),Gr.pipe(m(()=>({ref:e})))}var Dn=x("table");function Vn(e){return e.replaceWith(Dn),Dn.replaceWith(An(e)),I({ref:e})}function Ya(e){let t=e.find(r=>r.checked)||e[0];return O(...e.map(r=>h(r,"change").pipe(m(()=>R(`label[for="${r.id}"]`))))).pipe(Q(R(`label[for="${t.id}"]`)),m(r=>({active:r})))}function Nn(e,{viewport$:t,target$:r}){let o=R(".tabbed-labels",e),n=P(":scope > input",e),i=Kr("prev");e.append(i);let a=Kr("next");return e.append(a),C(()=>{let s=new g,p=s.pipe(Z(),ie(!0));z([s,ge(e),tt(e)]).pipe(W(p),Me(1,me)).subscribe({next([{active:c},l]){let f=Ve(c),{width:u}=ce(c);e.style.setProperty("--md-indicator-x",`${f.x}px`),e.style.setProperty("--md-indicator-width",`${u}px`);let 
d=pr(o);(f.xd.x+l.width)&&o.scrollTo({left:Math.max(0,f.x-16),behavior:"smooth"})},complete(){e.style.removeProperty("--md-indicator-x"),e.style.removeProperty("--md-indicator-width")}}),z([Ne(o),ge(o)]).pipe(W(p)).subscribe(([c,l])=>{let f=St(o);i.hidden=c.x<16,a.hidden=c.x>f.width-l.width-16}),O(h(i,"click").pipe(m(()=>-1)),h(a,"click").pipe(m(()=>1))).pipe(W(p)).subscribe(c=>{let{width:l}=ce(o);o.scrollBy({left:l*c,behavior:"smooth"})}),r.pipe(W(p),b(c=>n.includes(c))).subscribe(c=>c.click()),o.classList.add("tabbed-labels--linked");for(let c of n){let l=R(`label[for="${c.id}"]`);l.replaceChildren(x("a",{href:`#${l.htmlFor}`,tabIndex:-1},...Array.from(l.childNodes))),h(l.firstElementChild,"click").pipe(W(p),b(f=>!(f.metaKey||f.ctrlKey)),w(f=>{f.preventDefault(),f.stopPropagation()})).subscribe(()=>{history.replaceState({},"",`#${l.htmlFor}`),l.click()})}return B("content.tabs.link")&&s.pipe(Ce(1),re(t)).subscribe(([{active:c},{offset:l}])=>{let f=c.innerText.trim();if(c.hasAttribute("data-md-switching"))c.removeAttribute("data-md-switching");else{let u=e.offsetTop-l.y;for(let y of P("[data-tabs]"))for(let L of P(":scope > input",y)){let X=R(`label[for="${L.id}"]`);if(X!==c&&X.innerText.trim()===f){X.setAttribute("data-md-switching",""),L.click();break}}window.scrollTo({top:e.offsetTop-u});let d=__md_get("__tabs")||[];__md_set("__tabs",[...new Set([f,...d])])}}),s.pipe(W(p)).subscribe(()=>{for(let c of P("audio, video",e))c.pause()}),Ya(n).pipe(w(c=>s.next(c)),_(()=>s.complete()),m(c=>$({ref:e},c)))}).pipe(Ke(se))}function zn(e,{viewport$:t,target$:r,print$:o}){return O(...P(".annotate:not(.highlight)",e).map(n=>Pn(n,{target$:r,print$:o})),...P("pre:not(.mermaid) > 
code",e).map(n=>jn(n,{target$:r,print$:o})),...P("pre.mermaid",e).map(n=>Wn(n)),...P("table:not([class])",e).map(n=>Vn(n)),...P("details",e).map(n=>Fn(n,{target$:r,print$:o})),...P("[data-tabs]",e).map(n=>Nn(n,{viewport$:t,target$:r})),...P("[title]",e).filter(()=>B("content.tooltips")).map(n=>mt(n,{viewport$:t})))}function Ba(e,{alert$:t}){return t.pipe(v(r=>O(I(!0),I(!1).pipe(Ge(2e3))).pipe(m(o=>({message:r,active:o})))))}function qn(e,t){let r=R(".md-typeset",e);return C(()=>{let o=new g;return o.subscribe(({message:n,active:i})=>{e.classList.toggle("md-dialog--active",i),r.textContent=n}),Ba(e,t).pipe(w(n=>o.next(n)),_(()=>o.complete()),m(n=>$({ref:e},n)))})}var Ga=0;function Ja(e,t){document.body.append(e);let{width:r}=ce(e);e.style.setProperty("--md-tooltip-width",`${r}px`),e.remove();let o=cr(t),n=typeof o!="undefined"?Ne(o):I({x:0,y:0}),i=O(et(t),$t(t)).pipe(K());return z([i,n]).pipe(m(([a,s])=>{let{x:p,y:c}=Ve(t),l=ce(t),f=t.closest("table");return f&&t.parentElement&&(p+=f.offsetLeft+t.parentElement.offsetLeft,c+=f.offsetTop+t.parentElement.offsetTop),{active:a,offset:{x:p-s.x+l.width/2-r/2,y:c-s.y+l.height+8}}}))}function Qn(e){let t=e.title;if(!t.length)return S;let r=`__tooltip_${Ga++}`,o=Rt(r,"inline"),n=R(".md-typeset",o);return n.innerHTML=t,C(()=>{let i=new g;return 
i.subscribe({next({offset:a}){o.style.setProperty("--md-tooltip-x",`${a.x}px`),o.style.setProperty("--md-tooltip-y",`${a.y}px`)},complete(){o.style.removeProperty("--md-tooltip-x"),o.style.removeProperty("--md-tooltip-y")}}),O(i.pipe(b(({active:a})=>a)),i.pipe(_e(250),b(({active:a})=>!a))).subscribe({next({active:a}){a?(e.insertAdjacentElement("afterend",o),e.setAttribute("aria-describedby",r),e.removeAttribute("title")):(o.remove(),e.removeAttribute("aria-describedby"),e.setAttribute("title",t))},complete(){o.remove(),e.removeAttribute("aria-describedby"),e.setAttribute("title",t)}}),i.pipe(Me(16,me)).subscribe(({active:a})=>{o.classList.toggle("md-tooltip--active",a)}),i.pipe(pt(125,me),b(()=>!!e.offsetParent),m(()=>e.offsetParent.getBoundingClientRect()),m(({x:a})=>a)).subscribe({next(a){a?o.style.setProperty("--md-tooltip-0",`${-a}px`):o.style.removeProperty("--md-tooltip-0")},complete(){o.style.removeProperty("--md-tooltip-0")}}),Ja(o,e).pipe(w(a=>i.next(a)),_(()=>i.complete()),m(a=>$({ref:e},a)))}).pipe(Ke(se))}function Xa({viewport$:e}){if(!B("header.autohide"))return I(!1);let t=e.pipe(m(({offset:{y:n}})=>n),Be(2,1),m(([n,i])=>[nMath.abs(i-n.y)>100),m(([,[n]])=>n),K()),o=ze("search");return z([e,o]).pipe(m(([{offset:n},i])=>n.y>400&&!i),K(),v(n=>n?r:I(!1)),Q(!1))}function Kn(e,t){return C(()=>z([ge(e),Xa(t)])).pipe(m(([{height:r},o])=>({height:r,hidden:o})),K((r,o)=>r.height===o.height&&r.hidden===o.hidden),G(1))}function Yn(e,{header$:t,main$:r}){return C(()=>{let o=new g,n=o.pipe(Z(),ie(!0));o.pipe(ee("active"),He(t)).subscribe(([{active:a},{hidden:s}])=>{e.classList.toggle("md-header--shadow",a&&!s),e.hidden=s});let i=ue(P("[title]",e)).pipe(b(()=>B("content.tooltips")),ne(a=>Qn(a)));return r.subscribe(o),t.pipe(W(n),m(a=>$({ref:e},a)),Re(i.pipe(W(n))))})}function Za(e,{viewport$:t,header$:r}){return mr(e,{viewport$:t,header$:r}).pipe(m(({offset:{y:o}})=>{let{height:n}=ce(e);return{active:o>=n}}),ee("active"))}function Bn(e,t){return C(()=>{let r=new 
g;r.subscribe({next({active:n}){e.classList.toggle("md-header__title--active",n)},complete(){e.classList.remove("md-header__title--active")}});let o=fe(".md-content h1");return typeof o=="undefined"?S:Za(o,t).pipe(w(n=>r.next(n)),_(()=>r.complete()),m(n=>$({ref:e},n)))})}function Gn(e,{viewport$:t,header$:r}){let o=r.pipe(m(({height:i})=>i),K()),n=o.pipe(v(()=>ge(e).pipe(m(({height:i})=>({top:e.offsetTop,bottom:e.offsetTop+i})),ee("bottom"))));return z([o,n,t]).pipe(m(([i,{top:a,bottom:s},{offset:{y:p},size:{height:c}}])=>(c=Math.max(0,c-Math.max(0,a-p,i)-Math.max(0,c+p-s)),{offset:a-i,height:c,active:a-i<=p})),K((i,a)=>i.offset===a.offset&&i.height===a.height&&i.active===a.active))}function es(e){let t=__md_get("__palette")||{index:e.findIndex(o=>matchMedia(o.getAttribute("data-md-color-media")).matches)},r=Math.max(0,Math.min(t.index,e.length-1));return I(...e).pipe(ne(o=>h(o,"change").pipe(m(()=>o))),Q(e[r]),m(o=>({index:e.indexOf(o),color:{media:o.getAttribute("data-md-color-media"),scheme:o.getAttribute("data-md-color-scheme"),primary:o.getAttribute("data-md-color-primary"),accent:o.getAttribute("data-md-color-accent")}})),G(1))}function Jn(e){let t=P("input",e),r=x("meta",{name:"theme-color"});document.head.appendChild(r);let o=x("meta",{name:"color-scheme"});document.head.appendChild(o);let n=Pt("(prefers-color-scheme: light)");return C(()=>{let i=new g;return i.subscribe(a=>{if(document.body.setAttribute("data-md-color-switching",""),a.color.media==="(prefers-color-scheme)"){let s=matchMedia("(prefers-color-scheme: light)"),p=document.querySelector(s.matches?"[data-md-color-media='(prefers-color-scheme: light)']":"[data-md-color-media='(prefers-color-scheme: dark)']");a.color.scheme=p.getAttribute("data-md-color-scheme"),a.color.primary=p.getAttribute("data-md-color-primary"),a.color.accent=p.getAttribute("data-md-color-accent")}for(let[s,p]of Object.entries(a.color))document.body.setAttribute(`data-md-color-${s}`,p);for(let 
s=0;sa.key==="Enter"),re(i,(a,s)=>s)).subscribe(({index:a})=>{a=(a+1)%t.length,t[a].click(),t[a].focus()}),i.pipe(m(()=>{let a=Se("header"),s=window.getComputedStyle(a);return o.content=s.colorScheme,s.backgroundColor.match(/\d+/g).map(p=>(+p).toString(16).padStart(2,"0")).join("")})).subscribe(a=>r.content=`#${a}`),i.pipe(ve(se)).subscribe(()=>{document.body.removeAttribute("data-md-color-switching")}),es(t).pipe(W(n.pipe(Ce(1))),ct(),w(a=>i.next(a)),_(()=>i.complete()),m(a=>$({ref:e},a)))})}function Xn(e,{progress$:t}){return C(()=>{let r=new g;return r.subscribe(({value:o})=>{e.style.setProperty("--md-progress-value",`${o}`)}),t.pipe(w(o=>r.next({value:o})),_(()=>r.complete()),m(o=>({ref:e,value:o})))})}var Jr=Mt(Br());function ts(e){e.setAttribute("data-md-copying","");let t=e.closest("[data-copy]"),r=t?t.getAttribute("data-copy"):e.innerText;return e.removeAttribute("data-md-copying"),r.trimEnd()}function Zn({alert$:e}){Jr.default.isSupported()&&new j(t=>{new Jr.default("[data-clipboard-target], [data-clipboard-text]",{text:r=>r.getAttribute("data-clipboard-text")||ts(R(r.getAttribute("data-clipboard-target")))}).on("success",r=>t.next(r))}).pipe(w(t=>{t.trigger.focus()}),m(()=>Ee("clipboard.copied"))).subscribe(e)}function ei(e,t){return e.protocol=t.protocol,e.hostname=t.hostname,e}function rs(e,t){let r=new Map;for(let o of P("url",e)){let n=R("loc",o),i=[ei(new URL(n.textContent),t)];r.set(`${i[0]}`,i);for(let a of P("[rel=alternate]",o)){let s=a.getAttribute("href");s!=null&&i.push(ei(new URL(s),t))}}return r}function ur(e){return un(new URL("sitemap.xml",e)).pipe(m(t=>rs(t,new URL(e))),de(()=>I(new Map)))}function os(e,t){if(!(e.target instanceof Element))return S;let r=e.target.closest("a");if(r===null)return S;if(r.target||e.metaKey||e.ctrlKey)return S;let o=new URL(r.href);return o.search=o.hash="",t.has(`${o}`)?(e.preventDefault(),I(new URL(r.href))):S}function ti(e){let t=new Map;for(let r of P(":scope > *",e.head))t.set(r.outerHTML,r);return 
t}function ri(e){for(let t of P("[href], [src]",e))for(let r of["href","src"]){let o=t.getAttribute(r);if(o&&!/^(?:[a-z]+:)?\/\//i.test(o)){t[r]=t[r];break}}return I(e)}function ns(e){for(let o of["[data-md-component=announce]","[data-md-component=container]","[data-md-component=header-topic]","[data-md-component=outdated]","[data-md-component=logo]","[data-md-component=skip]",...B("navigation.tabs.sticky")?["[data-md-component=tabs]"]:[]]){let n=fe(o),i=fe(o,e);typeof n!="undefined"&&typeof i!="undefined"&&n.replaceWith(i)}let t=ti(document);for(let[o,n]of ti(e))t.has(o)?t.delete(o):document.head.appendChild(n);for(let o of t.values()){let n=o.getAttribute("name");n!=="theme-color"&&n!=="color-scheme"&&o.remove()}let r=Se("container");return We(P("script",r)).pipe(v(o=>{let n=e.createElement("script");if(o.src){for(let i of o.getAttributeNames())n.setAttribute(i,o.getAttribute(i));return o.replaceWith(n),new j(i=>{n.onload=()=>i.complete()})}else return n.textContent=o.textContent,o.replaceWith(n),S}),Z(),ie(document))}function oi({location$:e,viewport$:t,progress$:r}){let o=xe();if(location.protocol==="file:")return S;let n=ur(o.base);I(document).subscribe(ri);let i=h(document.body,"click").pipe(He(n),v(([p,c])=>os(p,c)),pe()),a=h(window,"popstate").pipe(m(ye),pe());i.pipe(re(t)).subscribe(([p,{offset:c}])=>{history.replaceState(c,""),history.pushState(null,"",p)}),O(i,a).subscribe(e);let s=e.pipe(ee("pathname"),v(p=>fn(p,{progress$:r}).pipe(de(()=>(lt(p,!0),S)))),v(ri),v(ns),pe());return O(s.pipe(re(e,(p,c)=>c)),s.pipe(v(()=>e),ee("pathname"),v(()=>e),ee("hash")),e.pipe(K((p,c)=>p.pathname===c.pathname&&p.hash===c.hash),v(()=>i),w(()=>history.back()))).subscribe(p=>{var c,l;history.state!==null||!p.hash?window.scrollTo(0,(l=(c=history.state)==null?void 
0:c.y)!=null?l:0):(history.scrollRestoration="auto",pn(p.hash),history.scrollRestoration="manual")}),e.subscribe(()=>{history.scrollRestoration="manual"}),h(window,"beforeunload").subscribe(()=>{history.scrollRestoration="auto"}),t.pipe(ee("offset"),_e(100)).subscribe(({offset:p})=>{history.replaceState(p,"")}),s}var ni=Mt(qr());function ii(e){let t=e.separator.split("|").map(n=>n.replace(/(\(\?[!=<][^)]+\))/g,"").length===0?"\uFFFD":n).join("|"),r=new RegExp(t,"img"),o=(n,i,a)=>`${i}${a}`;return n=>{n=n.replace(/[\s*+\-:~^]+/g," ").trim();let i=new RegExp(`(^|${e.separator}|)(${n.replace(/[|\\{}()[\]^$+*?.-]/g,"\\$&").replace(r,"|")})`,"img");return a=>(0,ni.default)(a).replace(i,o).replace(/<\/mark>(\s+)]*>/img,"$1")}}function jt(e){return e.type===1}function dr(e){return e.type===3}function ai(e,t){let r=yn(e);return O(I(location.protocol!=="file:"),ze("search")).pipe(Ae(o=>o),v(()=>t)).subscribe(({config:o,docs:n})=>r.next({type:0,data:{config:o,docs:n,options:{suggest:B("search.suggest")}}})),r}function si(e){var l;let{selectedVersionSitemap:t,selectedVersionBaseURL:r,currentLocation:o,currentBaseURL:n}=e,i=(l=Xr(n))==null?void 0:l.pathname;if(i===void 0)return;let a=ss(o.pathname,i);if(a===void 0)return;let s=ps(t.keys());if(!t.has(s))return;let p=Xr(a,s);if(!p||!t.has(p.href))return;let c=Xr(a,r);if(c)return c.hash=o.hash,c.search=o.search,c}function Xr(e,t){try{return new URL(e,t)}catch(r){return}}function ss(e,t){if(e.startsWith(t))return e.slice(t.length)}function cs(e,t){let r=Math.min(e.length,t.length),o;for(o=0;oS)),o=r.pipe(m(n=>{let[,i]=t.base.match(/([^/]+)\/?$/);return n.find(({version:a,aliases:s})=>a===i||s.includes(i))||n[0]}));r.pipe(m(n=>new Map(n.map(i=>[`${new URL(`../${i.version}/`,t.base)}`,i]))),v(n=>h(document.body,"click").pipe(b(i=>!i.metaKey&&!i.ctrlKey),re(o),v(([i,a])=>{if(i.target instanceof Element){let s=i.target.closest("a");if(s&&!s.target&&n.has(s.href)){let 
p=s.href;return!i.target.closest(".md-version")&&n.get(p)===a?S:(i.preventDefault(),I(new URL(p)))}}return S}),v(i=>ur(i).pipe(m(a=>{var s;return(s=si({selectedVersionSitemap:a,selectedVersionBaseURL:i,currentLocation:ye(),currentBaseURL:t.base}))!=null?s:i})))))).subscribe(n=>lt(n,!0)),z([r,o]).subscribe(([n,i])=>{R(".md-header__topic").appendChild(Cn(n,i))}),e.pipe(v(()=>o)).subscribe(n=>{var a;let i=__md_get("__outdated",sessionStorage);if(i===null){i=!0;let s=((a=t.version)==null?void 0:a.default)||"latest";Array.isArray(s)||(s=[s]);e:for(let p of s)for(let c of n.aliases.concat(n.version))if(new RegExp(p,"i").test(c)){i=!1;break e}__md_set("__outdated",i,sessionStorage)}if(i)for(let s of ae("outdated"))s.hidden=!1})}function ls(e,{worker$:t}){let{searchParams:r}=ye();r.has("q")&&(Je("search",!0),e.value=r.get("q"),e.focus(),ze("search").pipe(Ae(i=>!i)).subscribe(()=>{let i=ye();i.searchParams.delete("q"),history.replaceState({},"",`${i}`)}));let o=et(e),n=O(t.pipe(Ae(jt)),h(e,"keyup"),o).pipe(m(()=>e.value),K());return z([n,o]).pipe(m(([i,a])=>({value:i,focus:a})),G(1))}function pi(e,{worker$:t}){let r=new g,o=r.pipe(Z(),ie(!0));z([t.pipe(Ae(jt)),r],(i,a)=>a).pipe(ee("value")).subscribe(({value:i})=>t.next({type:2,data:i})),r.pipe(ee("focus")).subscribe(({focus:i})=>{i&&Je("search",i)}),h(e.form,"reset").pipe(W(o)).subscribe(()=>e.focus());let n=R("header [for=__search]");return h(n,"click").subscribe(()=>e.focus()),ls(e,{worker$:t}).pipe(w(i=>r.next(i)),_(()=>r.complete()),m(i=>$({ref:e},i)),G(1))}function li(e,{worker$:t,query$:r}){let o=new g,n=on(e.parentElement).pipe(b(Boolean)),i=e.parentElement,a=R(":scope > :first-child",e),s=R(":scope > :last-child",e);ze("search").subscribe(l=>s.setAttribute("role",l?"list":"presentation")),o.pipe(re(r),Wr(t.pipe(Ae(jt)))).subscribe(([{items:l},{value:f}])=>{switch(l.length){case 0:a.textContent=f.length?Ee("search.result.none"):Ee("search.result.placeholder");break;case 
1:a.textContent=Ee("search.result.one");break;default:let u=sr(l.length);a.textContent=Ee("search.result.other",u)}});let p=o.pipe(w(()=>s.innerHTML=""),v(({items:l})=>O(I(...l.slice(0,10)),I(...l.slice(10)).pipe(Be(4),Vr(n),v(([f])=>f)))),m(Mn),pe());return p.subscribe(l=>s.appendChild(l)),p.pipe(ne(l=>{let f=fe("details",l);return typeof f=="undefined"?S:h(f,"toggle").pipe(W(o),m(()=>f))})).subscribe(l=>{l.open===!1&&l.offsetTop<=i.scrollTop&&i.scrollTo({top:l.offsetTop})}),t.pipe(b(dr),m(({data:l})=>l)).pipe(w(l=>o.next(l)),_(()=>o.complete()),m(l=>$({ref:e},l)))}function ms(e,{query$:t}){return t.pipe(m(({value:r})=>{let o=ye();return o.hash="",r=r.replace(/\s+/g,"+").replace(/&/g,"%26").replace(/=/g,"%3D"),o.search=`q=${r}`,{url:o}}))}function mi(e,t){let r=new g,o=r.pipe(Z(),ie(!0));return r.subscribe(({url:n})=>{e.setAttribute("data-clipboard-text",e.href),e.href=`${n}`}),h(e,"click").pipe(W(o)).subscribe(n=>n.preventDefault()),ms(e,t).pipe(w(n=>r.next(n)),_(()=>r.complete()),m(n=>$({ref:e},n)))}function fi(e,{worker$:t,keyboard$:r}){let o=new g,n=Se("search-query"),i=O(h(n,"keydown"),h(n,"focus")).pipe(ve(se),m(()=>n.value),K());return o.pipe(He(i),m(([{suggest:s},p])=>{let c=p.split(/([\s-]+)/);if(s!=null&&s.length&&c[c.length-1]){let l=s[s.length-1];l.startsWith(c[c.length-1])&&(c[c.length-1]=l)}else c.length=0;return c})).subscribe(s=>e.innerHTML=s.join("").replace(/\s/g," ")),r.pipe(b(({mode:s})=>s==="search")).subscribe(s=>{switch(s.type){case"ArrowRight":e.innerText.length&&n.selectionStart===n.value.length&&(n.value=e.innerText);break}}),t.pipe(b(dr),m(({data:s})=>s)).pipe(w(s=>o.next(s)),_(()=>o.complete()),m(()=>({ref:e})))}function ui(e,{index$:t,keyboard$:r}){let o=xe();try{let n=ai(o.search,t),i=Se("search-query",e),a=Se("search-result",e);h(e,"click").pipe(b(({target:p})=>p instanceof Element&&!!p.closest("a"))).subscribe(()=>Je("search",!1)),r.pipe(b(({mode:p})=>p==="search")).subscribe(p=>{let c=Ie();switch(p.type){case"Enter":if(c===i){let 
l=new Map;for(let f of P(":first-child [href]",a)){let u=f.firstElementChild;l.set(f,parseFloat(u.getAttribute("data-md-score")))}if(l.size){let[[f]]=[...l].sort(([,u],[,d])=>d-u);f.click()}p.claim()}break;case"Escape":case"Tab":Je("search",!1),i.blur();break;case"ArrowUp":case"ArrowDown":if(typeof c=="undefined")i.focus();else{let l=[i,...P(":not(details) > [href], summary, details[open] [href]",a)],f=Math.max(0,(Math.max(0,l.indexOf(c))+l.length+(p.type==="ArrowUp"?-1:1))%l.length);l[f].focus()}p.claim();break;default:i!==Ie()&&i.focus()}}),r.pipe(b(({mode:p})=>p==="global")).subscribe(p=>{switch(p.type){case"f":case"s":case"/":i.focus(),i.select(),p.claim();break}});let s=pi(i,{worker$:n});return O(s,li(a,{worker$:n,query$:s})).pipe(Re(...ae("search-share",e).map(p=>mi(p,{query$:s})),...ae("search-suggest",e).map(p=>fi(p,{worker$:n,keyboard$:r}))))}catch(n){return e.hidden=!0,Ye}}function di(e,{index$:t,location$:r}){return z([t,r.pipe(Q(ye()),b(o=>!!o.searchParams.get("h")))]).pipe(m(([o,n])=>ii(o.config)(n.searchParams.get("h"))),m(o=>{var a;let n=new Map,i=document.createNodeIterator(e,NodeFilter.SHOW_TEXT);for(let s=i.nextNode();s;s=i.nextNode())if((a=s.parentElement)!=null&&a.offsetHeight){let p=s.textContent,c=o(p);c.length>p.length&&n.set(s,c)}for(let[s,p]of n){let{childNodes:c}=x("span",null,p);s.replaceWith(...Array.from(c))}return{ref:e,nodes:n}}))}function fs(e,{viewport$:t,main$:r}){let o=e.closest(".md-grid"),n=o.offsetTop-o.parentElement.offsetTop;return z([r,t]).pipe(m(([{offset:i,height:a},{offset:{y:s}}])=>(a=a+Math.min(n,Math.max(0,s-i))-n,{height:a,locked:s>=i+n})),K((i,a)=>i.height===a.height&&i.locked===a.locked))}function Zr(e,o){var n=o,{header$:t}=n,r=so(n,["header$"]);let i=R(".md-sidebar__scrollwrap",e),{y:a}=Ve(i);return C(()=>{let s=new g,p=s.pipe(Z(),ie(!0)),c=s.pipe(Me(0,me));return 
c.pipe(re(t)).subscribe({next([{height:l},{height:f}]){i.style.height=`${l-2*a}px`,e.style.top=`${f}px`},complete(){i.style.height="",e.style.top=""}}),c.pipe(Ae()).subscribe(()=>{for(let l of P(".md-nav__link--active[href]",e)){if(!l.clientHeight)continue;let f=l.closest(".md-sidebar__scrollwrap");if(typeof f!="undefined"){let u=l.offsetTop-f.offsetTop,{height:d}=ce(f);f.scrollTo({top:u-d/2})}}}),ue(P("label[tabindex]",e)).pipe(ne(l=>h(l,"click").pipe(ve(se),m(()=>l),W(p)))).subscribe(l=>{let f=R(`[id="${l.htmlFor}"]`);R(`[aria-labelledby="${l.id}"]`).setAttribute("aria-expanded",`${f.checked}`)}),fs(e,r).pipe(w(l=>s.next(l)),_(()=>s.complete()),m(l=>$({ref:e},l)))})}function hi(e,t){if(typeof t!="undefined"){let r=`https://api.github.com/repos/${e}/${t}`;return st(je(`${r}/releases/latest`).pipe(de(()=>S),m(o=>({version:o.tag_name})),De({})),je(r).pipe(de(()=>S),m(o=>({stars:o.stargazers_count,forks:o.forks_count})),De({}))).pipe(m(([o,n])=>$($({},o),n)))}else{let r=`https://api.github.com/users/${e}`;return je(r).pipe(m(o=>({repositories:o.public_repos})),De({}))}}function bi(e,t){let r=`https://${e}/api/v4/projects/${encodeURIComponent(t)}`;return st(je(`${r}/releases/permalink/latest`).pipe(de(()=>S),m(({tag_name:o})=>({version:o})),De({})),je(r).pipe(de(()=>S),m(({star_count:o,forks_count:n})=>({stars:o,forks:n})),De({}))).pipe(m(([o,n])=>$($({},o),n)))}function vi(e){let t=e.match(/^.+github\.com\/([^/]+)\/?([^/]+)?/i);if(t){let[,r,o]=t;return hi(r,o)}if(t=e.match(/^.+?([^/]*gitlab[^/]+)\/(.+?)\/?$/i),t){let[,r,o]=t;return bi(r,o)}return S}var us;function ds(e){return us||(us=C(()=>{let t=__md_get("__source",sessionStorage);if(t)return I(t);if(ae("consent").length){let o=__md_get("__consent");if(!(o&&o.github))return S}return vi(e.href).pipe(w(o=>__md_set("__source",o,sessionStorage)))}).pipe(de(()=>S),b(t=>Object.keys(t).length>0),m(t=>({facts:t})),G(1)))}function gi(e){let t=R(":scope > :last-child",e);return C(()=>{let r=new g;return 
r.subscribe(({facts:o})=>{t.appendChild(_n(o)),t.classList.add("md-source__repository--active")}),ds(e).pipe(w(o=>r.next(o)),_(()=>r.complete()),m(o=>$({ref:e},o)))})}function hs(e,{viewport$:t,header$:r}){return ge(document.body).pipe(v(()=>mr(e,{header$:r,viewport$:t})),m(({offset:{y:o}})=>({hidden:o>=10})),ee("hidden"))}function yi(e,t){return C(()=>{let r=new g;return r.subscribe({next({hidden:o}){e.hidden=o},complete(){e.hidden=!1}}),(B("navigation.tabs.sticky")?I({hidden:!1}):hs(e,t)).pipe(w(o=>r.next(o)),_(()=>r.complete()),m(o=>$({ref:e},o)))})}function bs(e,{viewport$:t,header$:r}){let o=new Map,n=P(".md-nav__link",e);for(let s of n){let p=decodeURIComponent(s.hash.substring(1)),c=fe(`[id="${p}"]`);typeof c!="undefined"&&o.set(s,c)}let i=r.pipe(ee("height"),m(({height:s})=>{let p=Se("main"),c=R(":scope > :first-child",p);return s+.8*(c.offsetTop-p.offsetTop)}),pe());return ge(document.body).pipe(ee("height"),v(s=>C(()=>{let p=[];return I([...o].reduce((c,[l,f])=>{for(;p.length&&o.get(p[p.length-1]).tagName>=f.tagName;)p.pop();let u=f.offsetTop;for(;!u&&f.parentElement;)f=f.parentElement,u=f.offsetTop;let d=f.offsetParent;for(;d;d=d.offsetParent)u+=d.offsetTop;return c.set([...p=[...p,l]].reverse(),u)},new Map))}).pipe(m(p=>new Map([...p].sort(([,c],[,l])=>c-l))),He(i),v(([p,c])=>t.pipe(Fr(([l,f],{offset:{y:u},size:d})=>{let y=u+d.height>=Math.floor(s.height);for(;f.length;){let[,L]=f[0];if(L-c=u&&!y)f=[l.pop(),...f];else break}return[l,f]},[[],[...p]]),K((l,f)=>l[0]===f[0]&&l[1]===f[1])))))).pipe(m(([s,p])=>({prev:s.map(([c])=>c),next:p.map(([c])=>c)})),Q({prev:[],next:[]}),Be(2,1),m(([s,p])=>s.prev.length{let i=new g,a=i.pipe(Z(),ie(!0));if(i.subscribe(({prev:s,next:p})=>{for(let[c]of p)c.classList.remove("md-nav__link--passed"),c.classList.remove("md-nav__link--active");for(let[c,[l]]of s.entries())l.classList.add("md-nav__link--passed"),l.classList.toggle("md-nav__link--active",c===s.length-1)}),B("toc.follow")){let 
s=O(t.pipe(_e(1),m(()=>{})),t.pipe(_e(250),m(()=>"smooth")));i.pipe(b(({prev:p})=>p.length>0),He(o.pipe(ve(se))),re(s)).subscribe(([[{prev:p}],c])=>{let[l]=p[p.length-1];if(l.offsetHeight){let f=cr(l);if(typeof f!="undefined"){let u=l.offsetTop-f.offsetTop,{height:d}=ce(f);f.scrollTo({top:u-d/2,behavior:c})}}})}return B("navigation.tracking")&&t.pipe(W(a),ee("offset"),_e(250),Ce(1),W(n.pipe(Ce(1))),ct({delay:250}),re(i)).subscribe(([,{prev:s}])=>{let p=ye(),c=s[s.length-1];if(c&&c.length){let[l]=c,{hash:f}=new URL(l.href);p.hash!==f&&(p.hash=f,history.replaceState({},"",`${p}`))}else p.hash="",history.replaceState({},"",`${p}`)}),bs(e,{viewport$:t,header$:r}).pipe(w(s=>i.next(s)),_(()=>i.complete()),m(s=>$({ref:e},s)))})}function vs(e,{viewport$:t,main$:r,target$:o}){let n=t.pipe(m(({offset:{y:a}})=>a),Be(2,1),m(([a,s])=>a>s&&s>0),K()),i=r.pipe(m(({active:a})=>a));return z([i,n]).pipe(m(([a,s])=>!(a&&s)),K(),W(o.pipe(Ce(1))),ie(!0),ct({delay:250}),m(a=>({hidden:a})))}function Ei(e,{viewport$:t,header$:r,main$:o,target$:n}){let i=new g,a=i.pipe(Z(),ie(!0));return i.subscribe({next({hidden:s}){e.hidden=s,s?(e.setAttribute("tabindex","-1"),e.blur()):e.removeAttribute("tabindex")},complete(){e.style.top="",e.hidden=!0,e.removeAttribute("tabindex")}}),r.pipe(W(a),ee("height")).subscribe(({height:s})=>{e.style.top=`${s+16}px`}),h(e,"click").subscribe(s=>{s.preventDefault(),window.scrollTo({top:0})}),vs(e,{viewport$:t,main$:o,target$:n}).pipe(w(s=>i.next(s)),_(()=>i.complete()),m(s=>$({ref:e},s)))}function wi({document$:e,viewport$:t}){e.pipe(v(()=>P(".md-ellipsis")),ne(r=>tt(r).pipe(W(e.pipe(Ce(1))),b(o=>o),m(()=>r),Te(1))),b(r=>r.offsetWidth{let o=r.innerText,n=r.closest("a")||r;return n.title=o,B("content.tooltips")?mt(n,{viewport$:t}).pipe(W(e.pipe(Ce(1))),_(()=>n.removeAttribute("title"))):S})).subscribe(),B("content.tooltips")&&e.pipe(v(()=>P(".md-status")),ne(r=>mt(r,{viewport$:t}))).subscribe()}function 
Ti({document$:e,tablet$:t}){e.pipe(v(()=>P(".md-toggle--indeterminate")),w(r=>{r.indeterminate=!0,r.checked=!1}),ne(r=>h(r,"change").pipe(Dr(()=>r.classList.contains("md-toggle--indeterminate")),m(()=>r))),re(t)).subscribe(([r,o])=>{r.classList.remove("md-toggle--indeterminate"),o&&(r.checked=!1)})}function gs(){return/(iPad|iPhone|iPod)/.test(navigator.userAgent)}function Si({document$:e}){e.pipe(v(()=>P("[data-md-scrollfix]")),w(t=>t.removeAttribute("data-md-scrollfix")),b(gs),ne(t=>h(t,"touchstart").pipe(m(()=>t)))).subscribe(t=>{let r=t.scrollTop;r===0?t.scrollTop=1:r+t.offsetHeight===t.scrollHeight&&(t.scrollTop=r-1)})}function Oi({viewport$:e,tablet$:t}){z([ze("search"),t]).pipe(m(([r,o])=>r&&!o),v(r=>I(r).pipe(Ge(r?400:100))),re(e)).subscribe(([r,{offset:{y:o}}])=>{if(r)document.body.setAttribute("data-md-scrolllock",""),document.body.style.top=`-${o}px`;else{let n=-1*parseInt(document.body.style.top,10);document.body.removeAttribute("data-md-scrolllock"),document.body.style.top="",n&&window.scrollTo(0,n)}})}Object.entries||(Object.entries=function(e){let t=[];for(let r of Object.keys(e))t.push([r,e[r]]);return t});Object.values||(Object.values=function(e){let t=[];for(let r of Object.keys(e))t.push(e[r]);return t});typeof Element!="undefined"&&(Element.prototype.scrollTo||(Element.prototype.scrollTo=function(e,t){typeof e=="object"?(this.scrollLeft=e.left,this.scrollTop=e.top):(this.scrollLeft=e,this.scrollTop=t)}),Element.prototype.replaceWith||(Element.prototype.replaceWith=function(...e){let t=this.parentNode;if(t){e.length===0&&t.removeChild(this);for(let r=e.length-1;r>=0;r--){let o=e[r];typeof o=="string"?o=document.createTextNode(o):o.parentNode&&o.parentNode.removeChild(o),r?t.insertBefore(this.previousSibling,o):t.replaceChild(o,this)}}}));function ys(){return location.protocol==="file:"?Tt(`${new URL("search/search_index.js",eo.base)}`).pipe(m(()=>__index),G(1)):je(new 
URL("search/search_index.json",eo.base))}document.documentElement.classList.remove("no-js");document.documentElement.classList.add("js");var ot=Go(),Ut=sn(),Lt=ln(Ut),to=an(),Oe=gn(),hr=Pt("(min-width: 960px)"),Mi=Pt("(min-width: 1220px)"),_i=mn(),eo=xe(),Ai=document.forms.namedItem("search")?ys():Ye,ro=new g;Zn({alert$:ro});var oo=new g;B("navigation.instant")&&oi({location$:Ut,viewport$:Oe,progress$:oo}).subscribe(ot);var Li;((Li=eo.version)==null?void 0:Li.provider)==="mike"&&ci({document$:ot});O(Ut,Lt).pipe(Ge(125)).subscribe(()=>{Je("drawer",!1),Je("search",!1)});to.pipe(b(({mode:e})=>e==="global")).subscribe(e=>{switch(e.type){case"p":case",":let t=fe("link[rel=prev]");typeof t!="undefined"&<(t);break;case"n":case".":let r=fe("link[rel=next]");typeof r!="undefined"&<(r);break;case"Enter":let o=Ie();o instanceof HTMLLabelElement&&o.click()}});wi({viewport$:Oe,document$:ot});Ti({document$:ot,tablet$:hr});Si({document$:ot});Oi({viewport$:Oe,tablet$:hr});var rt=Kn(Se("header"),{viewport$:Oe}),Ft=ot.pipe(m(()=>Se("main")),v(e=>Gn(e,{viewport$:Oe,header$:rt})),G(1)),xs=O(...ae("consent").map(e=>En(e,{target$:Lt})),...ae("dialog").map(e=>qn(e,{alert$:ro})),...ae("palette").map(e=>Jn(e)),...ae("progress").map(e=>Xn(e,{progress$:oo})),...ae("search").map(e=>ui(e,{index$:Ai,keyboard$:to})),...ae("source").map(e=>gi(e))),Es=C(()=>O(...ae("announce").map(e=>xn(e)),...ae("content").map(e=>zn(e,{viewport$:Oe,target$:Lt,print$:_i})),...ae("content").map(e=>B("search.highlight")?di(e,{index$:Ai,location$:Ut}):S),...ae("header").map(e=>Yn(e,{viewport$:Oe,header$:rt,main$:Ft})),...ae("header-title").map(e=>Bn(e,{viewport$:Oe,header$:rt})),...ae("sidebar").map(e=>e.getAttribute("data-md-type")==="navigation"?Nr(Mi,()=>Zr(e,{viewport$:Oe,header$:rt,main$:Ft})):Nr(hr,()=>Zr(e,{viewport$:Oe,header$:rt,main$:Ft}))),...ae("tabs").map(e=>yi(e,{viewport$:Oe,header$:rt})),...ae("toc").map(e=>xi(e,{viewport$:Oe,header$:rt,main$:Ft,target$:Lt})),...ae("top").map(e=>Ei(e,{viewport$:Oe,head
er$:rt,main$:Ft,target$:Lt})))),Ci=ot.pipe(v(()=>Es),Re(xs),G(1));Ci.subscribe();window.document$=ot;window.location$=Ut;window.target$=Lt;window.keyboard$=to;window.viewport$=Oe;window.tablet$=hr;window.screen$=Mi;window.print$=_i;window.alert$=ro;window.progress$=oo;window.component$=Ci;})(); +//# sourceMappingURL=bundle.83f73b43.min.js.map + diff --git a/assets/javascripts/bundle.83f73b43.min.js.map b/assets/javascripts/bundle.83f73b43.min.js.map new file mode 100644 index 00000000..fe920b7d --- /dev/null +++ b/assets/javascripts/bundle.83f73b43.min.js.map @@ -0,0 +1,7 @@ +{ + "version": 3, + "sources": ["node_modules/focus-visible/dist/focus-visible.js", "node_modules/escape-html/index.js", "node_modules/clipboard/dist/clipboard.js", "src/templates/assets/javascripts/bundle.ts", "node_modules/tslib/tslib.es6.mjs", "node_modules/rxjs/src/internal/util/isFunction.ts", "node_modules/rxjs/src/internal/util/createErrorClass.ts", "node_modules/rxjs/src/internal/util/UnsubscriptionError.ts", "node_modules/rxjs/src/internal/util/arrRemove.ts", "node_modules/rxjs/src/internal/Subscription.ts", "node_modules/rxjs/src/internal/config.ts", "node_modules/rxjs/src/internal/scheduler/timeoutProvider.ts", "node_modules/rxjs/src/internal/util/reportUnhandledError.ts", "node_modules/rxjs/src/internal/util/noop.ts", "node_modules/rxjs/src/internal/NotificationFactories.ts", "node_modules/rxjs/src/internal/util/errorContext.ts", "node_modules/rxjs/src/internal/Subscriber.ts", "node_modules/rxjs/src/internal/symbol/observable.ts", "node_modules/rxjs/src/internal/util/identity.ts", "node_modules/rxjs/src/internal/util/pipe.ts", "node_modules/rxjs/src/internal/Observable.ts", "node_modules/rxjs/src/internal/util/lift.ts", "node_modules/rxjs/src/internal/operators/OperatorSubscriber.ts", "node_modules/rxjs/src/internal/scheduler/animationFrameProvider.ts", "node_modules/rxjs/src/internal/util/ObjectUnsubscribedError.ts", "node_modules/rxjs/src/internal/Subject.ts", 
"node_modules/rxjs/src/internal/BehaviorSubject.ts", "node_modules/rxjs/src/internal/scheduler/dateTimestampProvider.ts", "node_modules/rxjs/src/internal/ReplaySubject.ts", "node_modules/rxjs/src/internal/scheduler/Action.ts", "node_modules/rxjs/src/internal/scheduler/intervalProvider.ts", "node_modules/rxjs/src/internal/scheduler/AsyncAction.ts", "node_modules/rxjs/src/internal/Scheduler.ts", "node_modules/rxjs/src/internal/scheduler/AsyncScheduler.ts", "node_modules/rxjs/src/internal/scheduler/async.ts", "node_modules/rxjs/src/internal/scheduler/QueueAction.ts", "node_modules/rxjs/src/internal/scheduler/QueueScheduler.ts", "node_modules/rxjs/src/internal/scheduler/queue.ts", "node_modules/rxjs/src/internal/scheduler/AnimationFrameAction.ts", "node_modules/rxjs/src/internal/scheduler/AnimationFrameScheduler.ts", "node_modules/rxjs/src/internal/scheduler/animationFrame.ts", "node_modules/rxjs/src/internal/observable/empty.ts", "node_modules/rxjs/src/internal/util/isScheduler.ts", "node_modules/rxjs/src/internal/util/args.ts", "node_modules/rxjs/src/internal/util/isArrayLike.ts", "node_modules/rxjs/src/internal/util/isPromise.ts", "node_modules/rxjs/src/internal/util/isInteropObservable.ts", "node_modules/rxjs/src/internal/util/isAsyncIterable.ts", "node_modules/rxjs/src/internal/util/throwUnobservableError.ts", "node_modules/rxjs/src/internal/symbol/iterator.ts", "node_modules/rxjs/src/internal/util/isIterable.ts", "node_modules/rxjs/src/internal/util/isReadableStreamLike.ts", "node_modules/rxjs/src/internal/observable/innerFrom.ts", "node_modules/rxjs/src/internal/util/executeSchedule.ts", "node_modules/rxjs/src/internal/operators/observeOn.ts", "node_modules/rxjs/src/internal/operators/subscribeOn.ts", "node_modules/rxjs/src/internal/scheduled/scheduleObservable.ts", "node_modules/rxjs/src/internal/scheduled/schedulePromise.ts", "node_modules/rxjs/src/internal/scheduled/scheduleArray.ts", "node_modules/rxjs/src/internal/scheduled/scheduleIterable.ts", 
"node_modules/rxjs/src/internal/scheduled/scheduleAsyncIterable.ts", "node_modules/rxjs/src/internal/scheduled/scheduleReadableStreamLike.ts", "node_modules/rxjs/src/internal/scheduled/scheduled.ts", "node_modules/rxjs/src/internal/observable/from.ts", "node_modules/rxjs/src/internal/observable/of.ts", "node_modules/rxjs/src/internal/observable/throwError.ts", "node_modules/rxjs/src/internal/util/EmptyError.ts", "node_modules/rxjs/src/internal/util/isDate.ts", "node_modules/rxjs/src/internal/operators/map.ts", "node_modules/rxjs/src/internal/util/mapOneOrManyArgs.ts", "node_modules/rxjs/src/internal/util/argsArgArrayOrObject.ts", "node_modules/rxjs/src/internal/util/createObject.ts", "node_modules/rxjs/src/internal/observable/combineLatest.ts", "node_modules/rxjs/src/internal/operators/mergeInternals.ts", "node_modules/rxjs/src/internal/operators/mergeMap.ts", "node_modules/rxjs/src/internal/operators/mergeAll.ts", "node_modules/rxjs/src/internal/operators/concatAll.ts", "node_modules/rxjs/src/internal/observable/concat.ts", "node_modules/rxjs/src/internal/observable/defer.ts", "node_modules/rxjs/src/internal/observable/fromEvent.ts", "node_modules/rxjs/src/internal/observable/fromEventPattern.ts", "node_modules/rxjs/src/internal/observable/timer.ts", "node_modules/rxjs/src/internal/observable/merge.ts", "node_modules/rxjs/src/internal/observable/never.ts", "node_modules/rxjs/src/internal/util/argsOrArgArray.ts", "node_modules/rxjs/src/internal/operators/filter.ts", "node_modules/rxjs/src/internal/observable/zip.ts", "node_modules/rxjs/src/internal/operators/audit.ts", "node_modules/rxjs/src/internal/operators/auditTime.ts", "node_modules/rxjs/src/internal/operators/bufferCount.ts", "node_modules/rxjs/src/internal/operators/catchError.ts", "node_modules/rxjs/src/internal/operators/scanInternals.ts", "node_modules/rxjs/src/internal/operators/combineLatest.ts", "node_modules/rxjs/src/internal/operators/combineLatestWith.ts", 
"node_modules/rxjs/src/internal/operators/debounce.ts", "node_modules/rxjs/src/internal/operators/debounceTime.ts", "node_modules/rxjs/src/internal/operators/defaultIfEmpty.ts", "node_modules/rxjs/src/internal/operators/take.ts", "node_modules/rxjs/src/internal/operators/ignoreElements.ts", "node_modules/rxjs/src/internal/operators/mapTo.ts", "node_modules/rxjs/src/internal/operators/delayWhen.ts", "node_modules/rxjs/src/internal/operators/delay.ts", "node_modules/rxjs/src/internal/operators/distinctUntilChanged.ts", "node_modules/rxjs/src/internal/operators/distinctUntilKeyChanged.ts", "node_modules/rxjs/src/internal/operators/throwIfEmpty.ts", "node_modules/rxjs/src/internal/operators/endWith.ts", "node_modules/rxjs/src/internal/operators/finalize.ts", "node_modules/rxjs/src/internal/operators/first.ts", "node_modules/rxjs/src/internal/operators/takeLast.ts", "node_modules/rxjs/src/internal/operators/merge.ts", "node_modules/rxjs/src/internal/operators/mergeWith.ts", "node_modules/rxjs/src/internal/operators/repeat.ts", "node_modules/rxjs/src/internal/operators/scan.ts", "node_modules/rxjs/src/internal/operators/share.ts", "node_modules/rxjs/src/internal/operators/shareReplay.ts", "node_modules/rxjs/src/internal/operators/skip.ts", "node_modules/rxjs/src/internal/operators/skipUntil.ts", "node_modules/rxjs/src/internal/operators/startWith.ts", "node_modules/rxjs/src/internal/operators/switchMap.ts", "node_modules/rxjs/src/internal/operators/takeUntil.ts", "node_modules/rxjs/src/internal/operators/takeWhile.ts", "node_modules/rxjs/src/internal/operators/tap.ts", "node_modules/rxjs/src/internal/operators/throttle.ts", "node_modules/rxjs/src/internal/operators/throttleTime.ts", "node_modules/rxjs/src/internal/operators/withLatestFrom.ts", "node_modules/rxjs/src/internal/operators/zip.ts", "node_modules/rxjs/src/internal/operators/zipWith.ts", "src/templates/assets/javascripts/browser/document/index.ts", "src/templates/assets/javascripts/browser/element/_/index.ts", 
"src/templates/assets/javascripts/browser/element/focus/index.ts", "src/templates/assets/javascripts/browser/element/hover/index.ts", "src/templates/assets/javascripts/utilities/h/index.ts", "src/templates/assets/javascripts/utilities/round/index.ts", "src/templates/assets/javascripts/browser/script/index.ts", "src/templates/assets/javascripts/browser/element/size/_/index.ts", "src/templates/assets/javascripts/browser/element/size/content/index.ts", "src/templates/assets/javascripts/browser/element/offset/_/index.ts", "src/templates/assets/javascripts/browser/element/offset/content/index.ts", "src/templates/assets/javascripts/browser/element/visibility/index.ts", "src/templates/assets/javascripts/browser/toggle/index.ts", "src/templates/assets/javascripts/browser/keyboard/index.ts", "src/templates/assets/javascripts/browser/location/_/index.ts", "src/templates/assets/javascripts/browser/location/hash/index.ts", "src/templates/assets/javascripts/browser/media/index.ts", "src/templates/assets/javascripts/browser/request/index.ts", "src/templates/assets/javascripts/browser/viewport/offset/index.ts", "src/templates/assets/javascripts/browser/viewport/size/index.ts", "src/templates/assets/javascripts/browser/viewport/_/index.ts", "src/templates/assets/javascripts/browser/viewport/at/index.ts", "src/templates/assets/javascripts/browser/worker/index.ts", "src/templates/assets/javascripts/_/index.ts", "src/templates/assets/javascripts/components/_/index.ts", "src/templates/assets/javascripts/components/announce/index.ts", "src/templates/assets/javascripts/components/consent/index.ts", "src/templates/assets/javascripts/templates/tooltip/index.tsx", "src/templates/assets/javascripts/templates/annotation/index.tsx", "src/templates/assets/javascripts/templates/clipboard/index.tsx", "src/templates/assets/javascripts/templates/search/index.tsx", "src/templates/assets/javascripts/templates/source/index.tsx", "src/templates/assets/javascripts/templates/tabbed/index.tsx", 
"src/templates/assets/javascripts/templates/table/index.tsx", "src/templates/assets/javascripts/templates/version/index.tsx", "src/templates/assets/javascripts/components/tooltip2/index.ts", "src/templates/assets/javascripts/components/content/annotation/_/index.ts", "src/templates/assets/javascripts/components/content/annotation/list/index.ts", "src/templates/assets/javascripts/components/content/annotation/block/index.ts", "src/templates/assets/javascripts/components/content/code/_/index.ts", "src/templates/assets/javascripts/components/content/details/index.ts", "src/templates/assets/javascripts/components/content/mermaid/index.css", "src/templates/assets/javascripts/components/content/mermaid/index.ts", "src/templates/assets/javascripts/components/content/table/index.ts", "src/templates/assets/javascripts/components/content/tabs/index.ts", "src/templates/assets/javascripts/components/content/_/index.ts", "src/templates/assets/javascripts/components/dialog/index.ts", "src/templates/assets/javascripts/components/tooltip/index.ts", "src/templates/assets/javascripts/components/header/_/index.ts", "src/templates/assets/javascripts/components/header/title/index.ts", "src/templates/assets/javascripts/components/main/index.ts", "src/templates/assets/javascripts/components/palette/index.ts", "src/templates/assets/javascripts/components/progress/index.ts", "src/templates/assets/javascripts/integrations/clipboard/index.ts", "src/templates/assets/javascripts/integrations/sitemap/index.ts", "src/templates/assets/javascripts/integrations/instant/index.ts", "src/templates/assets/javascripts/integrations/search/highlighter/index.ts", "src/templates/assets/javascripts/integrations/search/worker/message/index.ts", "src/templates/assets/javascripts/integrations/search/worker/_/index.ts", "src/templates/assets/javascripts/integrations/version/findurl/index.ts", "src/templates/assets/javascripts/integrations/version/index.ts", 
"src/templates/assets/javascripts/components/search/query/index.ts", "src/templates/assets/javascripts/components/search/result/index.ts", "src/templates/assets/javascripts/components/search/share/index.ts", "src/templates/assets/javascripts/components/search/suggest/index.ts", "src/templates/assets/javascripts/components/search/_/index.ts", "src/templates/assets/javascripts/components/search/highlight/index.ts", "src/templates/assets/javascripts/components/sidebar/index.ts", "src/templates/assets/javascripts/components/source/facts/github/index.ts", "src/templates/assets/javascripts/components/source/facts/gitlab/index.ts", "src/templates/assets/javascripts/components/source/facts/_/index.ts", "src/templates/assets/javascripts/components/source/_/index.ts", "src/templates/assets/javascripts/components/tabs/index.ts", "src/templates/assets/javascripts/components/toc/index.ts", "src/templates/assets/javascripts/components/top/index.ts", "src/templates/assets/javascripts/patches/ellipsis/index.ts", "src/templates/assets/javascripts/patches/indeterminate/index.ts", "src/templates/assets/javascripts/patches/scrollfix/index.ts", "src/templates/assets/javascripts/patches/scrolllock/index.ts", "src/templates/assets/javascripts/polyfills/index.ts"], + "sourcesContent": ["(function (global, factory) {\n typeof exports === 'object' && typeof module !== 'undefined' ? factory() :\n typeof define === 'function' && define.amd ? 
define(factory) :\n (factory());\n}(this, (function () { 'use strict';\n\n /**\n * Applies the :focus-visible polyfill at the given scope.\n * A scope in this case is either the top-level Document or a Shadow Root.\n *\n * @param {(Document|ShadowRoot)} scope\n * @see https://github.com/WICG/focus-visible\n */\n function applyFocusVisiblePolyfill(scope) {\n var hadKeyboardEvent = true;\n var hadFocusVisibleRecently = false;\n var hadFocusVisibleRecentlyTimeout = null;\n\n var inputTypesAllowlist = {\n text: true,\n search: true,\n url: true,\n tel: true,\n email: true,\n password: true,\n number: true,\n date: true,\n month: true,\n week: true,\n time: true,\n datetime: true,\n 'datetime-local': true\n };\n\n /**\n * Helper function for legacy browsers and iframes which sometimes focus\n * elements like document, body, and non-interactive SVG.\n * @param {Element} el\n */\n function isValidFocusTarget(el) {\n if (\n el &&\n el !== document &&\n el.nodeName !== 'HTML' &&\n el.nodeName !== 'BODY' &&\n 'classList' in el &&\n 'contains' in el.classList\n ) {\n return true;\n }\n return false;\n }\n\n /**\n * Computes whether the given element should automatically trigger the\n * `focus-visible` class being added, i.e. 
whether it should always match\n * `:focus-visible` when focused.\n * @param {Element} el\n * @return {boolean}\n */\n function focusTriggersKeyboardModality(el) {\n var type = el.type;\n var tagName = el.tagName;\n\n if (tagName === 'INPUT' && inputTypesAllowlist[type] && !el.readOnly) {\n return true;\n }\n\n if (tagName === 'TEXTAREA' && !el.readOnly) {\n return true;\n }\n\n if (el.isContentEditable) {\n return true;\n }\n\n return false;\n }\n\n /**\n * Add the `focus-visible` class to the given element if it was not added by\n * the author.\n * @param {Element} el\n */\n function addFocusVisibleClass(el) {\n if (el.classList.contains('focus-visible')) {\n return;\n }\n el.classList.add('focus-visible');\n el.setAttribute('data-focus-visible-added', '');\n }\n\n /**\n * Remove the `focus-visible` class from the given element if it was not\n * originally added by the author.\n * @param {Element} el\n */\n function removeFocusVisibleClass(el) {\n if (!el.hasAttribute('data-focus-visible-added')) {\n return;\n }\n el.classList.remove('focus-visible');\n el.removeAttribute('data-focus-visible-added');\n }\n\n /**\n * If the most recent user interaction was via the keyboard;\n * and the key press did not include a meta, alt/option, or control key;\n * then the modality is keyboard. 
Otherwise, the modality is not keyboard.\n * Apply `focus-visible` to any current active element and keep track\n * of our keyboard modality state with `hadKeyboardEvent`.\n * @param {KeyboardEvent} e\n */\n function onKeyDown(e) {\n if (e.metaKey || e.altKey || e.ctrlKey) {\n return;\n }\n\n if (isValidFocusTarget(scope.activeElement)) {\n addFocusVisibleClass(scope.activeElement);\n }\n\n hadKeyboardEvent = true;\n }\n\n /**\n * If at any point a user clicks with a pointing device, ensure that we change\n * the modality away from keyboard.\n * This avoids the situation where a user presses a key on an already focused\n * element, and then clicks on a different element, focusing it with a\n * pointing device, while we still think we're in keyboard modality.\n * @param {Event} e\n */\n function onPointerDown(e) {\n hadKeyboardEvent = false;\n }\n\n /**\n * On `focus`, add the `focus-visible` class to the target if:\n * - the target received focus as a result of keyboard navigation, or\n * - the event target is an element that will likely require interaction\n * via the keyboard (e.g. 
a text box)\n * @param {Event} e\n */\n function onFocus(e) {\n // Prevent IE from focusing the document or HTML element.\n if (!isValidFocusTarget(e.target)) {\n return;\n }\n\n if (hadKeyboardEvent || focusTriggersKeyboardModality(e.target)) {\n addFocusVisibleClass(e.target);\n }\n }\n\n /**\n * On `blur`, remove the `focus-visible` class from the target.\n * @param {Event} e\n */\n function onBlur(e) {\n if (!isValidFocusTarget(e.target)) {\n return;\n }\n\n if (\n e.target.classList.contains('focus-visible') ||\n e.target.hasAttribute('data-focus-visible-added')\n ) {\n // To detect a tab/window switch, we look for a blur event followed\n // rapidly by a visibility change.\n // If we don't see a visibility change within 100ms, it's probably a\n // regular focus change.\n hadFocusVisibleRecently = true;\n window.clearTimeout(hadFocusVisibleRecentlyTimeout);\n hadFocusVisibleRecentlyTimeout = window.setTimeout(function() {\n hadFocusVisibleRecently = false;\n }, 100);\n removeFocusVisibleClass(e.target);\n }\n }\n\n /**\n * If the user changes tabs, keep track of whether or not the previously\n * focused element had .focus-visible.\n * @param {Event} e\n */\n function onVisibilityChange(e) {\n if (document.visibilityState === 'hidden') {\n // If the tab becomes active again, the browser will handle calling focus\n // on the element (Safari actually calls it twice).\n // If this tab change caused a blur on an element with focus-visible,\n // re-apply the class when the user switches back to the tab.\n if (hadFocusVisibleRecently) {\n hadKeyboardEvent = true;\n }\n addInitialPointerMoveListeners();\n }\n }\n\n /**\n * Add a group of listeners to detect usage of any pointing devices.\n * These listeners will be added when the polyfill first loads, and anytime\n * the window is blurred, so that they are active when the window regains\n * focus.\n */\n function addInitialPointerMoveListeners() {\n document.addEventListener('mousemove', onInitialPointerMove);\n 
document.addEventListener('mousedown', onInitialPointerMove);\n document.addEventListener('mouseup', onInitialPointerMove);\n document.addEventListener('pointermove', onInitialPointerMove);\n document.addEventListener('pointerdown', onInitialPointerMove);\n document.addEventListener('pointerup', onInitialPointerMove);\n document.addEventListener('touchmove', onInitialPointerMove);\n document.addEventListener('touchstart', onInitialPointerMove);\n document.addEventListener('touchend', onInitialPointerMove);\n }\n\n function removeInitialPointerMoveListeners() {\n document.removeEventListener('mousemove', onInitialPointerMove);\n document.removeEventListener('mousedown', onInitialPointerMove);\n document.removeEventListener('mouseup', onInitialPointerMove);\n document.removeEventListener('pointermove', onInitialPointerMove);\n document.removeEventListener('pointerdown', onInitialPointerMove);\n document.removeEventListener('pointerup', onInitialPointerMove);\n document.removeEventListener('touchmove', onInitialPointerMove);\n document.removeEventListener('touchstart', onInitialPointerMove);\n document.removeEventListener('touchend', onInitialPointerMove);\n }\n\n /**\n * When the polfyill first loads, assume the user is in keyboard modality.\n * If any event is received from a pointing device (e.g. mouse, pointer,\n * touch), turn off keyboard modality.\n * This accounts for situations where focus enters the page from the URL bar.\n * @param {Event} e\n */\n function onInitialPointerMove(e) {\n // Work around a Safari quirk that fires a mousemove on whenever the\n // window blurs, even if you're tabbing out of the page. \u00AF\\_(\u30C4)_/\u00AF\n if (e.target.nodeName && e.target.nodeName.toLowerCase() === 'html') {\n return;\n }\n\n hadKeyboardEvent = false;\n removeInitialPointerMoveListeners();\n }\n\n // For some kinds of state, we are interested in changes at the global scope\n // only. 
For example, global pointer input, global key presses and global\n // visibility change should affect the state at every scope:\n document.addEventListener('keydown', onKeyDown, true);\n document.addEventListener('mousedown', onPointerDown, true);\n document.addEventListener('pointerdown', onPointerDown, true);\n document.addEventListener('touchstart', onPointerDown, true);\n document.addEventListener('visibilitychange', onVisibilityChange, true);\n\n addInitialPointerMoveListeners();\n\n // For focus and blur, we specifically care about state changes in the local\n // scope. This is because focus / blur events that originate from within a\n // shadow root are not re-dispatched from the host element if it was already\n // the active element in its own scope:\n scope.addEventListener('focus', onFocus, true);\n scope.addEventListener('blur', onBlur, true);\n\n // We detect that a node is a ShadowRoot by ensuring that it is a\n // DocumentFragment and also has a host property. This check covers native\n // implementation and polyfill implementation transparently. If we only cared\n // about the native implementation, we could just check if the scope was\n // an instance of a ShadowRoot.\n if (scope.nodeType === Node.DOCUMENT_FRAGMENT_NODE && scope.host) {\n // Since a ShadowRoot is a special kind of DocumentFragment, it does not\n // have a root element to add a class to. 
So, we add this attribute to the\n // host element instead:\n scope.host.setAttribute('data-js-focus-visible', '');\n } else if (scope.nodeType === Node.DOCUMENT_NODE) {\n document.documentElement.classList.add('js-focus-visible');\n document.documentElement.setAttribute('data-js-focus-visible', '');\n }\n }\n\n // It is important to wrap all references to global window and document in\n // these checks to support server-side rendering use cases\n // @see https://github.com/WICG/focus-visible/issues/199\n if (typeof window !== 'undefined' && typeof document !== 'undefined') {\n // Make the polyfill helper globally available. This can be used as a signal\n // to interested libraries that wish to coordinate with the polyfill for e.g.,\n // applying the polyfill to a shadow root:\n window.applyFocusVisiblePolyfill = applyFocusVisiblePolyfill;\n\n // Notify interested libraries of the polyfill's presence, in case the\n // polyfill was loaded lazily:\n var event;\n\n try {\n event = new CustomEvent('focus-visible-polyfill-ready');\n } catch (error) {\n // IE11 does not support using CustomEvent as a constructor directly:\n event = document.createEvent('CustomEvent');\n event.initCustomEvent('focus-visible-polyfill-ready', false, false, {});\n }\n\n window.dispatchEvent(event);\n }\n\n if (typeof document !== 'undefined') {\n // Apply the polyfill to the global document, so that no JavaScript\n // coordination is required to use the polyfill in the top-level document:\n applyFocusVisiblePolyfill(document);\n }\n\n})));\n", "/*!\n * escape-html\n * Copyright(c) 2012-2013 TJ Holowaychuk\n * Copyright(c) 2015 Andreas Lubbe\n * Copyright(c) 2015 Tiancheng \"Timothy\" Gu\n * MIT Licensed\n */\n\n'use strict';\n\n/**\n * Module variables.\n * @private\n */\n\nvar matchHtmlRegExp = /[\"'&<>]/;\n\n/**\n * Module exports.\n * @public\n */\n\nmodule.exports = escapeHtml;\n\n/**\n * Escape special characters in the given string of html.\n *\n * @param {string} string The string to 
escape for inserting into HTML\n * @return {string}\n * @public\n */\n\nfunction escapeHtml(string) {\n var str = '' + string;\n var match = matchHtmlRegExp.exec(str);\n\n if (!match) {\n return str;\n }\n\n var escape;\n var html = '';\n var index = 0;\n var lastIndex = 0;\n\n for (index = match.index; index < str.length; index++) {\n switch (str.charCodeAt(index)) {\n case 34: // \"\n escape = '"';\n break;\n case 38: // &\n escape = '&';\n break;\n case 39: // '\n escape = ''';\n break;\n case 60: // <\n escape = '<';\n break;\n case 62: // >\n escape = '>';\n break;\n default:\n continue;\n }\n\n if (lastIndex !== index) {\n html += str.substring(lastIndex, index);\n }\n\n lastIndex = index + 1;\n html += escape;\n }\n\n return lastIndex !== index\n ? html + str.substring(lastIndex, index)\n : html;\n}\n", "/*!\n * clipboard.js v2.0.11\n * https://clipboardjs.com/\n *\n * Licensed MIT \u00A9 Zeno Rocha\n */\n(function webpackUniversalModuleDefinition(root, factory) {\n\tif(typeof exports === 'object' && typeof module === 'object')\n\t\tmodule.exports = factory();\n\telse if(typeof define === 'function' && define.amd)\n\t\tdefine([], factory);\n\telse if(typeof exports === 'object')\n\t\texports[\"ClipboardJS\"] = factory();\n\telse\n\t\troot[\"ClipboardJS\"] = factory();\n})(this, function() {\nreturn /******/ (function() { // webpackBootstrap\n/******/ \tvar __webpack_modules__ = ({\n\n/***/ 686:\n/***/ (function(__unused_webpack_module, __webpack_exports__, __webpack_require__) {\n\n\"use strict\";\n\n// EXPORTS\n__webpack_require__.d(__webpack_exports__, {\n \"default\": function() { return /* binding */ clipboard; }\n});\n\n// EXTERNAL MODULE: ./node_modules/tiny-emitter/index.js\nvar tiny_emitter = __webpack_require__(279);\nvar tiny_emitter_default = /*#__PURE__*/__webpack_require__.n(tiny_emitter);\n// EXTERNAL MODULE: ./node_modules/good-listener/src/listen.js\nvar listen = __webpack_require__(370);\nvar listen_default = 
/*#__PURE__*/__webpack_require__.n(listen);\n// EXTERNAL MODULE: ./node_modules/select/src/select.js\nvar src_select = __webpack_require__(817);\nvar select_default = /*#__PURE__*/__webpack_require__.n(src_select);\n;// CONCATENATED MODULE: ./src/common/command.js\n/**\n * Executes a given operation type.\n * @param {String} type\n * @return {Boolean}\n */\nfunction command(type) {\n try {\n return document.execCommand(type);\n } catch (err) {\n return false;\n }\n}\n;// CONCATENATED MODULE: ./src/actions/cut.js\n\n\n/**\n * Cut action wrapper.\n * @param {String|HTMLElement} target\n * @return {String}\n */\n\nvar ClipboardActionCut = function ClipboardActionCut(target) {\n var selectedText = select_default()(target);\n command('cut');\n return selectedText;\n};\n\n/* harmony default export */ var actions_cut = (ClipboardActionCut);\n;// CONCATENATED MODULE: ./src/common/create-fake-element.js\n/**\n * Creates a fake textarea element with a value.\n * @param {String} value\n * @return {HTMLElement}\n */\nfunction createFakeElement(value) {\n var isRTL = document.documentElement.getAttribute('dir') === 'rtl';\n var fakeElement = document.createElement('textarea'); // Prevent zooming on iOS\n\n fakeElement.style.fontSize = '12pt'; // Reset box model\n\n fakeElement.style.border = '0';\n fakeElement.style.padding = '0';\n fakeElement.style.margin = '0'; // Move element out of screen horizontally\n\n fakeElement.style.position = 'absolute';\n fakeElement.style[isRTL ? 
'right' : 'left'] = '-9999px'; // Move element to the same position vertically\n\n var yPosition = window.pageYOffset || document.documentElement.scrollTop;\n fakeElement.style.top = \"\".concat(yPosition, \"px\");\n fakeElement.setAttribute('readonly', '');\n fakeElement.value = value;\n return fakeElement;\n}\n;// CONCATENATED MODULE: ./src/actions/copy.js\n\n\n\n/**\n * Create fake copy action wrapper using a fake element.\n * @param {String} target\n * @param {Object} options\n * @return {String}\n */\n\nvar fakeCopyAction = function fakeCopyAction(value, options) {\n var fakeElement = createFakeElement(value);\n options.container.appendChild(fakeElement);\n var selectedText = select_default()(fakeElement);\n command('copy');\n fakeElement.remove();\n return selectedText;\n};\n/**\n * Copy action wrapper.\n * @param {String|HTMLElement} target\n * @param {Object} options\n * @return {String}\n */\n\n\nvar ClipboardActionCopy = function ClipboardActionCopy(target) {\n var options = arguments.length > 1 && arguments[1] !== undefined ? arguments[1] : {\n container: document.body\n };\n var selectedText = '';\n\n if (typeof target === 'string') {\n selectedText = fakeCopyAction(target, options);\n } else if (target instanceof HTMLInputElement && !['text', 'search', 'url', 'tel', 'password'].includes(target === null || target === void 0 ? void 0 : target.type)) {\n // If input type doesn't support `setSelectionRange`. Simulate it. 
https://developer.mozilla.org/en-US/docs/Web/API/HTMLInputElement/setSelectionRange\n selectedText = fakeCopyAction(target.value, options);\n } else {\n selectedText = select_default()(target);\n command('copy');\n }\n\n return selectedText;\n};\n\n/* harmony default export */ var actions_copy = (ClipboardActionCopy);\n;// CONCATENATED MODULE: ./src/actions/default.js\nfunction _typeof(obj) { \"@babel/helpers - typeof\"; if (typeof Symbol === \"function\" && typeof Symbol.iterator === \"symbol\") { _typeof = function _typeof(obj) { return typeof obj; }; } else { _typeof = function _typeof(obj) { return obj && typeof Symbol === \"function\" && obj.constructor === Symbol && obj !== Symbol.prototype ? \"symbol\" : typeof obj; }; } return _typeof(obj); }\n\n\n\n/**\n * Inner function which performs selection from either `text` or `target`\n * properties and then executes copy or cut operations.\n * @param {Object} options\n */\n\nvar ClipboardActionDefault = function ClipboardActionDefault() {\n var options = arguments.length > 0 && arguments[0] !== undefined ? arguments[0] : {};\n // Defines base properties passed from constructor.\n var _options$action = options.action,\n action = _options$action === void 0 ? 'copy' : _options$action,\n container = options.container,\n target = options.target,\n text = options.text; // Sets the `action` to be performed which can be either 'copy' or 'cut'.\n\n if (action !== 'copy' && action !== 'cut') {\n throw new Error('Invalid \"action\" value, use either \"copy\" or \"cut\"');\n } // Sets the `target` property using an element that will be have its content copied.\n\n\n if (target !== undefined) {\n if (target && _typeof(target) === 'object' && target.nodeType === 1) {\n if (action === 'copy' && target.hasAttribute('disabled')) {\n throw new Error('Invalid \"target\" attribute. 
Please use \"readonly\" instead of \"disabled\" attribute');\n }\n\n if (action === 'cut' && (target.hasAttribute('readonly') || target.hasAttribute('disabled'))) {\n throw new Error('Invalid \"target\" attribute. You can\\'t cut text from elements with \"readonly\" or \"disabled\" attributes');\n }\n } else {\n throw new Error('Invalid \"target\" value, use a valid Element');\n }\n } // Define selection strategy based on `text` property.\n\n\n if (text) {\n return actions_copy(text, {\n container: container\n });\n } // Defines which selection strategy based on `target` property.\n\n\n if (target) {\n return action === 'cut' ? actions_cut(target) : actions_copy(target, {\n container: container\n });\n }\n};\n\n/* harmony default export */ var actions_default = (ClipboardActionDefault);\n;// CONCATENATED MODULE: ./src/clipboard.js\nfunction clipboard_typeof(obj) { \"@babel/helpers - typeof\"; if (typeof Symbol === \"function\" && typeof Symbol.iterator === \"symbol\") { clipboard_typeof = function _typeof(obj) { return typeof obj; }; } else { clipboard_typeof = function _typeof(obj) { return obj && typeof Symbol === \"function\" && obj.constructor === Symbol && obj !== Symbol.prototype ? 
\"symbol\" : typeof obj; }; } return clipboard_typeof(obj); }\n\nfunction _classCallCheck(instance, Constructor) { if (!(instance instanceof Constructor)) { throw new TypeError(\"Cannot call a class as a function\"); } }\n\nfunction _defineProperties(target, props) { for (var i = 0; i < props.length; i++) { var descriptor = props[i]; descriptor.enumerable = descriptor.enumerable || false; descriptor.configurable = true; if (\"value\" in descriptor) descriptor.writable = true; Object.defineProperty(target, descriptor.key, descriptor); } }\n\nfunction _createClass(Constructor, protoProps, staticProps) { if (protoProps) _defineProperties(Constructor.prototype, protoProps); if (staticProps) _defineProperties(Constructor, staticProps); return Constructor; }\n\nfunction _inherits(subClass, superClass) { if (typeof superClass !== \"function\" && superClass !== null) { throw new TypeError(\"Super expression must either be null or a function\"); } subClass.prototype = Object.create(superClass && superClass.prototype, { constructor: { value: subClass, writable: true, configurable: true } }); if (superClass) _setPrototypeOf(subClass, superClass); }\n\nfunction _setPrototypeOf(o, p) { _setPrototypeOf = Object.setPrototypeOf || function _setPrototypeOf(o, p) { o.__proto__ = p; return o; }; return _setPrototypeOf(o, p); }\n\nfunction _createSuper(Derived) { var hasNativeReflectConstruct = _isNativeReflectConstruct(); return function _createSuperInternal() { var Super = _getPrototypeOf(Derived), result; if (hasNativeReflectConstruct) { var NewTarget = _getPrototypeOf(this).constructor; result = Reflect.construct(Super, arguments, NewTarget); } else { result = Super.apply(this, arguments); } return _possibleConstructorReturn(this, result); }; }\n\nfunction _possibleConstructorReturn(self, call) { if (call && (clipboard_typeof(call) === \"object\" || typeof call === \"function\")) { return call; } return _assertThisInitialized(self); }\n\nfunction _assertThisInitialized(self) { if 
(self === void 0) { throw new ReferenceError(\"this hasn't been initialised - super() hasn't been called\"); } return self; }\n\nfunction _isNativeReflectConstruct() { if (typeof Reflect === \"undefined\" || !Reflect.construct) return false; if (Reflect.construct.sham) return false; if (typeof Proxy === \"function\") return true; try { Date.prototype.toString.call(Reflect.construct(Date, [], function () {})); return true; } catch (e) { return false; } }\n\nfunction _getPrototypeOf(o) { _getPrototypeOf = Object.setPrototypeOf ? Object.getPrototypeOf : function _getPrototypeOf(o) { return o.__proto__ || Object.getPrototypeOf(o); }; return _getPrototypeOf(o); }\n\n\n\n\n\n\n/**\n * Helper function to retrieve attribute value.\n * @param {String} suffix\n * @param {Element} element\n */\n\nfunction getAttributeValue(suffix, element) {\n var attribute = \"data-clipboard-\".concat(suffix);\n\n if (!element.hasAttribute(attribute)) {\n return;\n }\n\n return element.getAttribute(attribute);\n}\n/**\n * Base class which takes one or more elements, adds event listeners to them,\n * and instantiates a new `ClipboardAction` on each click.\n */\n\n\nvar Clipboard = /*#__PURE__*/function (_Emitter) {\n _inherits(Clipboard, _Emitter);\n\n var _super = _createSuper(Clipboard);\n\n /**\n * @param {String|HTMLElement|HTMLCollection|NodeList} trigger\n * @param {Object} options\n */\n function Clipboard(trigger, options) {\n var _this;\n\n _classCallCheck(this, Clipboard);\n\n _this = _super.call(this);\n\n _this.resolveOptions(options);\n\n _this.listenClick(trigger);\n\n return _this;\n }\n /**\n * Defines if attributes would be resolved using internal setter functions\n * or custom functions that were passed in the constructor.\n * @param {Object} options\n */\n\n\n _createClass(Clipboard, [{\n key: \"resolveOptions\",\n value: function resolveOptions() {\n var options = arguments.length > 0 && arguments[0] !== undefined ? 
arguments[0] : {};\n this.action = typeof options.action === 'function' ? options.action : this.defaultAction;\n this.target = typeof options.target === 'function' ? options.target : this.defaultTarget;\n this.text = typeof options.text === 'function' ? options.text : this.defaultText;\n this.container = clipboard_typeof(options.container) === 'object' ? options.container : document.body;\n }\n /**\n * Adds a click event listener to the passed trigger.\n * @param {String|HTMLElement|HTMLCollection|NodeList} trigger\n */\n\n }, {\n key: \"listenClick\",\n value: function listenClick(trigger) {\n var _this2 = this;\n\n this.listener = listen_default()(trigger, 'click', function (e) {\n return _this2.onClick(e);\n });\n }\n /**\n * Defines a new `ClipboardAction` on each click event.\n * @param {Event} e\n */\n\n }, {\n key: \"onClick\",\n value: function onClick(e) {\n var trigger = e.delegateTarget || e.currentTarget;\n var action = this.action(trigger) || 'copy';\n var text = actions_default({\n action: action,\n container: this.container,\n target: this.target(trigger),\n text: this.text(trigger)\n }); // Fires an event based on the copy operation result.\n\n this.emit(text ? 
'success' : 'error', {\n action: action,\n text: text,\n trigger: trigger,\n clearSelection: function clearSelection() {\n if (trigger) {\n trigger.focus();\n }\n\n window.getSelection().removeAllRanges();\n }\n });\n }\n /**\n * Default `action` lookup function.\n * @param {Element} trigger\n */\n\n }, {\n key: \"defaultAction\",\n value: function defaultAction(trigger) {\n return getAttributeValue('action', trigger);\n }\n /**\n * Default `target` lookup function.\n * @param {Element} trigger\n */\n\n }, {\n key: \"defaultTarget\",\n value: function defaultTarget(trigger) {\n var selector = getAttributeValue('target', trigger);\n\n if (selector) {\n return document.querySelector(selector);\n }\n }\n /**\n * Allow fire programmatically a copy action\n * @param {String|HTMLElement} target\n * @param {Object} options\n * @returns Text copied.\n */\n\n }, {\n key: \"defaultText\",\n\n /**\n * Default `text` lookup function.\n * @param {Element} trigger\n */\n value: function defaultText(trigger) {\n return getAttributeValue('text', trigger);\n }\n /**\n * Destroy lifecycle.\n */\n\n }, {\n key: \"destroy\",\n value: function destroy() {\n this.listener.destroy();\n }\n }], [{\n key: \"copy\",\n value: function copy(target) {\n var options = arguments.length > 1 && arguments[1] !== undefined ? arguments[1] : {\n container: document.body\n };\n return actions_copy(target, options);\n }\n /**\n * Allow fire programmatically a cut action\n * @param {String|HTMLElement} target\n * @returns Text cutted.\n */\n\n }, {\n key: \"cut\",\n value: function cut(target) {\n return actions_cut(target);\n }\n /**\n * Returns the support of the given action, or all actions if no action is\n * given.\n * @param {String} [action]\n */\n\n }, {\n key: \"isSupported\",\n value: function isSupported() {\n var action = arguments.length > 0 && arguments[0] !== undefined ? arguments[0] : ['copy', 'cut'];\n var actions = typeof action === 'string' ? 
[action] : action;\n var support = !!document.queryCommandSupported;\n actions.forEach(function (action) {\n support = support && !!document.queryCommandSupported(action);\n });\n return support;\n }\n }]);\n\n return Clipboard;\n}((tiny_emitter_default()));\n\n/* harmony default export */ var clipboard = (Clipboard);\n\n/***/ }),\n\n/***/ 828:\n/***/ (function(module) {\n\nvar DOCUMENT_NODE_TYPE = 9;\n\n/**\n * A polyfill for Element.matches()\n */\nif (typeof Element !== 'undefined' && !Element.prototype.matches) {\n var proto = Element.prototype;\n\n proto.matches = proto.matchesSelector ||\n proto.mozMatchesSelector ||\n proto.msMatchesSelector ||\n proto.oMatchesSelector ||\n proto.webkitMatchesSelector;\n}\n\n/**\n * Finds the closest parent that matches a selector.\n *\n * @param {Element} element\n * @param {String} selector\n * @return {Function}\n */\nfunction closest (element, selector) {\n while (element && element.nodeType !== DOCUMENT_NODE_TYPE) {\n if (typeof element.matches === 'function' &&\n element.matches(selector)) {\n return element;\n }\n element = element.parentNode;\n }\n}\n\nmodule.exports = closest;\n\n\n/***/ }),\n\n/***/ 438:\n/***/ (function(module, __unused_webpack_exports, __webpack_require__) {\n\nvar closest = __webpack_require__(828);\n\n/**\n * Delegates event to a selector.\n *\n * @param {Element} element\n * @param {String} selector\n * @param {String} type\n * @param {Function} callback\n * @param {Boolean} useCapture\n * @return {Object}\n */\nfunction _delegate(element, selector, type, callback, useCapture) {\n var listenerFn = listener.apply(this, arguments);\n\n element.addEventListener(type, listenerFn, useCapture);\n\n return {\n destroy: function() {\n element.removeEventListener(type, listenerFn, useCapture);\n }\n }\n}\n\n/**\n * Delegates event to a selector.\n *\n * @param {Element|String|Array} [elements]\n * @param {String} selector\n * @param {String} type\n * @param {Function} callback\n * @param {Boolean} 
useCapture\n * @return {Object}\n */\nfunction delegate(elements, selector, type, callback, useCapture) {\n // Handle the regular Element usage\n if (typeof elements.addEventListener === 'function') {\n return _delegate.apply(null, arguments);\n }\n\n // Handle Element-less usage, it defaults to global delegation\n if (typeof type === 'function') {\n // Use `document` as the first parameter, then apply arguments\n // This is a short way to .unshift `arguments` without running into deoptimizations\n return _delegate.bind(null, document).apply(null, arguments);\n }\n\n // Handle Selector-based usage\n if (typeof elements === 'string') {\n elements = document.querySelectorAll(elements);\n }\n\n // Handle Array-like based usage\n return Array.prototype.map.call(elements, function (element) {\n return _delegate(element, selector, type, callback, useCapture);\n });\n}\n\n/**\n * Finds closest match and invokes callback.\n *\n * @param {Element} element\n * @param {String} selector\n * @param {String} type\n * @param {Function} callback\n * @return {Function}\n */\nfunction listener(element, selector, type, callback) {\n return function(e) {\n e.delegateTarget = closest(e.target, selector);\n\n if (e.delegateTarget) {\n callback.call(element, e);\n }\n }\n}\n\nmodule.exports = delegate;\n\n\n/***/ }),\n\n/***/ 879:\n/***/ (function(__unused_webpack_module, exports) {\n\n/**\n * Check if argument is a HTML element.\n *\n * @param {Object} value\n * @return {Boolean}\n */\nexports.node = function(value) {\n return value !== undefined\n && value instanceof HTMLElement\n && value.nodeType === 1;\n};\n\n/**\n * Check if argument is a list of HTML elements.\n *\n * @param {Object} value\n * @return {Boolean}\n */\nexports.nodeList = function(value) {\n var type = Object.prototype.toString.call(value);\n\n return value !== undefined\n && (type === '[object NodeList]' || type === '[object HTMLCollection]')\n && ('length' in value)\n && (value.length === 0 || 
exports.node(value[0]));\n};\n\n/**\n * Check if argument is a string.\n *\n * @param {Object} value\n * @return {Boolean}\n */\nexports.string = function(value) {\n return typeof value === 'string'\n || value instanceof String;\n};\n\n/**\n * Check if argument is a function.\n *\n * @param {Object} value\n * @return {Boolean}\n */\nexports.fn = function(value) {\n var type = Object.prototype.toString.call(value);\n\n return type === '[object Function]';\n};\n\n\n/***/ }),\n\n/***/ 370:\n/***/ (function(module, __unused_webpack_exports, __webpack_require__) {\n\nvar is = __webpack_require__(879);\nvar delegate = __webpack_require__(438);\n\n/**\n * Validates all params and calls the right\n * listener function based on its target type.\n *\n * @param {String|HTMLElement|HTMLCollection|NodeList} target\n * @param {String} type\n * @param {Function} callback\n * @return {Object}\n */\nfunction listen(target, type, callback) {\n if (!target && !type && !callback) {\n throw new Error('Missing required arguments');\n }\n\n if (!is.string(type)) {\n throw new TypeError('Second argument must be a String');\n }\n\n if (!is.fn(callback)) {\n throw new TypeError('Third argument must be a Function');\n }\n\n if (is.node(target)) {\n return listenNode(target, type, callback);\n }\n else if (is.nodeList(target)) {\n return listenNodeList(target, type, callback);\n }\n else if (is.string(target)) {\n return listenSelector(target, type, callback);\n }\n else {\n throw new TypeError('First argument must be a String, HTMLElement, HTMLCollection, or NodeList');\n }\n}\n\n/**\n * Adds an event listener to a HTML element\n * and returns a remove listener function.\n *\n * @param {HTMLElement} node\n * @param {String} type\n * @param {Function} callback\n * @return {Object}\n */\nfunction listenNode(node, type, callback) {\n node.addEventListener(type, callback);\n\n return {\n destroy: function() {\n node.removeEventListener(type, callback);\n }\n }\n}\n\n/**\n * Add an event listener 
to a list of HTML elements\n * and returns a remove listener function.\n *\n * @param {NodeList|HTMLCollection} nodeList\n * @param {String} type\n * @param {Function} callback\n * @return {Object}\n */\nfunction listenNodeList(nodeList, type, callback) {\n Array.prototype.forEach.call(nodeList, function(node) {\n node.addEventListener(type, callback);\n });\n\n return {\n destroy: function() {\n Array.prototype.forEach.call(nodeList, function(node) {\n node.removeEventListener(type, callback);\n });\n }\n }\n}\n\n/**\n * Add an event listener to a selector\n * and returns a remove listener function.\n *\n * @param {String} selector\n * @param {String} type\n * @param {Function} callback\n * @return {Object}\n */\nfunction listenSelector(selector, type, callback) {\n return delegate(document.body, selector, type, callback);\n}\n\nmodule.exports = listen;\n\n\n/***/ }),\n\n/***/ 817:\n/***/ (function(module) {\n\nfunction select(element) {\n var selectedText;\n\n if (element.nodeName === 'SELECT') {\n element.focus();\n\n selectedText = element.value;\n }\n else if (element.nodeName === 'INPUT' || element.nodeName === 'TEXTAREA') {\n var isReadOnly = element.hasAttribute('readonly');\n\n if (!isReadOnly) {\n element.setAttribute('readonly', '');\n }\n\n element.select();\n element.setSelectionRange(0, element.value.length);\n\n if (!isReadOnly) {\n element.removeAttribute('readonly');\n }\n\n selectedText = element.value;\n }\n else {\n if (element.hasAttribute('contenteditable')) {\n element.focus();\n }\n\n var selection = window.getSelection();\n var range = document.createRange();\n\n range.selectNodeContents(element);\n selection.removeAllRanges();\n selection.addRange(range);\n\n selectedText = selection.toString();\n }\n\n return selectedText;\n}\n\nmodule.exports = select;\n\n\n/***/ }),\n\n/***/ 279:\n/***/ (function(module) {\n\nfunction E () {\n // Keep this empty so it's easier to inherit from\n // (via https://github.com/lipsmack from 
https://github.com/scottcorgan/tiny-emitter/issues/3)\n}\n\nE.prototype = {\n on: function (name, callback, ctx) {\n var e = this.e || (this.e = {});\n\n (e[name] || (e[name] = [])).push({\n fn: callback,\n ctx: ctx\n });\n\n return this;\n },\n\n once: function (name, callback, ctx) {\n var self = this;\n function listener () {\n self.off(name, listener);\n callback.apply(ctx, arguments);\n };\n\n listener._ = callback\n return this.on(name, listener, ctx);\n },\n\n emit: function (name) {\n var data = [].slice.call(arguments, 1);\n var evtArr = ((this.e || (this.e = {}))[name] || []).slice();\n var i = 0;\n var len = evtArr.length;\n\n for (i; i < len; i++) {\n evtArr[i].fn.apply(evtArr[i].ctx, data);\n }\n\n return this;\n },\n\n off: function (name, callback) {\n var e = this.e || (this.e = {});\n var evts = e[name];\n var liveEvents = [];\n\n if (evts && callback) {\n for (var i = 0, len = evts.length; i < len; i++) {\n if (evts[i].fn !== callback && evts[i].fn._ !== callback)\n liveEvents.push(evts[i]);\n }\n }\n\n // Remove event from queue to prevent memory leak\n // Suggested by https://github.com/lazd\n // Ref: https://github.com/scottcorgan/tiny-emitter/commit/c6ebfaa9bc973b33d110a84a307742b7cf94c953#commitcomment-5024910\n\n (liveEvents.length)\n ? 
e[name] = liveEvents\n : delete e[name];\n\n return this;\n }\n};\n\nmodule.exports = E;\nmodule.exports.TinyEmitter = E;\n\n\n/***/ })\n\n/******/ \t});\n/************************************************************************/\n/******/ \t// The module cache\n/******/ \tvar __webpack_module_cache__ = {};\n/******/ \t\n/******/ \t// The require function\n/******/ \tfunction __webpack_require__(moduleId) {\n/******/ \t\t// Check if module is in cache\n/******/ \t\tif(__webpack_module_cache__[moduleId]) {\n/******/ \t\t\treturn __webpack_module_cache__[moduleId].exports;\n/******/ \t\t}\n/******/ \t\t// Create a new module (and put it into the cache)\n/******/ \t\tvar module = __webpack_module_cache__[moduleId] = {\n/******/ \t\t\t// no module.id needed\n/******/ \t\t\t// no module.loaded needed\n/******/ \t\t\texports: {}\n/******/ \t\t};\n/******/ \t\n/******/ \t\t// Execute the module function\n/******/ \t\t__webpack_modules__[moduleId](module, module.exports, __webpack_require__);\n/******/ \t\n/******/ \t\t// Return the exports of the module\n/******/ \t\treturn module.exports;\n/******/ \t}\n/******/ \t\n/************************************************************************/\n/******/ \t/* webpack/runtime/compat get default export */\n/******/ \t!function() {\n/******/ \t\t// getDefaultExport function for compatibility with non-harmony modules\n/******/ \t\t__webpack_require__.n = function(module) {\n/******/ \t\t\tvar getter = module && module.__esModule ?\n/******/ \t\t\t\tfunction() { return module['default']; } :\n/******/ \t\t\t\tfunction() { return module; };\n/******/ \t\t\t__webpack_require__.d(getter, { a: getter });\n/******/ \t\t\treturn getter;\n/******/ \t\t};\n/******/ \t}();\n/******/ \t\n/******/ \t/* webpack/runtime/define property getters */\n/******/ \t!function() {\n/******/ \t\t// define getter functions for harmony exports\n/******/ \t\t__webpack_require__.d = function(exports, definition) {\n/******/ \t\t\tfor(var key in definition) 
{\n/******/ \t\t\t\tif(__webpack_require__.o(definition, key) && !__webpack_require__.o(exports, key)) {\n/******/ \t\t\t\t\tObject.defineProperty(exports, key, { enumerable: true, get: definition[key] });\n/******/ \t\t\t\t}\n/******/ \t\t\t}\n/******/ \t\t};\n/******/ \t}();\n/******/ \t\n/******/ \t/* webpack/runtime/hasOwnProperty shorthand */\n/******/ \t!function() {\n/******/ \t\t__webpack_require__.o = function(obj, prop) { return Object.prototype.hasOwnProperty.call(obj, prop); }\n/******/ \t}();\n/******/ \t\n/************************************************************************/\n/******/ \t// module exports must be returned from runtime so entry inlining is disabled\n/******/ \t// startup\n/******/ \t// Load entry module and return exports\n/******/ \treturn __webpack_require__(686);\n/******/ })()\n.default;\n});", "/*\n * Copyright (c) 2016-2024 Martin Donath \n *\n * Permission is hereby granted, free of charge, to any person obtaining a copy\n * of this software and associated documentation files (the \"Software\"), to\n * deal in the Software without restriction, including without limitation the\n * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or\n * sell copies of the Software, and to permit persons to whom the Software is\n * furnished to do so, subject to the following conditions:\n *\n * The above copyright notice and this permission notice shall be included in\n * all copies or substantial portions of the Software.\n *\n * THE SOFTWARE IS PROVIDED \"AS IS\", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR\n * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,\n * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. 
IN NO EVENT SHALL THE\n * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER\n * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING\n * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS\n * IN THE SOFTWARE.\n */\n\nimport \"focus-visible\"\n\nimport {\n EMPTY,\n NEVER,\n Observable,\n Subject,\n defer,\n delay,\n filter,\n map,\n merge,\n mergeWith,\n shareReplay,\n switchMap\n} from \"rxjs\"\n\nimport { configuration, feature } from \"./_\"\nimport {\n at,\n getActiveElement,\n getOptionalElement,\n requestJSON,\n setLocation,\n setToggle,\n watchDocument,\n watchKeyboard,\n watchLocation,\n watchLocationTarget,\n watchMedia,\n watchPrint,\n watchScript,\n watchViewport\n} from \"./browser\"\nimport {\n getComponentElement,\n getComponentElements,\n mountAnnounce,\n mountBackToTop,\n mountConsent,\n mountContent,\n mountDialog,\n mountHeader,\n mountHeaderTitle,\n mountPalette,\n mountProgress,\n mountSearch,\n mountSearchHiglight,\n mountSidebar,\n mountSource,\n mountTableOfContents,\n mountTabs,\n watchHeader,\n watchMain\n} from \"./components\"\nimport {\n SearchIndex,\n setupClipboardJS,\n setupInstantNavigation,\n setupVersionSelector\n} from \"./integrations\"\nimport {\n patchEllipsis,\n patchIndeterminate,\n patchScrollfix,\n patchScrolllock\n} from \"./patches\"\nimport \"./polyfills\"\n\n/* ----------------------------------------------------------------------------\n * Functions - @todo refactor\n * ------------------------------------------------------------------------- */\n\n/**\n * Fetch search index\n *\n * @returns Search index observable\n */\nfunction fetchSearchIndex(): Observable {\n if (location.protocol === \"file:\") {\n return watchScript(\n `${new URL(\"search/search_index.js\", config.base)}`\n )\n .pipe(\n // @ts-ignore - @todo fix typings\n map(() => __index),\n shareReplay(1)\n )\n } else {\n return requestJSON(\n new URL(\"search/search_index.json\", config.base)\n 
)\n }\n}\n\n/* ----------------------------------------------------------------------------\n * Application\n * ------------------------------------------------------------------------- */\n\n/* Yay, JavaScript is available */\ndocument.documentElement.classList.remove(\"no-js\")\ndocument.documentElement.classList.add(\"js\")\n\n/* Set up navigation observables and subjects */\nconst document$ = watchDocument()\nconst location$ = watchLocation()\nconst target$ = watchLocationTarget(location$)\nconst keyboard$ = watchKeyboard()\n\n/* Set up media observables */\nconst viewport$ = watchViewport()\nconst tablet$ = watchMedia(\"(min-width: 960px)\")\nconst screen$ = watchMedia(\"(min-width: 1220px)\")\nconst print$ = watchPrint()\n\n/* Retrieve search index, if search is enabled */\nconst config = configuration()\nconst index$ = document.forms.namedItem(\"search\")\n ? fetchSearchIndex()\n : NEVER\n\n/* Set up Clipboard.js integration */\nconst alert$ = new Subject()\nsetupClipboardJS({ alert$ })\n\n/* Set up progress indicator */\nconst progress$ = new Subject()\n\n/* Set up instant navigation, if enabled */\nif (feature(\"navigation.instant\"))\n setupInstantNavigation({ location$, viewport$, progress$ })\n .subscribe(document$)\n\n/* Set up version selector */\nif (config.version?.provider === \"mike\")\n setupVersionSelector({ document$ })\n\n/* Always close drawer and search on navigation */\nmerge(location$, target$)\n .pipe(\n delay(125)\n )\n .subscribe(() => {\n setToggle(\"drawer\", false)\n setToggle(\"search\", false)\n })\n\n/* Set up global keyboard handlers */\nkeyboard$\n .pipe(\n filter(({ mode }) => mode === \"global\")\n )\n .subscribe(key => {\n switch (key.type) {\n\n /* Go to previous page */\n case \"p\":\n case \",\":\n const prev = getOptionalElement(\"link[rel=prev]\")\n if (typeof prev !== \"undefined\")\n setLocation(prev)\n break\n\n /* Go to next page */\n case \"n\":\n case \".\":\n const next = getOptionalElement(\"link[rel=next]\")\n 
if (typeof next !== \"undefined\")\n setLocation(next)\n break\n\n /* Expand navigation, see https://bit.ly/3ZjG5io */\n case \"Enter\":\n const active = getActiveElement()\n if (active instanceof HTMLLabelElement)\n active.click()\n }\n })\n\n/* Set up patches */\npatchEllipsis({ viewport$, document$ })\npatchIndeterminate({ document$, tablet$ })\npatchScrollfix({ document$ })\npatchScrolllock({ viewport$, tablet$ })\n\n/* Set up header and main area observable */\nconst header$ = watchHeader(getComponentElement(\"header\"), { viewport$ })\nconst main$ = document$\n .pipe(\n map(() => getComponentElement(\"main\")),\n switchMap(el => watchMain(el, { viewport$, header$ })),\n shareReplay(1)\n )\n\n/* Set up control component observables */\nconst control$ = merge(\n\n /* Consent */\n ...getComponentElements(\"consent\")\n .map(el => mountConsent(el, { target$ })),\n\n /* Dialog */\n ...getComponentElements(\"dialog\")\n .map(el => mountDialog(el, { alert$ })),\n\n /* Color palette */\n ...getComponentElements(\"palette\")\n .map(el => mountPalette(el)),\n\n /* Progress bar */\n ...getComponentElements(\"progress\")\n .map(el => mountProgress(el, { progress$ })),\n\n /* Search */\n ...getComponentElements(\"search\")\n .map(el => mountSearch(el, { index$, keyboard$ })),\n\n /* Repository information */\n ...getComponentElements(\"source\")\n .map(el => mountSource(el))\n)\n\n/* Set up content component observables */\nconst content$ = defer(() => merge(\n\n /* Announcement bar */\n ...getComponentElements(\"announce\")\n .map(el => mountAnnounce(el)),\n\n /* Content */\n ...getComponentElements(\"content\")\n .map(el => mountContent(el, { viewport$, target$, print$ })),\n\n /* Search highlighting */\n ...getComponentElements(\"content\")\n .map(el => feature(\"search.highlight\")\n ? 
mountSearchHiglight(el, { index$, location$ })\n : EMPTY\n ),\n\n /* Header */\n ...getComponentElements(\"header\")\n .map(el => mountHeader(el, { viewport$, header$, main$ })),\n\n /* Header title */\n ...getComponentElements(\"header-title\")\n .map(el => mountHeaderTitle(el, { viewport$, header$ })),\n\n /* Sidebar */\n ...getComponentElements(\"sidebar\")\n .map(el => el.getAttribute(\"data-md-type\") === \"navigation\"\n ? at(screen$, () => mountSidebar(el, { viewport$, header$, main$ }))\n : at(tablet$, () => mountSidebar(el, { viewport$, header$, main$ }))\n ),\n\n /* Navigation tabs */\n ...getComponentElements(\"tabs\")\n .map(el => mountTabs(el, { viewport$, header$ })),\n\n /* Table of contents */\n ...getComponentElements(\"toc\")\n .map(el => mountTableOfContents(el, {\n viewport$, header$, main$, target$\n })),\n\n /* Back-to-top button */\n ...getComponentElements(\"top\")\n .map(el => mountBackToTop(el, { viewport$, header$, main$, target$ }))\n))\n\n/* Set up component observables */\nconst component$ = document$\n .pipe(\n switchMap(() => content$),\n mergeWith(control$),\n shareReplay(1)\n )\n\n/* Subscribe to all components */\ncomponent$.subscribe()\n\n/* ----------------------------------------------------------------------------\n * Exports\n * ------------------------------------------------------------------------- */\n\nwindow.document$ = document$ /* Document observable */\nwindow.location$ = location$ /* Location subject */\nwindow.target$ = target$ /* Location target observable */\nwindow.keyboard$ = keyboard$ /* Keyboard observable */\nwindow.viewport$ = viewport$ /* Viewport observable */\nwindow.tablet$ = tablet$ /* Media tablet observable */\nwindow.screen$ = screen$ /* Media screen observable */\nwindow.print$ = print$ /* Media print observable */\nwindow.alert$ = alert$ /* Alert subject */\nwindow.progress$ = progress$ /* Progress indicator subject */\nwindow.component$ = component$ /* Component observable */\n", 
"/******************************************************************************\nCopyright (c) Microsoft Corporation.\n\nPermission to use, copy, modify, and/or distribute this software for any\npurpose with or without fee is hereby granted.\n\nTHE SOFTWARE IS PROVIDED \"AS IS\" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH\nREGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY\nAND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT,\nINDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM\nLOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR\nOTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR\nPERFORMANCE OF THIS SOFTWARE.\n***************************************************************************** */\n/* global Reflect, Promise, SuppressedError, Symbol, Iterator */\n\nvar extendStatics = function(d, b) {\n extendStatics = Object.setPrototypeOf ||\n ({ __proto__: [] } instanceof Array && function (d, b) { d.__proto__ = b; }) ||\n function (d, b) { for (var p in b) if (Object.prototype.hasOwnProperty.call(b, p)) d[p] = b[p]; };\n return extendStatics(d, b);\n};\n\nexport function __extends(d, b) {\n if (typeof b !== \"function\" && b !== null)\n throw new TypeError(\"Class extends value \" + String(b) + \" is not a constructor or null\");\n extendStatics(d, b);\n function __() { this.constructor = d; }\n d.prototype = b === null ? 
Object.create(b) : (__.prototype = b.prototype, new __());\n}\n\nexport var __assign = function() {\n __assign = Object.assign || function __assign(t) {\n for (var s, i = 1, n = arguments.length; i < n; i++) {\n s = arguments[i];\n for (var p in s) if (Object.prototype.hasOwnProperty.call(s, p)) t[p] = s[p];\n }\n return t;\n }\n return __assign.apply(this, arguments);\n}\n\nexport function __rest(s, e) {\n var t = {};\n for (var p in s) if (Object.prototype.hasOwnProperty.call(s, p) && e.indexOf(p) < 0)\n t[p] = s[p];\n if (s != null && typeof Object.getOwnPropertySymbols === \"function\")\n for (var i = 0, p = Object.getOwnPropertySymbols(s); i < p.length; i++) {\n if (e.indexOf(p[i]) < 0 && Object.prototype.propertyIsEnumerable.call(s, p[i]))\n t[p[i]] = s[p[i]];\n }\n return t;\n}\n\nexport function __decorate(decorators, target, key, desc) {\n var c = arguments.length, r = c < 3 ? target : desc === null ? desc = Object.getOwnPropertyDescriptor(target, key) : desc, d;\n if (typeof Reflect === \"object\" && typeof Reflect.decorate === \"function\") r = Reflect.decorate(decorators, target, key, desc);\n else for (var i = decorators.length - 1; i >= 0; i--) if (d = decorators[i]) r = (c < 3 ? d(r) : c > 3 ? d(target, key, r) : d(target, key)) || r;\n return c > 3 && r && Object.defineProperty(target, key, r), r;\n}\n\nexport function __param(paramIndex, decorator) {\n return function (target, key) { decorator(target, key, paramIndex); }\n}\n\nexport function __esDecorate(ctor, descriptorIn, decorators, contextIn, initializers, extraInitializers) {\n function accept(f) { if (f !== void 0 && typeof f !== \"function\") throw new TypeError(\"Function expected\"); return f; }\n var kind = contextIn.kind, key = kind === \"getter\" ? \"get\" : kind === \"setter\" ? \"set\" : \"value\";\n var target = !descriptorIn && ctor ? contextIn[\"static\"] ? ctor : ctor.prototype : null;\n var descriptor = descriptorIn || (target ? 
Object.getOwnPropertyDescriptor(target, contextIn.name) : {});\n var _, done = false;\n for (var i = decorators.length - 1; i >= 0; i--) {\n var context = {};\n for (var p in contextIn) context[p] = p === \"access\" ? {} : contextIn[p];\n for (var p in contextIn.access) context.access[p] = contextIn.access[p];\n context.addInitializer = function (f) { if (done) throw new TypeError(\"Cannot add initializers after decoration has completed\"); extraInitializers.push(accept(f || null)); };\n var result = (0, decorators[i])(kind === \"accessor\" ? { get: descriptor.get, set: descriptor.set } : descriptor[key], context);\n if (kind === \"accessor\") {\n if (result === void 0) continue;\n if (result === null || typeof result !== \"object\") throw new TypeError(\"Object expected\");\n if (_ = accept(result.get)) descriptor.get = _;\n if (_ = accept(result.set)) descriptor.set = _;\n if (_ = accept(result.init)) initializers.unshift(_);\n }\n else if (_ = accept(result)) {\n if (kind === \"field\") initializers.unshift(_);\n else descriptor[key] = _;\n }\n }\n if (target) Object.defineProperty(target, contextIn.name, descriptor);\n done = true;\n};\n\nexport function __runInitializers(thisArg, initializers, value) {\n var useValue = arguments.length > 2;\n for (var i = 0; i < initializers.length; i++) {\n value = useValue ? initializers[i].call(thisArg, value) : initializers[i].call(thisArg);\n }\n return useValue ? value : void 0;\n};\n\nexport function __propKey(x) {\n return typeof x === \"symbol\" ? x : \"\".concat(x);\n};\n\nexport function __setFunctionName(f, name, prefix) {\n if (typeof name === \"symbol\") name = name.description ? \"[\".concat(name.description, \"]\") : \"\";\n return Object.defineProperty(f, \"name\", { configurable: true, value: prefix ? 
\"\".concat(prefix, \" \", name) : name });\n};\n\nexport function __metadata(metadataKey, metadataValue) {\n if (typeof Reflect === \"object\" && typeof Reflect.metadata === \"function\") return Reflect.metadata(metadataKey, metadataValue);\n}\n\nexport function __awaiter(thisArg, _arguments, P, generator) {\n function adopt(value) { return value instanceof P ? value : new P(function (resolve) { resolve(value); }); }\n return new (P || (P = Promise))(function (resolve, reject) {\n function fulfilled(value) { try { step(generator.next(value)); } catch (e) { reject(e); } }\n function rejected(value) { try { step(generator[\"throw\"](value)); } catch (e) { reject(e); } }\n function step(result) { result.done ? resolve(result.value) : adopt(result.value).then(fulfilled, rejected); }\n step((generator = generator.apply(thisArg, _arguments || [])).next());\n });\n}\n\nexport function __generator(thisArg, body) {\n var _ = { label: 0, sent: function() { if (t[0] & 1) throw t[1]; return t[1]; }, trys: [], ops: [] }, f, y, t, g = Object.create((typeof Iterator === \"function\" ? Iterator : Object).prototype);\n return g.next = verb(0), g[\"throw\"] = verb(1), g[\"return\"] = verb(2), typeof Symbol === \"function\" && (g[Symbol.iterator] = function() { return this; }), g;\n function verb(n) { return function (v) { return step([n, v]); }; }\n function step(op) {\n if (f) throw new TypeError(\"Generator is already executing.\");\n while (g && (g = 0, op[0] && (_ = 0)), _) try {\n if (f = 1, y && (t = op[0] & 2 ? y[\"return\"] : op[0] ? 
y[\"throw\"] || ((t = y[\"return\"]) && t.call(y), 0) : y.next) && !(t = t.call(y, op[1])).done) return t;\n if (y = 0, t) op = [op[0] & 2, t.value];\n switch (op[0]) {\n case 0: case 1: t = op; break;\n case 4: _.label++; return { value: op[1], done: false };\n case 5: _.label++; y = op[1]; op = [0]; continue;\n case 7: op = _.ops.pop(); _.trys.pop(); continue;\n default:\n if (!(t = _.trys, t = t.length > 0 && t[t.length - 1]) && (op[0] === 6 || op[0] === 2)) { _ = 0; continue; }\n if (op[0] === 3 && (!t || (op[1] > t[0] && op[1] < t[3]))) { _.label = op[1]; break; }\n if (op[0] === 6 && _.label < t[1]) { _.label = t[1]; t = op; break; }\n if (t && _.label < t[2]) { _.label = t[2]; _.ops.push(op); break; }\n if (t[2]) _.ops.pop();\n _.trys.pop(); continue;\n }\n op = body.call(thisArg, _);\n } catch (e) { op = [6, e]; y = 0; } finally { f = t = 0; }\n if (op[0] & 5) throw op[1]; return { value: op[0] ? op[1] : void 0, done: true };\n }\n}\n\nexport var __createBinding = Object.create ? (function(o, m, k, k2) {\n if (k2 === undefined) k2 = k;\n var desc = Object.getOwnPropertyDescriptor(m, k);\n if (!desc || (\"get\" in desc ? !m.__esModule : desc.writable || desc.configurable)) {\n desc = { enumerable: true, get: function() { return m[k]; } };\n }\n Object.defineProperty(o, k2, desc);\n}) : (function(o, m, k, k2) {\n if (k2 === undefined) k2 = k;\n o[k2] = m[k];\n});\n\nexport function __exportStar(m, o) {\n for (var p in m) if (p !== \"default\" && !Object.prototype.hasOwnProperty.call(o, p)) __createBinding(o, m, p);\n}\n\nexport function __values(o) {\n var s = typeof Symbol === \"function\" && Symbol.iterator, m = s && o[s], i = 0;\n if (m) return m.call(o);\n if (o && typeof o.length === \"number\") return {\n next: function () {\n if (o && i >= o.length) o = void 0;\n return { value: o && o[i++], done: !o };\n }\n };\n throw new TypeError(s ? 
\"Object is not iterable.\" : \"Symbol.iterator is not defined.\");\n}\n\nexport function __read(o, n) {\n var m = typeof Symbol === \"function\" && o[Symbol.iterator];\n if (!m) return o;\n var i = m.call(o), r, ar = [], e;\n try {\n while ((n === void 0 || n-- > 0) && !(r = i.next()).done) ar.push(r.value);\n }\n catch (error) { e = { error: error }; }\n finally {\n try {\n if (r && !r.done && (m = i[\"return\"])) m.call(i);\n }\n finally { if (e) throw e.error; }\n }\n return ar;\n}\n\n/** @deprecated */\nexport function __spread() {\n for (var ar = [], i = 0; i < arguments.length; i++)\n ar = ar.concat(__read(arguments[i]));\n return ar;\n}\n\n/** @deprecated */\nexport function __spreadArrays() {\n for (var s = 0, i = 0, il = arguments.length; i < il; i++) s += arguments[i].length;\n for (var r = Array(s), k = 0, i = 0; i < il; i++)\n for (var a = arguments[i], j = 0, jl = a.length; j < jl; j++, k++)\n r[k] = a[j];\n return r;\n}\n\nexport function __spreadArray(to, from, pack) {\n if (pack || arguments.length === 2) for (var i = 0, l = from.length, ar; i < l; i++) {\n if (ar || !(i in from)) {\n if (!ar) ar = Array.prototype.slice.call(from, 0, i);\n ar[i] = from[i];\n }\n }\n return to.concat(ar || Array.prototype.slice.call(from));\n}\n\nexport function __await(v) {\n return this instanceof __await ? (this.v = v, this) : new __await(v);\n}\n\nexport function __asyncGenerator(thisArg, _arguments, generator) {\n if (!Symbol.asyncIterator) throw new TypeError(\"Symbol.asyncIterator is not defined.\");\n var g = generator.apply(thisArg, _arguments || []), i, q = [];\n return i = Object.create((typeof AsyncIterator === \"function\" ? 
AsyncIterator : Object).prototype), verb(\"next\"), verb(\"throw\"), verb(\"return\", awaitReturn), i[Symbol.asyncIterator] = function () { return this; }, i;\n function awaitReturn(f) { return function (v) { return Promise.resolve(v).then(f, reject); }; }\n function verb(n, f) { if (g[n]) { i[n] = function (v) { return new Promise(function (a, b) { q.push([n, v, a, b]) > 1 || resume(n, v); }); }; if (f) i[n] = f(i[n]); } }\n function resume(n, v) { try { step(g[n](v)); } catch (e) { settle(q[0][3], e); } }\n function step(r) { r.value instanceof __await ? Promise.resolve(r.value.v).then(fulfill, reject) : settle(q[0][2], r); }\n function fulfill(value) { resume(\"next\", value); }\n function reject(value) { resume(\"throw\", value); }\n function settle(f, v) { if (f(v), q.shift(), q.length) resume(q[0][0], q[0][1]); }\n}\n\nexport function __asyncDelegator(o) {\n var i, p;\n return i = {}, verb(\"next\"), verb(\"throw\", function (e) { throw e; }), verb(\"return\"), i[Symbol.iterator] = function () { return this; }, i;\n function verb(n, f) { i[n] = o[n] ? function (v) { return (p = !p) ? { value: __await(o[n](v)), done: false } : f ? f(v) : v; } : f; }\n}\n\nexport function __asyncValues(o) {\n if (!Symbol.asyncIterator) throw new TypeError(\"Symbol.asyncIterator is not defined.\");\n var m = o[Symbol.asyncIterator], i;\n return m ? m.call(o) : (o = typeof __values === \"function\" ? 
__values(o) : o[Symbol.iterator](), i = {}, verb(\"next\"), verb(\"throw\"), verb(\"return\"), i[Symbol.asyncIterator] = function () { return this; }, i);\n function verb(n) { i[n] = o[n] && function (v) { return new Promise(function (resolve, reject) { v = o[n](v), settle(resolve, reject, v.done, v.value); }); }; }\n function settle(resolve, reject, d, v) { Promise.resolve(v).then(function(v) { resolve({ value: v, done: d }); }, reject); }\n}\n\nexport function __makeTemplateObject(cooked, raw) {\n if (Object.defineProperty) { Object.defineProperty(cooked, \"raw\", { value: raw }); } else { cooked.raw = raw; }\n return cooked;\n};\n\nvar __setModuleDefault = Object.create ? (function(o, v) {\n Object.defineProperty(o, \"default\", { enumerable: true, value: v });\n}) : function(o, v) {\n o[\"default\"] = v;\n};\n\nexport function __importStar(mod) {\n if (mod && mod.__esModule) return mod;\n var result = {};\n if (mod != null) for (var k in mod) if (k !== \"default\" && Object.prototype.hasOwnProperty.call(mod, k)) __createBinding(result, mod, k);\n __setModuleDefault(result, mod);\n return result;\n}\n\nexport function __importDefault(mod) {\n return (mod && mod.__esModule) ? mod : { default: mod };\n}\n\nexport function __classPrivateFieldGet(receiver, state, kind, f) {\n if (kind === \"a\" && !f) throw new TypeError(\"Private accessor was defined without a getter\");\n if (typeof state === \"function\" ? receiver !== state || !f : !state.has(receiver)) throw new TypeError(\"Cannot read private member from an object whose class did not declare it\");\n return kind === \"m\" ? f : kind === \"a\" ? f.call(receiver) : f ? f.value : state.get(receiver);\n}\n\nexport function __classPrivateFieldSet(receiver, state, value, kind, f) {\n if (kind === \"m\") throw new TypeError(\"Private method is not writable\");\n if (kind === \"a\" && !f) throw new TypeError(\"Private accessor was defined without a setter\");\n if (typeof state === \"function\" ? 
receiver !== state || !f : !state.has(receiver)) throw new TypeError(\"Cannot write private member to an object whose class did not declare it\");\n return (kind === \"a\" ? f.call(receiver, value) : f ? f.value = value : state.set(receiver, value)), value;\n}\n\nexport function __classPrivateFieldIn(state, receiver) {\n if (receiver === null || (typeof receiver !== \"object\" && typeof receiver !== \"function\")) throw new TypeError(\"Cannot use 'in' operator on non-object\");\n return typeof state === \"function\" ? receiver === state : state.has(receiver);\n}\n\nexport function __addDisposableResource(env, value, async) {\n if (value !== null && value !== void 0) {\n if (typeof value !== \"object\" && typeof value !== \"function\") throw new TypeError(\"Object expected.\");\n var dispose, inner;\n if (async) {\n if (!Symbol.asyncDispose) throw new TypeError(\"Symbol.asyncDispose is not defined.\");\n dispose = value[Symbol.asyncDispose];\n }\n if (dispose === void 0) {\n if (!Symbol.dispose) throw new TypeError(\"Symbol.dispose is not defined.\");\n dispose = value[Symbol.dispose];\n if (async) inner = dispose;\n }\n if (typeof dispose !== \"function\") throw new TypeError(\"Object not disposable.\");\n if (inner) dispose = function() { try { inner.call(this); } catch (e) { return Promise.reject(e); } };\n env.stack.push({ value: value, dispose: dispose, async: async });\n }\n else if (async) {\n env.stack.push({ async: true });\n }\n return value;\n}\n\nvar _SuppressedError = typeof SuppressedError === \"function\" ? SuppressedError : function (error, suppressed, message) {\n var e = new Error(message);\n return e.name = \"SuppressedError\", e.error = error, e.suppressed = suppressed, e;\n};\n\nexport function __disposeResources(env) {\n function fail(e) {\n env.error = env.hasError ? 
new _SuppressedError(e, env.error, \"An error was suppressed during disposal.\") : e;\n env.hasError = true;\n }\n var r, s = 0;\n function next() {\n while (r = env.stack.pop()) {\n try {\n if (!r.async && s === 1) return s = 0, env.stack.push(r), Promise.resolve().then(next);\n if (r.dispose) {\n var result = r.dispose.call(r.value);\n if (r.async) return s |= 2, Promise.resolve(result).then(next, function(e) { fail(e); return next(); });\n }\n else s |= 1;\n }\n catch (e) {\n fail(e);\n }\n }\n if (s === 1) return env.hasError ? Promise.reject(env.error) : Promise.resolve();\n if (env.hasError) throw env.error;\n }\n return next();\n}\n\nexport default {\n __extends,\n __assign,\n __rest,\n __decorate,\n __param,\n __metadata,\n __awaiter,\n __generator,\n __createBinding,\n __exportStar,\n __values,\n __read,\n __spread,\n __spreadArrays,\n __spreadArray,\n __await,\n __asyncGenerator,\n __asyncDelegator,\n __asyncValues,\n __makeTemplateObject,\n __importStar,\n __importDefault,\n __classPrivateFieldGet,\n __classPrivateFieldSet,\n __classPrivateFieldIn,\n __addDisposableResource,\n __disposeResources,\n};\n", "/**\n * Returns true if the object is a function.\n * @param value The value to check\n */\nexport function isFunction(value: any): value is (...args: any[]) => any {\n return typeof value === 'function';\n}\n", "/**\n * Used to create Error subclasses until the community moves away from ES5.\n *\n * This is because compiling from TypeScript down to ES5 has issues with subclassing Errors\n * as well as other built-in types: https://github.com/Microsoft/TypeScript/issues/12123\n *\n * @param createImpl A factory function to create the actual constructor implementation. 
The returned\n * function should be a named function that calls `_super` internally.\n */\nexport function createErrorClass(createImpl: (_super: any) => any): T {\n const _super = (instance: any) => {\n Error.call(instance);\n instance.stack = new Error().stack;\n };\n\n const ctorFunc = createImpl(_super);\n ctorFunc.prototype = Object.create(Error.prototype);\n ctorFunc.prototype.constructor = ctorFunc;\n return ctorFunc;\n}\n", "import { createErrorClass } from './createErrorClass';\n\nexport interface UnsubscriptionError extends Error {\n readonly errors: any[];\n}\n\nexport interface UnsubscriptionErrorCtor {\n /**\n * @deprecated Internal implementation detail. Do not construct error instances.\n * Cannot be tagged as internal: https://github.com/ReactiveX/rxjs/issues/6269\n */\n new (errors: any[]): UnsubscriptionError;\n}\n\n/**\n * An error thrown when one or more errors have occurred during the\n * `unsubscribe` of a {@link Subscription}.\n */\nexport const UnsubscriptionError: UnsubscriptionErrorCtor = createErrorClass(\n (_super) =>\n function UnsubscriptionErrorImpl(this: any, errors: (Error | string)[]) {\n _super(this);\n this.message = errors\n ? 
`${errors.length} errors occurred during unsubscription:\n${errors.map((err, i) => `${i + 1}) ${err.toString()}`).join('\\n ')}`\n : '';\n this.name = 'UnsubscriptionError';\n this.errors = errors;\n }\n);\n", "/**\n * Removes an item from an array, mutating it.\n * @param arr The array to remove the item from\n * @param item The item to remove\n */\nexport function arrRemove(arr: T[] | undefined | null, item: T) {\n if (arr) {\n const index = arr.indexOf(item);\n 0 <= index && arr.splice(index, 1);\n }\n}\n", "import { isFunction } from './util/isFunction';\nimport { UnsubscriptionError } from './util/UnsubscriptionError';\nimport { SubscriptionLike, TeardownLogic, Unsubscribable } from './types';\nimport { arrRemove } from './util/arrRemove';\n\n/**\n * Represents a disposable resource, such as the execution of an Observable. A\n * Subscription has one important method, `unsubscribe`, that takes no argument\n * and just disposes the resource held by the subscription.\n *\n * Additionally, subscriptions may be grouped together through the `add()`\n * method, which will attach a child Subscription to the current Subscription.\n * When a Subscription is unsubscribed, all its children (and its grandchildren)\n * will be unsubscribed as well.\n *\n * @class Subscription\n */\nexport class Subscription implements SubscriptionLike {\n /** @nocollapse */\n public static EMPTY = (() => {\n const empty = new Subscription();\n empty.closed = true;\n return empty;\n })();\n\n /**\n * A flag to indicate whether this Subscription has already been unsubscribed.\n */\n public closed = false;\n\n private _parentage: Subscription[] | Subscription | null = null;\n\n /**\n * The list of registered finalizers to execute upon unsubscription. 
Adding and removing from this\n * list occurs in the {@link #add} and {@link #remove} methods.\n */\n private _finalizers: Exclude[] | null = null;\n\n /**\n * @param initialTeardown A function executed first as part of the finalization\n * process that is kicked off when {@link #unsubscribe} is called.\n */\n constructor(private initialTeardown?: () => void) {}\n\n /**\n * Disposes the resources held by the subscription. May, for instance, cancel\n * an ongoing Observable execution or cancel any other type of work that\n * started when the Subscription was created.\n * @return {void}\n */\n unsubscribe(): void {\n let errors: any[] | undefined;\n\n if (!this.closed) {\n this.closed = true;\n\n // Remove this from it's parents.\n const { _parentage } = this;\n if (_parentage) {\n this._parentage = null;\n if (Array.isArray(_parentage)) {\n for (const parent of _parentage) {\n parent.remove(this);\n }\n } else {\n _parentage.remove(this);\n }\n }\n\n const { initialTeardown: initialFinalizer } = this;\n if (isFunction(initialFinalizer)) {\n try {\n initialFinalizer();\n } catch (e) {\n errors = e instanceof UnsubscriptionError ? e.errors : [e];\n }\n }\n\n const { _finalizers } = this;\n if (_finalizers) {\n this._finalizers = null;\n for (const finalizer of _finalizers) {\n try {\n execFinalizer(finalizer);\n } catch (err) {\n errors = errors ?? [];\n if (err instanceof UnsubscriptionError) {\n errors = [...errors, ...err.errors];\n } else {\n errors.push(err);\n }\n }\n }\n }\n\n if (errors) {\n throw new UnsubscriptionError(errors);\n }\n }\n }\n\n /**\n * Adds a finalizer to this subscription, so that finalization will be unsubscribed/called\n * when this subscription is unsubscribed. 
If this subscription is already {@link #closed},\n * because it has already been unsubscribed, then whatever finalizer is passed to it\n * will automatically be executed (unless the finalizer itself is also a closed subscription).\n *\n * Closed Subscriptions cannot be added as finalizers to any subscription. Adding a closed\n * subscription to a any subscription will result in no operation. (A noop).\n *\n * Adding a subscription to itself, or adding `null` or `undefined` will not perform any\n * operation at all. (A noop).\n *\n * `Subscription` instances that are added to this instance will automatically remove themselves\n * if they are unsubscribed. Functions and {@link Unsubscribable} objects that you wish to remove\n * will need to be removed manually with {@link #remove}\n *\n * @param teardown The finalization logic to add to this subscription.\n */\n add(teardown: TeardownLogic): void {\n // Only add the finalizer if it's not undefined\n // and don't add a subscription to itself.\n if (teardown && teardown !== this) {\n if (this.closed) {\n // If this subscription is already closed,\n // execute whatever finalizer is handed to it automatically.\n execFinalizer(teardown);\n } else {\n if (teardown instanceof Subscription) {\n // We don't add closed subscriptions, and we don't add the same subscription\n // twice. Subscription unsubscribe is idempotent.\n if (teardown.closed || teardown._hasParent(this)) {\n return;\n }\n teardown._addParent(this);\n }\n (this._finalizers = this._finalizers ?? 
[]).push(teardown);\n }\n }\n }\n\n /**\n * Checks to see if a this subscription already has a particular parent.\n * This will signal that this subscription has already been added to the parent in question.\n * @param parent the parent to check for\n */\n private _hasParent(parent: Subscription) {\n const { _parentage } = this;\n return _parentage === parent || (Array.isArray(_parentage) && _parentage.includes(parent));\n }\n\n /**\n * Adds a parent to this subscription so it can be removed from the parent if it\n * unsubscribes on it's own.\n *\n * NOTE: THIS ASSUMES THAT {@link _hasParent} HAS ALREADY BEEN CHECKED.\n * @param parent The parent subscription to add\n */\n private _addParent(parent: Subscription) {\n const { _parentage } = this;\n this._parentage = Array.isArray(_parentage) ? (_parentage.push(parent), _parentage) : _parentage ? [_parentage, parent] : parent;\n }\n\n /**\n * Called on a child when it is removed via {@link #remove}.\n * @param parent The parent to remove\n */\n private _removeParent(parent: Subscription) {\n const { _parentage } = this;\n if (_parentage === parent) {\n this._parentage = null;\n } else if (Array.isArray(_parentage)) {\n arrRemove(_parentage, parent);\n }\n }\n\n /**\n * Removes a finalizer from this subscription that was previously added with the {@link #add} method.\n *\n * Note that `Subscription` instances, when unsubscribed, will automatically remove themselves\n * from every other `Subscription` they have been added to. 
This means that using the `remove` method\n * is not a common thing and should be used thoughtfully.\n *\n * If you add the same finalizer instance of a function or an unsubscribable object to a `Subscription` instance\n * more than once, you will need to call `remove` the same number of times to remove all instances.\n *\n * All finalizer instances are removed to free up memory upon unsubscription.\n *\n * @param teardown The finalizer to remove from this subscription\n */\n remove(teardown: Exclude): void {\n const { _finalizers } = this;\n _finalizers && arrRemove(_finalizers, teardown);\n\n if (teardown instanceof Subscription) {\n teardown._removeParent(this);\n }\n }\n}\n\nexport const EMPTY_SUBSCRIPTION = Subscription.EMPTY;\n\nexport function isSubscription(value: any): value is Subscription {\n return (\n value instanceof Subscription ||\n (value && 'closed' in value && isFunction(value.remove) && isFunction(value.add) && isFunction(value.unsubscribe))\n );\n}\n\nfunction execFinalizer(finalizer: Unsubscribable | (() => void)) {\n if (isFunction(finalizer)) {\n finalizer();\n } else {\n finalizer.unsubscribe();\n }\n}\n", "import { Subscriber } from './Subscriber';\nimport { ObservableNotification } from './types';\n\n/**\n * The {@link GlobalConfig} object for RxJS. It is used to configure things\n * like how to react on unhandled errors.\n */\nexport const config: GlobalConfig = {\n onUnhandledError: null,\n onStoppedNotification: null,\n Promise: undefined,\n useDeprecatedSynchronousErrorHandling: false,\n useDeprecatedNextContext: false,\n};\n\n/**\n * The global configuration object for RxJS, used to configure things\n * like how to react on unhandled errors. Accessible via {@link config}\n * object.\n */\nexport interface GlobalConfig {\n /**\n * A registration point for unhandled errors from RxJS. These are errors that\n * cannot were not handled by consuming code in the usual subscription path. 
For\n * example, if you have this configured, and you subscribe to an observable without\n * providing an error handler, errors from that subscription will end up here. This\n * will _always_ be called asynchronously on another job in the runtime. This is because\n * we do not want errors thrown in this user-configured handler to interfere with the\n * behavior of the library.\n */\n onUnhandledError: ((err: any) => void) | null;\n\n /**\n * A registration point for notifications that cannot be sent to subscribers because they\n * have completed, errored or have been explicitly unsubscribed. By default, next, complete\n * and error notifications sent to stopped subscribers are noops. However, sometimes callers\n * might want a different behavior. For example, with sources that attempt to report errors\n * to stopped subscribers, a caller can configure RxJS to throw an unhandled error instead.\n * This will _always_ be called asynchronously on another job in the runtime. This is because\n * we do not want errors thrown in this user-configured handler to interfere with the\n * behavior of the library.\n */\n onStoppedNotification: ((notification: ObservableNotification, subscriber: Subscriber) => void) | null;\n\n /**\n * The promise constructor used by default for {@link Observable#toPromise toPromise} and {@link Observable#forEach forEach}\n * methods.\n *\n * @deprecated As of version 8, RxJS will no longer support this sort of injection of a\n * Promise constructor. If you need a Promise implementation other than native promises,\n * please polyfill/patch Promise as you see appropriate. Will be removed in v8.\n */\n Promise?: PromiseConstructorLike;\n\n /**\n * If true, turns on synchronous error rethrowing, which is a deprecated behavior\n * in v6 and higher. This behavior enables bad patterns like wrapping a subscribe\n * call in a try/catch block. 
It also enables producer interference, a nasty bug\n * where a multicast can be broken for all observers by a downstream consumer with\n * an unhandled error. DO NOT USE THIS FLAG UNLESS IT'S NEEDED TO BUY TIME\n * FOR MIGRATION REASONS.\n *\n * @deprecated As of version 8, RxJS will no longer support synchronous throwing\n * of unhandled errors. All errors will be thrown on a separate call stack to prevent bad\n * behaviors described above. Will be removed in v8.\n */\n useDeprecatedSynchronousErrorHandling: boolean;\n\n /**\n * If true, enables an as-of-yet undocumented feature from v5: The ability to access\n * `unsubscribe()` via `this` context in `next` functions created in observers passed\n * to `subscribe`.\n *\n * This is being removed because the performance was severely problematic, and it could also cause\n * issues when types other than POJOs are passed to subscribe as subscribers, as they will likely have\n * their `this` context overwritten.\n *\n * @deprecated As of version 8, RxJS will no longer support altering the\n * context of next functions provided as part of an observer to Subscribe. Instead,\n * you will have access to a subscription or a signal or token that will allow you to do things like\n * unsubscribe and test closed status. 
Will be removed in v8.\n */\n useDeprecatedNextContext: boolean;\n}\n", "import type { TimerHandle } from './timerHandle';\ntype SetTimeoutFunction = (handler: () => void, timeout?: number, ...args: any[]) => TimerHandle;\ntype ClearTimeoutFunction = (handle: TimerHandle) => void;\n\ninterface TimeoutProvider {\n setTimeout: SetTimeoutFunction;\n clearTimeout: ClearTimeoutFunction;\n delegate:\n | {\n setTimeout: SetTimeoutFunction;\n clearTimeout: ClearTimeoutFunction;\n }\n | undefined;\n}\n\nexport const timeoutProvider: TimeoutProvider = {\n // When accessing the delegate, use the variable rather than `this` so that\n // the functions can be called without being bound to the provider.\n setTimeout(handler: () => void, timeout?: number, ...args) {\n const { delegate } = timeoutProvider;\n if (delegate?.setTimeout) {\n return delegate.setTimeout(handler, timeout, ...args);\n }\n return setTimeout(handler, timeout, ...args);\n },\n clearTimeout(handle) {\n const { delegate } = timeoutProvider;\n return (delegate?.clearTimeout || clearTimeout)(handle as any);\n },\n delegate: undefined,\n};\n", "import { config } from '../config';\nimport { timeoutProvider } from '../scheduler/timeoutProvider';\n\n/**\n * Handles an error on another job either with the user-configured {@link onUnhandledError},\n * or by throwing it on that new job so it can be picked up by `window.onerror`, `process.on('error')`, etc.\n *\n * This should be called whenever there is an error that is out-of-band with the subscription\n * or when an error hits a terminal boundary of the subscription and no error handler was provided.\n *\n * @param err the error to report\n */\nexport function reportUnhandledError(err: any) {\n timeoutProvider.setTimeout(() => {\n const { onUnhandledError } = config;\n if (onUnhandledError) {\n // Execute the user-configured error handler.\n onUnhandledError(err);\n } else {\n // Throw so it is picked up by the runtime's uncaught error mechanism.\n throw err;\n }\n 
});\n}\n", "/* tslint:disable:no-empty */\nexport function noop() { }\n", "import { CompleteNotification, NextNotification, ErrorNotification } from './types';\n\n/**\n * A completion object optimized for memory use and created to be the\n * same \"shape\" as other notifications in v8.\n * @internal\n */\nexport const COMPLETE_NOTIFICATION = (() => createNotification('C', undefined, undefined) as CompleteNotification)();\n\n/**\n * Internal use only. Creates an optimized error notification that is the same \"shape\"\n * as other notifications.\n * @internal\n */\nexport function errorNotification(error: any): ErrorNotification {\n return createNotification('E', undefined, error) as any;\n}\n\n/**\n * Internal use only. Creates an optimized next notification that is the same \"shape\"\n * as other notifications.\n * @internal\n */\nexport function nextNotification(value: T) {\n return createNotification('N', value, undefined) as NextNotification;\n}\n\n/**\n * Ensures that all notifications created internally have the same \"shape\" in v8.\n *\n * TODO: This is only exported to support a crazy legacy test in `groupBy`.\n * @internal\n */\nexport function createNotification(kind: 'N' | 'E' | 'C', value: any, error: any) {\n return {\n kind,\n value,\n error,\n };\n}\n", "import { config } from '../config';\n\nlet context: { errorThrown: boolean; error: any } | null = null;\n\n/**\n * Handles dealing with errors for super-gross mode. Creates a context, in which\n * any synchronously thrown errors will be passed to {@link captureError}. 
Which\n * will record the error such that it will be rethrown after the call back is complete.\n * TODO: Remove in v8\n * @param cb An immediately executed function.\n */\nexport function errorContext(cb: () => void) {\n if (config.useDeprecatedSynchronousErrorHandling) {\n const isRoot = !context;\n if (isRoot) {\n context = { errorThrown: false, error: null };\n }\n cb();\n if (isRoot) {\n const { errorThrown, error } = context!;\n context = null;\n if (errorThrown) {\n throw error;\n }\n }\n } else {\n // This is the general non-deprecated path for everyone that\n // isn't crazy enough to use super-gross mode (useDeprecatedSynchronousErrorHandling)\n cb();\n }\n}\n\n/**\n * Captures errors only in super-gross mode.\n * @param err the error to capture\n */\nexport function captureError(err: any) {\n if (config.useDeprecatedSynchronousErrorHandling && context) {\n context.errorThrown = true;\n context.error = err;\n }\n}\n", "import { isFunction } from './util/isFunction';\nimport { Observer, ObservableNotification } from './types';\nimport { isSubscription, Subscription } from './Subscription';\nimport { config } from './config';\nimport { reportUnhandledError } from './util/reportUnhandledError';\nimport { noop } from './util/noop';\nimport { nextNotification, errorNotification, COMPLETE_NOTIFICATION } from './NotificationFactories';\nimport { timeoutProvider } from './scheduler/timeoutProvider';\nimport { captureError } from './util/errorContext';\n\n/**\n * Implements the {@link Observer} interface and extends the\n * {@link Subscription} class. While the {@link Observer} is the public API for\n * consuming the values of an {@link Observable}, all Observers get converted to\n * a Subscriber, in order to provide Subscription-like capabilities such as\n * `unsubscribe`. 
Subscriber is a common type in RxJS, and crucial for\n * implementing operators, but it is rarely used as a public API.\n *\n * @class Subscriber\n */\nexport class Subscriber extends Subscription implements Observer {\n /**\n * A static factory for a Subscriber, given a (potentially partial) definition\n * of an Observer.\n * @param next The `next` callback of an Observer.\n * @param error The `error` callback of an\n * Observer.\n * @param complete The `complete` callback of an\n * Observer.\n * @return A Subscriber wrapping the (partially defined)\n * Observer represented by the given arguments.\n * @nocollapse\n * @deprecated Do not use. Will be removed in v8. There is no replacement for this\n * method, and there is no reason to be creating instances of `Subscriber` directly.\n * If you have a specific use case, please file an issue.\n */\n static create(next?: (x?: T) => void, error?: (e?: any) => void, complete?: () => void): Subscriber {\n return new SafeSubscriber(next, error, complete);\n }\n\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. */\n protected isStopped: boolean = false;\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. */\n protected destination: Subscriber | Observer; // this `any` is the escape hatch to erase extra type param (e.g. R)\n\n /**\n * @deprecated Internal implementation detail, do not use directly. Will be made internal in v8.\n * There is no reason to directly create an instance of Subscriber. 
This type is exported for typings reasons.\n */\n constructor(destination?: Subscriber | Observer) {\n super();\n if (destination) {\n this.destination = destination;\n // Automatically chain subscriptions together here.\n // if destination is a Subscription, then it is a Subscriber.\n if (isSubscription(destination)) {\n destination.add(this);\n }\n } else {\n this.destination = EMPTY_OBSERVER;\n }\n }\n\n /**\n * The {@link Observer} callback to receive notifications of type `next` from\n * the Observable, with a value. The Observable may call this method 0 or more\n * times.\n * @param {T} [value] The `next` value.\n * @return {void}\n */\n next(value?: T): void {\n if (this.isStopped) {\n handleStoppedNotification(nextNotification(value), this);\n } else {\n this._next(value!);\n }\n }\n\n /**\n * The {@link Observer} callback to receive notifications of type `error` from\n * the Observable, with an attached `Error`. Notifies the Observer that\n * the Observable has experienced an error condition.\n * @param {any} [err] The `error` exception.\n * @return {void}\n */\n error(err?: any): void {\n if (this.isStopped) {\n handleStoppedNotification(errorNotification(err), this);\n } else {\n this.isStopped = true;\n this._error(err);\n }\n }\n\n /**\n * The {@link Observer} callback to receive a valueless notification of type\n * `complete` from the Observable. 
Notifies the Observer that the Observable\n * has finished sending push-based notifications.\n * @return {void}\n */\n complete(): void {\n if (this.isStopped) {\n handleStoppedNotification(COMPLETE_NOTIFICATION, this);\n } else {\n this.isStopped = true;\n this._complete();\n }\n }\n\n unsubscribe(): void {\n if (!this.closed) {\n this.isStopped = true;\n super.unsubscribe();\n this.destination = null!;\n }\n }\n\n protected _next(value: T): void {\n this.destination.next(value);\n }\n\n protected _error(err: any): void {\n try {\n this.destination.error(err);\n } finally {\n this.unsubscribe();\n }\n }\n\n protected _complete(): void {\n try {\n this.destination.complete();\n } finally {\n this.unsubscribe();\n }\n }\n}\n\n/**\n * This bind is captured here because we want to be able to have\n * compatibility with monoid libraries that tend to use a method named\n * `bind`. In particular, a library called Monio requires this.\n */\nconst _bind = Function.prototype.bind;\n\nfunction bind any>(fn: Fn, thisArg: any): Fn {\n return _bind.call(fn, thisArg);\n}\n\n/**\n * Internal optimization only, DO NOT EXPOSE.\n * @internal\n */\nclass ConsumerObserver implements Observer {\n constructor(private partialObserver: Partial>) {}\n\n next(value: T): void {\n const { partialObserver } = this;\n if (partialObserver.next) {\n try {\n partialObserver.next(value);\n } catch (error) {\n handleUnhandledError(error);\n }\n }\n }\n\n error(err: any): void {\n const { partialObserver } = this;\n if (partialObserver.error) {\n try {\n partialObserver.error(err);\n } catch (error) {\n handleUnhandledError(error);\n }\n } else {\n handleUnhandledError(err);\n }\n }\n\n complete(): void {\n const { partialObserver } = this;\n if (partialObserver.complete) {\n try {\n partialObserver.complete();\n } catch (error) {\n handleUnhandledError(error);\n }\n }\n }\n}\n\nexport class SafeSubscriber extends Subscriber {\n constructor(\n observerOrNext?: Partial> | ((value: T) => void) | 
null,\n error?: ((e?: any) => void) | null,\n complete?: (() => void) | null\n ) {\n super();\n\n let partialObserver: Partial>;\n if (isFunction(observerOrNext) || !observerOrNext) {\n // The first argument is a function, not an observer. The next\n // two arguments *could* be observers, or they could be empty.\n partialObserver = {\n next: (observerOrNext ?? undefined) as (((value: T) => void) | undefined),\n error: error ?? undefined,\n complete: complete ?? undefined,\n };\n } else {\n // The first argument is a partial observer.\n let context: any;\n if (this && config.useDeprecatedNextContext) {\n // This is a deprecated path that made `this.unsubscribe()` available in\n // next handler functions passed to subscribe. This only exists behind a flag\n // now, as it is *very* slow.\n context = Object.create(observerOrNext);\n context.unsubscribe = () => this.unsubscribe();\n partialObserver = {\n next: observerOrNext.next && bind(observerOrNext.next, context),\n error: observerOrNext.error && bind(observerOrNext.error, context),\n complete: observerOrNext.complete && bind(observerOrNext.complete, context),\n };\n } else {\n // The \"normal\" path. 
Just use the partial observer directly.\n partialObserver = observerOrNext;\n }\n }\n\n // Wrap the partial observer to ensure it's a full observer, and\n // make sure proper error handling is accounted for.\n this.destination = new ConsumerObserver(partialObserver);\n }\n}\n\nfunction handleUnhandledError(error: any) {\n if (config.useDeprecatedSynchronousErrorHandling) {\n captureError(error);\n } else {\n // Ideal path, we report this as an unhandled error,\n // which is thrown on a new call stack.\n reportUnhandledError(error);\n }\n}\n\n/**\n * An error handler used when no error handler was supplied\n * to the SafeSubscriber -- meaning no error handler was supplied\n * do the `subscribe` call on our observable.\n * @param err The error to handle\n */\nfunction defaultErrorHandler(err: any) {\n throw err;\n}\n\n/**\n * A handler for notifications that cannot be sent to a stopped subscriber.\n * @param notification The notification being sent\n * @param subscriber The stopped subscriber\n */\nfunction handleStoppedNotification(notification: ObservableNotification, subscriber: Subscriber) {\n const { onStoppedNotification } = config;\n onStoppedNotification && timeoutProvider.setTimeout(() => onStoppedNotification(notification, subscriber));\n}\n\n/**\n * The observer used as a stub for subscriptions where the user did not\n * pass any arguments to `subscribe`. Comes with the default error handling\n * behavior.\n */\nexport const EMPTY_OBSERVER: Readonly> & { closed: true } = {\n closed: true,\n next: noop,\n error: defaultErrorHandler,\n complete: noop,\n};\n", "/**\n * Symbol.observable or a string \"@@observable\". 
Used for interop\n *\n * @deprecated We will no longer be exporting this symbol in upcoming versions of RxJS.\n * Instead polyfill and use Symbol.observable directly *or* use https://www.npmjs.com/package/symbol-observable\n */\nexport const observable: string | symbol = (() => (typeof Symbol === 'function' && Symbol.observable) || '@@observable')();\n", "/**\n * This function takes one parameter and just returns it. Simply put,\n * this is like `(x: T): T => x`.\n *\n * ## Examples\n *\n * This is useful in some cases when using things like `mergeMap`\n *\n * ```ts\n * import { interval, take, map, range, mergeMap, identity } from 'rxjs';\n *\n * const source$ = interval(1000).pipe(take(5));\n *\n * const result$ = source$.pipe(\n * map(i => range(i)),\n * mergeMap(identity) // same as mergeMap(x => x)\n * );\n *\n * result$.subscribe({\n * next: console.log\n * });\n * ```\n *\n * Or when you want to selectively apply an operator\n *\n * ```ts\n * import { interval, take, identity } from 'rxjs';\n *\n * const shouldLimit = () => Math.random() < 0.5;\n *\n * const source$ = interval(1000);\n *\n * const result$ = source$.pipe(shouldLimit() ? 
take(5) : identity);\n *\n * result$.subscribe({\n * next: console.log\n * });\n * ```\n *\n * @param x Any value that is returned by this function\n * @returns The value passed as the first parameter to this function\n */\nexport function identity(x: T): T {\n return x;\n}\n", "import { identity } from './identity';\nimport { UnaryFunction } from '../types';\n\nexport function pipe(): typeof identity;\nexport function pipe(fn1: UnaryFunction): UnaryFunction;\nexport function pipe(fn1: UnaryFunction, fn2: UnaryFunction): UnaryFunction;\nexport function pipe(fn1: UnaryFunction, fn2: UnaryFunction, fn3: UnaryFunction): UnaryFunction;\nexport function pipe(\n fn1: UnaryFunction,\n fn2: UnaryFunction,\n fn3: UnaryFunction,\n fn4: UnaryFunction\n): UnaryFunction;\nexport function pipe(\n fn1: UnaryFunction,\n fn2: UnaryFunction,\n fn3: UnaryFunction,\n fn4: UnaryFunction,\n fn5: UnaryFunction\n): UnaryFunction;\nexport function pipe(\n fn1: UnaryFunction,\n fn2: UnaryFunction,\n fn3: UnaryFunction,\n fn4: UnaryFunction,\n fn5: UnaryFunction,\n fn6: UnaryFunction\n): UnaryFunction;\nexport function pipe(\n fn1: UnaryFunction,\n fn2: UnaryFunction,\n fn3: UnaryFunction,\n fn4: UnaryFunction,\n fn5: UnaryFunction,\n fn6: UnaryFunction,\n fn7: UnaryFunction\n): UnaryFunction;\nexport function pipe(\n fn1: UnaryFunction,\n fn2: UnaryFunction,\n fn3: UnaryFunction,\n fn4: UnaryFunction,\n fn5: UnaryFunction,\n fn6: UnaryFunction,\n fn7: UnaryFunction,\n fn8: UnaryFunction\n): UnaryFunction;\nexport function pipe(\n fn1: UnaryFunction,\n fn2: UnaryFunction,\n fn3: UnaryFunction,\n fn4: UnaryFunction,\n fn5: UnaryFunction,\n fn6: UnaryFunction,\n fn7: UnaryFunction,\n fn8: UnaryFunction,\n fn9: UnaryFunction\n): UnaryFunction;\nexport function pipe(\n fn1: UnaryFunction,\n fn2: UnaryFunction,\n fn3: UnaryFunction,\n fn4: UnaryFunction,\n fn5: UnaryFunction,\n fn6: UnaryFunction,\n fn7: UnaryFunction,\n fn8: UnaryFunction,\n fn9: UnaryFunction,\n ...fns: UnaryFunction[]\n): 
UnaryFunction;\n\n/**\n * pipe() can be called on one or more functions, each of which can take one argument (\"UnaryFunction\")\n * and uses it to return a value.\n * It returns a function that takes one argument, passes it to the first UnaryFunction, and then\n * passes the result to the next one, passes that result to the next one, and so on. \n */\nexport function pipe(...fns: Array>): UnaryFunction {\n return pipeFromArray(fns);\n}\n\n/** @internal */\nexport function pipeFromArray(fns: Array>): UnaryFunction {\n if (fns.length === 0) {\n return identity as UnaryFunction;\n }\n\n if (fns.length === 1) {\n return fns[0];\n }\n\n return function piped(input: T): R {\n return fns.reduce((prev: any, fn: UnaryFunction) => fn(prev), input as any);\n };\n}\n", "import { Operator } from './Operator';\nimport { SafeSubscriber, Subscriber } from './Subscriber';\nimport { isSubscription, Subscription } from './Subscription';\nimport { TeardownLogic, OperatorFunction, Subscribable, Observer } from './types';\nimport { observable as Symbol_observable } from './symbol/observable';\nimport { pipeFromArray } from './util/pipe';\nimport { config } from './config';\nimport { isFunction } from './util/isFunction';\nimport { errorContext } from './util/errorContext';\n\n/**\n * A representation of any set of values over any amount of time. This is the most basic building block\n * of RxJS.\n *\n * @class Observable\n */\nexport class Observable implements Subscribable {\n /**\n * @deprecated Internal implementation detail, do not use directly. Will be made internal in v8.\n */\n source: Observable | undefined;\n\n /**\n * @deprecated Internal implementation detail, do not use directly. Will be made internal in v8.\n */\n operator: Operator | undefined;\n\n /**\n * @constructor\n * @param {Function} subscribe the function that is called when the Observable is\n * initially subscribed to. 
This function is given a Subscriber, to which new values\n * can be `next`ed, or an `error` method can be called to raise an error, or\n * `complete` can be called to notify of a successful completion.\n */\n constructor(subscribe?: (this: Observable, subscriber: Subscriber) => TeardownLogic) {\n if (subscribe) {\n this._subscribe = subscribe;\n }\n }\n\n // HACK: Since TypeScript inherits static properties too, we have to\n // fight against TypeScript here so Subject can have a different static create signature\n /**\n * Creates a new Observable by calling the Observable constructor\n * @owner Observable\n * @method create\n * @param {Function} subscribe? the subscriber function to be passed to the Observable constructor\n * @return {Observable} a new observable\n * @nocollapse\n * @deprecated Use `new Observable()` instead. Will be removed in v8.\n */\n static create: (...args: any[]) => any = (subscribe?: (subscriber: Subscriber) => TeardownLogic) => {\n return new Observable(subscribe);\n };\n\n /**\n * Creates a new Observable, with this Observable instance as the source, and the passed\n * operator defined as the new observable's operator.\n * @method lift\n * @param operator the operator defining the operation to take on the observable\n * @return a new observable with the Operator applied\n * @deprecated Internal implementation detail, do not use directly. Will be made internal in v8.\n * If you have implemented an operator using `lift`, it is recommended that you create an\n * operator by simply returning `new Observable()` directly. 
See \"Creating new operators from\n * scratch\" section here: https://rxjs.dev/guide/operators\n */\n lift(operator?: Operator): Observable {\n const observable = new Observable();\n observable.source = this;\n observable.operator = operator;\n return observable;\n }\n\n subscribe(observerOrNext?: Partial> | ((value: T) => void)): Subscription;\n /** @deprecated Instead of passing separate callback arguments, use an observer argument. Signatures taking separate callback arguments will be removed in v8. Details: https://rxjs.dev/deprecations/subscribe-arguments */\n subscribe(next?: ((value: T) => void) | null, error?: ((error: any) => void) | null, complete?: (() => void) | null): Subscription;\n /**\n * Invokes an execution of an Observable and registers Observer handlers for notifications it will emit.\n *\n * Use it when you have all these Observables, but still nothing is happening.\n *\n * `subscribe` is not a regular operator, but a method that calls Observable's internal `subscribe` function. It\n * might be for example a function that you passed to Observable's constructor, but most of the time it is\n * a library implementation, which defines what will be emitted by an Observable, and when it be will emitted. This means\n * that calling `subscribe` is actually the moment when Observable starts its work, not when it is created, as it is often\n * the thought.\n *\n * Apart from starting the execution of an Observable, this method allows you to listen for values\n * that an Observable emits, as well as for when it completes or errors. You can achieve this in two\n * of the following ways.\n *\n * The first way is creating an object that implements {@link Observer} interface. It should have methods\n * defined by that interface, but note that it should be just a regular JavaScript object, which you can create\n * yourself in any way you want (ES6 class, classic function constructor, object literal etc.). 
In particular, do\n * not attempt to use any RxJS implementation details to create Observers - you don't need them. Remember also\n * that your object does not have to implement all methods. If you find yourself creating a method that doesn't\n * do anything, you can simply omit it. Note however, if the `error` method is not provided and an error happens,\n * it will be thrown asynchronously. Errors thrown asynchronously cannot be caught using `try`/`catch`. Instead,\n * use the {@link onUnhandledError} configuration option or use a runtime handler (like `window.onerror` or\n * `process.on('error)`) to be notified of unhandled errors. Because of this, it's recommended that you provide\n * an `error` method to avoid missing thrown errors.\n *\n * The second way is to give up on Observer object altogether and simply provide callback functions in place of its methods.\n * This means you can provide three functions as arguments to `subscribe`, where the first function is equivalent\n * of a `next` method, the second of an `error` method and the third of a `complete` method. Just as in case of an Observer,\n * if you do not need to listen for something, you can omit a function by passing `undefined` or `null`,\n * since `subscribe` recognizes these functions by where they were placed in function call. When it comes\n * to the `error` function, as with an Observer, if not provided, errors emitted by an Observable will be thrown asynchronously.\n *\n * You can, however, subscribe with no parameters at all. This may be the case where you're not interested in terminal events\n * and you also handled emissions internally by using operators (e.g. using `tap`).\n *\n * Whichever style of calling `subscribe` you use, in both cases it returns a Subscription object.\n * This object allows you to call `unsubscribe` on it, which in turn will stop the work that an Observable does and will clean\n * up all resources that an Observable used. 
Note that cancelling a subscription will not call `complete` callback\n * provided to `subscribe` function, which is reserved for a regular completion signal that comes from an Observable.\n *\n * Remember that callbacks provided to `subscribe` are not guaranteed to be called asynchronously.\n * It is an Observable itself that decides when these functions will be called. For example {@link of}\n * by default emits all its values synchronously. Always check documentation for how given Observable\n * will behave when subscribed and if its default behavior can be modified with a `scheduler`.\n *\n * #### Examples\n *\n * Subscribe with an {@link guide/observer Observer}\n *\n * ```ts\n * import { of } from 'rxjs';\n *\n * const sumObserver = {\n * sum: 0,\n * next(value) {\n * console.log('Adding: ' + value);\n * this.sum = this.sum + value;\n * },\n * error() {\n * // We actually could just remove this method,\n * // since we do not really care about errors right now.\n * },\n * complete() {\n * console.log('Sum equals: ' + this.sum);\n * }\n * };\n *\n * of(1, 2, 3) // Synchronously emits 1, 2, 3 and then completes.\n * .subscribe(sumObserver);\n *\n * // Logs:\n * // 'Adding: 1'\n * // 'Adding: 2'\n * // 'Adding: 3'\n * // 'Sum equals: 6'\n * ```\n *\n * Subscribe with functions ({@link deprecations/subscribe-arguments deprecated})\n *\n * ```ts\n * import { of } from 'rxjs'\n *\n * let sum = 0;\n *\n * of(1, 2, 3).subscribe(\n * value => {\n * console.log('Adding: ' + value);\n * sum = sum + value;\n * },\n * undefined,\n * () => console.log('Sum equals: ' + sum)\n * );\n *\n * // Logs:\n * // 'Adding: 1'\n * // 'Adding: 2'\n * // 'Adding: 3'\n * // 'Sum equals: 6'\n * ```\n *\n * Cancel a subscription\n *\n * ```ts\n * import { interval } from 'rxjs';\n *\n * const subscription = interval(1000).subscribe({\n * next(num) {\n * console.log(num)\n * },\n * complete() {\n * // Will not be called, even when cancelling subscription.\n * console.log('completed!');\n * 
}\n * });\n *\n * setTimeout(() => {\n * subscription.unsubscribe();\n * console.log('unsubscribed!');\n * }, 2500);\n *\n * // Logs:\n * // 0 after 1s\n * // 1 after 2s\n * // 'unsubscribed!' after 2.5s\n * ```\n *\n * @param {Observer|Function} observerOrNext (optional) Either an observer with methods to be called,\n * or the first of three possible handlers, which is the handler for each value emitted from the subscribed\n * Observable.\n * @param {Function} error (optional) A handler for a terminal event resulting from an error. If no error handler is provided,\n * the error will be thrown asynchronously as unhandled.\n * @param {Function} complete (optional) A handler for a terminal event resulting from successful completion.\n * @return {Subscription} a subscription reference to the registered handlers\n * @method subscribe\n */\n subscribe(\n observerOrNext?: Partial> | ((value: T) => void) | null,\n error?: ((error: any) => void) | null,\n complete?: (() => void) | null\n ): Subscription {\n const subscriber = isSubscriber(observerOrNext) ? observerOrNext : new SafeSubscriber(observerOrNext, error, complete);\n\n errorContext(() => {\n const { operator, source } = this;\n subscriber.add(\n operator\n ? // We're dealing with a subscription in the\n // operator chain to one of our lifted operators.\n operator.call(subscriber, source)\n : source\n ? // If `source` has a value, but `operator` does not, something that\n // had intimate knowledge of our API, like our `Subject`, must have\n // set it. 
We're going to just call `_subscribe` directly.\n this._subscribe(subscriber)\n : // In all other cases, we're likely wrapping a user-provided initializer\n // function, so we need to catch errors and handle them appropriately.\n this._trySubscribe(subscriber)\n );\n });\n\n return subscriber;\n }\n\n /** @internal */\n protected _trySubscribe(sink: Subscriber): TeardownLogic {\n try {\n return this._subscribe(sink);\n } catch (err) {\n // We don't need to return anything in this case,\n // because it's just going to try to `add()` to a subscription\n // above.\n sink.error(err);\n }\n }\n\n /**\n * Used as a NON-CANCELLABLE means of subscribing to an observable, for use with\n * APIs that expect promises, like `async/await`. You cannot unsubscribe from this.\n *\n * **WARNING**: Only use this with observables you *know* will complete. If the source\n * observable does not complete, you will end up with a promise that is hung up, and\n * potentially all of the state of an async function hanging out in memory. 
To avoid\n * this situation, look into adding something like {@link timeout}, {@link take},\n * {@link takeWhile}, or {@link takeUntil} amongst others.\n *\n * #### Example\n *\n * ```ts\n * import { interval, take } from 'rxjs';\n *\n * const source$ = interval(1000).pipe(take(4));\n *\n * async function getTotal() {\n * let total = 0;\n *\n * await source$.forEach(value => {\n * total += value;\n * console.log('observable -> ' + value);\n * });\n *\n * return total;\n * }\n *\n * getTotal().then(\n * total => console.log('Total: ' + total)\n * );\n *\n * // Expected:\n * // 'observable -> 0'\n * // 'observable -> 1'\n * // 'observable -> 2'\n * // 'observable -> 3'\n * // 'Total: 6'\n * ```\n *\n * @param next a handler for each value emitted by the observable\n * @return a promise that either resolves on observable completion or\n * rejects with the handled error\n */\n forEach(next: (value: T) => void): Promise;\n\n /**\n * @param next a handler for each value emitted by the observable\n * @param promiseCtor a constructor function used to instantiate the Promise\n * @return a promise that either resolves on observable completion or\n * rejects with the handled error\n * @deprecated Passing a Promise constructor will no longer be available\n * in upcoming versions of RxJS. This is because it adds weight to the library, for very\n * little benefit. If you need this functionality, it is recommended that you either\n * polyfill Promise, or you create an adapter to convert the returned native promise\n * to whatever promise implementation you wanted. 
Will be removed in v8.\n */\n forEach(next: (value: T) => void, promiseCtor: PromiseConstructorLike): Promise;\n\n forEach(next: (value: T) => void, promiseCtor?: PromiseConstructorLike): Promise {\n promiseCtor = getPromiseCtor(promiseCtor);\n\n return new promiseCtor((resolve, reject) => {\n const subscriber = new SafeSubscriber({\n next: (value) => {\n try {\n next(value);\n } catch (err) {\n reject(err);\n subscriber.unsubscribe();\n }\n },\n error: reject,\n complete: resolve,\n });\n this.subscribe(subscriber);\n }) as Promise;\n }\n\n /** @internal */\n protected _subscribe(subscriber: Subscriber): TeardownLogic {\n return this.source?.subscribe(subscriber);\n }\n\n /**\n * An interop point defined by the es7-observable spec https://github.com/zenparsing/es-observable\n * @method Symbol.observable\n * @return {Observable} this instance of the observable\n */\n [Symbol_observable]() {\n return this;\n }\n\n /* tslint:disable:max-line-length */\n pipe(): Observable;\n pipe(op1: OperatorFunction): Observable;\n pipe(op1: OperatorFunction, op2: OperatorFunction): Observable;\n pipe(op1: OperatorFunction, op2: OperatorFunction, op3: OperatorFunction): Observable;\n pipe(\n op1: OperatorFunction,\n op2: OperatorFunction,\n op3: OperatorFunction,\n op4: OperatorFunction\n ): Observable;\n pipe(\n op1: OperatorFunction,\n op2: OperatorFunction,\n op3: OperatorFunction,\n op4: OperatorFunction,\n op5: OperatorFunction\n ): Observable;\n pipe(\n op1: OperatorFunction,\n op2: OperatorFunction,\n op3: OperatorFunction,\n op4: OperatorFunction,\n op5: OperatorFunction,\n op6: OperatorFunction\n ): Observable;\n pipe(\n op1: OperatorFunction,\n op2: OperatorFunction,\n op3: OperatorFunction,\n op4: OperatorFunction,\n op5: OperatorFunction,\n op6: OperatorFunction,\n op7: OperatorFunction\n ): Observable;\n pipe(\n op1: OperatorFunction,\n op2: OperatorFunction,\n op3: OperatorFunction,\n op4: OperatorFunction,\n op5: OperatorFunction,\n op6: OperatorFunction,\n op7: 
OperatorFunction,\n op8: OperatorFunction\n ): Observable;\n pipe(\n op1: OperatorFunction,\n op2: OperatorFunction,\n op3: OperatorFunction,\n op4: OperatorFunction,\n op5: OperatorFunction,\n op6: OperatorFunction,\n op7: OperatorFunction,\n op8: OperatorFunction,\n op9: OperatorFunction\n ): Observable;\n pipe(\n op1: OperatorFunction,\n op2: OperatorFunction,\n op3: OperatorFunction,\n op4: OperatorFunction,\n op5: OperatorFunction,\n op6: OperatorFunction,\n op7: OperatorFunction,\n op8: OperatorFunction,\n op9: OperatorFunction,\n ...operations: OperatorFunction[]\n ): Observable;\n /* tslint:enable:max-line-length */\n\n /**\n * Used to stitch together functional operators into a chain.\n * @method pipe\n * @return {Observable} the Observable result of all of the operators having\n * been called in the order they were passed in.\n *\n * ## Example\n *\n * ```ts\n * import { interval, filter, map, scan } from 'rxjs';\n *\n * interval(1000)\n * .pipe(\n * filter(x => x % 2 === 0),\n * map(x => x + x),\n * scan((acc, x) => acc + x)\n * )\n * .subscribe(x => console.log(x));\n * ```\n */\n pipe(...operations: OperatorFunction[]): Observable {\n return pipeFromArray(operations)(this);\n }\n\n /* tslint:disable:max-line-length */\n /** @deprecated Replaced with {@link firstValueFrom} and {@link lastValueFrom}. Will be removed in v8. Details: https://rxjs.dev/deprecations/to-promise */\n toPromise(): Promise;\n /** @deprecated Replaced with {@link firstValueFrom} and {@link lastValueFrom}. Will be removed in v8. Details: https://rxjs.dev/deprecations/to-promise */\n toPromise(PromiseCtor: typeof Promise): Promise;\n /** @deprecated Replaced with {@link firstValueFrom} and {@link lastValueFrom}. Will be removed in v8. 
Details: https://rxjs.dev/deprecations/to-promise */\n toPromise(PromiseCtor: PromiseConstructorLike): Promise;\n /* tslint:enable:max-line-length */\n\n /**\n * Subscribe to this Observable and get a Promise resolving on\n * `complete` with the last emission (if any).\n *\n * **WARNING**: Only use this with observables you *know* will complete. If the source\n * observable does not complete, you will end up with a promise that is hung up, and\n * potentially all of the state of an async function hanging out in memory. To avoid\n * this situation, look into adding something like {@link timeout}, {@link take},\n * {@link takeWhile}, or {@link takeUntil} amongst others.\n *\n * @method toPromise\n * @param [promiseCtor] a constructor function used to instantiate\n * the Promise\n * @return A Promise that resolves with the last value emit, or\n * rejects on an error. If there were no emissions, Promise\n * resolves with undefined.\n * @deprecated Replaced with {@link firstValueFrom} and {@link lastValueFrom}. Will be removed in v8. Details: https://rxjs.dev/deprecations/to-promise\n */\n toPromise(promiseCtor?: PromiseConstructorLike): Promise {\n promiseCtor = getPromiseCtor(promiseCtor);\n\n return new promiseCtor((resolve, reject) => {\n let value: T | undefined;\n this.subscribe(\n (x: T) => (value = x),\n (err: any) => reject(err),\n () => resolve(value)\n );\n }) as Promise;\n }\n}\n\n/**\n * Decides between a passed promise constructor from consuming code,\n * A default configured promise constructor, and the native promise\n * constructor and returns it. If nothing can be found, it will throw\n * an error.\n * @param promiseCtor The optional promise constructor to passed by consuming code\n */\nfunction getPromiseCtor(promiseCtor: PromiseConstructorLike | undefined) {\n return promiseCtor ?? config.Promise ?? 
Promise;\n}\n\nfunction isObserver(value: any): value is Observer {\n return value && isFunction(value.next) && isFunction(value.error) && isFunction(value.complete);\n}\n\nfunction isSubscriber(value: any): value is Subscriber {\n return (value && value instanceof Subscriber) || (isObserver(value) && isSubscription(value));\n}\n", "import { Observable } from '../Observable';\nimport { Subscriber } from '../Subscriber';\nimport { OperatorFunction } from '../types';\nimport { isFunction } from './isFunction';\n\n/**\n * Used to determine if an object is an Observable with a lift function.\n */\nexport function hasLift(source: any): source is { lift: InstanceType['lift'] } {\n return isFunction(source?.lift);\n}\n\n/**\n * Creates an `OperatorFunction`. Used to define operators throughout the library in a concise way.\n * @param init The logic to connect the liftedSource to the subscriber at the moment of subscription.\n */\nexport function operate(\n init: (liftedSource: Observable, subscriber: Subscriber) => (() => void) | void\n): OperatorFunction {\n return (source: Observable) => {\n if (hasLift(source)) {\n return source.lift(function (this: Subscriber, liftedSource: Observable) {\n try {\n return init(liftedSource, this);\n } catch (err) {\n this.error(err);\n }\n });\n }\n throw new TypeError('Unable to lift unknown Observable type');\n };\n}\n", "import { Subscriber } from '../Subscriber';\n\n/**\n * Creates an instance of an `OperatorSubscriber`.\n * @param destination The downstream subscriber.\n * @param onNext Handles next values, only called if this subscriber is not stopped or closed. Any\n * error that occurs in this function is caught and sent to the `error` method of this subscriber.\n * @param onError Handles errors from the subscription, any errors that occur in this handler are caught\n * and send to the `destination` error handler.\n * @param onComplete Handles completion notification from the subscription. 
Any errors that occur in\n * this handler are sent to the `destination` error handler.\n * @param onFinalize Additional teardown logic here. This will only be called on teardown if the\n * subscriber itself is not already closed. This is called after all other teardown logic is executed.\n */\nexport function createOperatorSubscriber(\n destination: Subscriber,\n onNext?: (value: T) => void,\n onComplete?: () => void,\n onError?: (err: any) => void,\n onFinalize?: () => void\n): Subscriber {\n return new OperatorSubscriber(destination, onNext, onComplete, onError, onFinalize);\n}\n\n/**\n * A generic helper for allowing operators to be created with a Subscriber and\n * use closures to capture necessary state from the operator function itself.\n */\nexport class OperatorSubscriber extends Subscriber {\n /**\n * Creates an instance of an `OperatorSubscriber`.\n * @param destination The downstream subscriber.\n * @param onNext Handles next values, only called if this subscriber is not stopped or closed. Any\n * error that occurs in this function is caught and sent to the `error` method of this subscriber.\n * @param onError Handles errors from the subscription, any errors that occur in this handler are caught\n * and send to the `destination` error handler.\n * @param onComplete Handles completion notification from the subscription. Any errors that occur in\n * this handler are sent to the `destination` error handler.\n * @param onFinalize Additional finalization logic here. This will only be called on finalization if the\n * subscriber itself is not already closed. 
This is called after all other finalization logic is executed.\n * @param shouldUnsubscribe An optional check to see if an unsubscribe call should truly unsubscribe.\n * NOTE: This currently **ONLY** exists to support the strange behavior of {@link groupBy}, where unsubscription\n * to the resulting observable does not actually disconnect from the source if there are active subscriptions\n * to any grouped observable. (DO NOT EXPOSE OR USE EXTERNALLY!!!)\n */\n constructor(\n destination: Subscriber,\n onNext?: (value: T) => void,\n onComplete?: () => void,\n onError?: (err: any) => void,\n private onFinalize?: () => void,\n private shouldUnsubscribe?: () => boolean\n ) {\n // It's important - for performance reasons - that all of this class's\n // members are initialized and that they are always initialized in the same\n // order. This will ensure that all OperatorSubscriber instances have the\n // same hidden class in V8. This, in turn, will help keep the number of\n // hidden classes involved in property accesses within the base class as\n // low as possible. If the number of hidden classes involved exceeds four,\n // the property accesses will become megamorphic and performance penalties\n // will be incurred - i.e. inline caches won't be used.\n //\n // The reasons for ensuring all instances have the same hidden class are\n // further discussed in this blog post from Benedikt Meurer:\n // https://benediktmeurer.de/2018/03/23/impact-of-polymorphism-on-component-based-frameworks-like-react/\n super(destination);\n this._next = onNext\n ? function (this: OperatorSubscriber, value: T) {\n try {\n onNext(value);\n } catch (err) {\n destination.error(err);\n }\n }\n : super._next;\n this._error = onError\n ? 
function (this: OperatorSubscriber, err: any) {\n try {\n onError(err);\n } catch (err) {\n // Send any errors that occur down stream.\n destination.error(err);\n } finally {\n // Ensure finalization.\n this.unsubscribe();\n }\n }\n : super._error;\n this._complete = onComplete\n ? function (this: OperatorSubscriber) {\n try {\n onComplete();\n } catch (err) {\n // Send any errors that occur down stream.\n destination.error(err);\n } finally {\n // Ensure finalization.\n this.unsubscribe();\n }\n }\n : super._complete;\n }\n\n unsubscribe() {\n if (!this.shouldUnsubscribe || this.shouldUnsubscribe()) {\n const { closed } = this;\n super.unsubscribe();\n // Execute additional teardown if we have any and we didn't already do so.\n !closed && this.onFinalize?.();\n }\n }\n}\n", "import { Subscription } from '../Subscription';\n\ninterface AnimationFrameProvider {\n schedule(callback: FrameRequestCallback): Subscription;\n requestAnimationFrame: typeof requestAnimationFrame;\n cancelAnimationFrame: typeof cancelAnimationFrame;\n delegate:\n | {\n requestAnimationFrame: typeof requestAnimationFrame;\n cancelAnimationFrame: typeof cancelAnimationFrame;\n }\n | undefined;\n}\n\nexport const animationFrameProvider: AnimationFrameProvider = {\n // When accessing the delegate, use the variable rather than `this` so that\n // the functions can be called without being bound to the provider.\n schedule(callback) {\n let request = requestAnimationFrame;\n let cancel: typeof cancelAnimationFrame | undefined = cancelAnimationFrame;\n const { delegate } = animationFrameProvider;\n if (delegate) {\n request = delegate.requestAnimationFrame;\n cancel = delegate.cancelAnimationFrame;\n }\n const handle = request((timestamp) => {\n // Clear the cancel function. 
The request has been fulfilled, so\n // attempting to cancel the request upon unsubscription would be\n // pointless.\n cancel = undefined;\n callback(timestamp);\n });\n return new Subscription(() => cancel?.(handle));\n },\n requestAnimationFrame(...args) {\n const { delegate } = animationFrameProvider;\n return (delegate?.requestAnimationFrame || requestAnimationFrame)(...args);\n },\n cancelAnimationFrame(...args) {\n const { delegate } = animationFrameProvider;\n return (delegate?.cancelAnimationFrame || cancelAnimationFrame)(...args);\n },\n delegate: undefined,\n};\n", "import { createErrorClass } from './createErrorClass';\n\nexport interface ObjectUnsubscribedError extends Error {}\n\nexport interface ObjectUnsubscribedErrorCtor {\n /**\n * @deprecated Internal implementation detail. Do not construct error instances.\n * Cannot be tagged as internal: https://github.com/ReactiveX/rxjs/issues/6269\n */\n new (): ObjectUnsubscribedError;\n}\n\n/**\n * An error thrown when an action is invalid because the object has been\n * unsubscribed.\n *\n * @see {@link Subject}\n * @see {@link BehaviorSubject}\n *\n * @class ObjectUnsubscribedError\n */\nexport const ObjectUnsubscribedError: ObjectUnsubscribedErrorCtor = createErrorClass(\n (_super) =>\n function ObjectUnsubscribedErrorImpl(this: any) {\n _super(this);\n this.name = 'ObjectUnsubscribedError';\n this.message = 'object unsubscribed';\n }\n);\n", "import { Operator } from './Operator';\nimport { Observable } from './Observable';\nimport { Subscriber } from './Subscriber';\nimport { Subscription, EMPTY_SUBSCRIPTION } from './Subscription';\nimport { Observer, SubscriptionLike, TeardownLogic } from './types';\nimport { ObjectUnsubscribedError } from './util/ObjectUnsubscribedError';\nimport { arrRemove } from './util/arrRemove';\nimport { errorContext } from './util/errorContext';\n\n/**\n * A Subject is a special type of Observable that allows values to be\n * multicasted to many Observers. 
Subjects are like EventEmitters.\n *\n * Every Subject is an Observable and an Observer. You can subscribe to a\n * Subject, and you can call next to feed values as well as error and complete.\n */\nexport class Subject extends Observable implements SubscriptionLike {\n closed = false;\n\n private currentObservers: Observer[] | null = null;\n\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. */\n observers: Observer[] = [];\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. */\n isStopped = false;\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. */\n hasError = false;\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. */\n thrownError: any = null;\n\n /**\n * Creates a \"subject\" by basically gluing an observer to an observable.\n *\n * @nocollapse\n * @deprecated Recommended you do not use. Will be removed at some point in the future. Plans for replacement still under discussion.\n */\n static create: (...args: any[]) => any = (destination: Observer, source: Observable): AnonymousSubject => {\n return new AnonymousSubject(destination, source);\n };\n\n constructor() {\n // NOTE: This must be here to obscure Observable's constructor.\n super();\n }\n\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. 
*/\n lift(operator: Operator): Observable {\n const subject = new AnonymousSubject(this, this);\n subject.operator = operator as any;\n return subject as any;\n }\n\n /** @internal */\n protected _throwIfClosed() {\n if (this.closed) {\n throw new ObjectUnsubscribedError();\n }\n }\n\n next(value: T) {\n errorContext(() => {\n this._throwIfClosed();\n if (!this.isStopped) {\n if (!this.currentObservers) {\n this.currentObservers = Array.from(this.observers);\n }\n for (const observer of this.currentObservers) {\n observer.next(value);\n }\n }\n });\n }\n\n error(err: any) {\n errorContext(() => {\n this._throwIfClosed();\n if (!this.isStopped) {\n this.hasError = this.isStopped = true;\n this.thrownError = err;\n const { observers } = this;\n while (observers.length) {\n observers.shift()!.error(err);\n }\n }\n });\n }\n\n complete() {\n errorContext(() => {\n this._throwIfClosed();\n if (!this.isStopped) {\n this.isStopped = true;\n const { observers } = this;\n while (observers.length) {\n observers.shift()!.complete();\n }\n }\n });\n }\n\n unsubscribe() {\n this.isStopped = this.closed = true;\n this.observers = this.currentObservers = null!;\n }\n\n get observed() {\n return this.observers?.length > 0;\n }\n\n /** @internal */\n protected _trySubscribe(subscriber: Subscriber): TeardownLogic {\n this._throwIfClosed();\n return super._trySubscribe(subscriber);\n }\n\n /** @internal */\n protected _subscribe(subscriber: Subscriber): Subscription {\n this._throwIfClosed();\n this._checkFinalizedStatuses(subscriber);\n return this._innerSubscribe(subscriber);\n }\n\n /** @internal */\n protected _innerSubscribe(subscriber: Subscriber) {\n const { hasError, isStopped, observers } = this;\n if (hasError || isStopped) {\n return EMPTY_SUBSCRIPTION;\n }\n this.currentObservers = null;\n observers.push(subscriber);\n return new Subscription(() => {\n this.currentObservers = null;\n arrRemove(observers, subscriber);\n });\n }\n\n /** @internal */\n protected 
_checkFinalizedStatuses(subscriber: Subscriber) {\n const { hasError, thrownError, isStopped } = this;\n if (hasError) {\n subscriber.error(thrownError);\n } else if (isStopped) {\n subscriber.complete();\n }\n }\n\n /**\n * Creates a new Observable with this Subject as the source. You can do this\n * to create custom Observer-side logic of the Subject and conceal it from\n * code that uses the Observable.\n * @return {Observable} Observable that the Subject casts to\n */\n asObservable(): Observable {\n const observable: any = new Observable();\n observable.source = this;\n return observable;\n }\n}\n\n/**\n * @class AnonymousSubject\n */\nexport class AnonymousSubject extends Subject {\n constructor(\n /** @deprecated Internal implementation detail, do not use directly. Will be made internal in v8. */\n public destination?: Observer,\n source?: Observable\n ) {\n super();\n this.source = source;\n }\n\n next(value: T) {\n this.destination?.next?.(value);\n }\n\n error(err: any) {\n this.destination?.error?.(err);\n }\n\n complete() {\n this.destination?.complete?.();\n }\n\n /** @internal */\n protected _subscribe(subscriber: Subscriber): Subscription {\n return this.source?.subscribe(subscriber) ?? 
EMPTY_SUBSCRIPTION;\n }\n}\n", "import { Subject } from './Subject';\nimport { Subscriber } from './Subscriber';\nimport { Subscription } from './Subscription';\n\n/**\n * A variant of Subject that requires an initial value and emits its current\n * value whenever it is subscribed to.\n *\n * @class BehaviorSubject\n */\nexport class BehaviorSubject extends Subject {\n constructor(private _value: T) {\n super();\n }\n\n get value(): T {\n return this.getValue();\n }\n\n /** @internal */\n protected _subscribe(subscriber: Subscriber): Subscription {\n const subscription = super._subscribe(subscriber);\n !subscription.closed && subscriber.next(this._value);\n return subscription;\n }\n\n getValue(): T {\n const { hasError, thrownError, _value } = this;\n if (hasError) {\n throw thrownError;\n }\n this._throwIfClosed();\n return _value;\n }\n\n next(value: T): void {\n super.next((this._value = value));\n }\n}\n", "import { TimestampProvider } from '../types';\n\ninterface DateTimestampProvider extends TimestampProvider {\n delegate: TimestampProvider | undefined;\n}\n\nexport const dateTimestampProvider: DateTimestampProvider = {\n now() {\n // Use the variable rather than `this` so that the function can be called\n // without being bound to the provider.\n return (dateTimestampProvider.delegate || Date).now();\n },\n delegate: undefined,\n};\n", "import { Subject } from './Subject';\nimport { TimestampProvider } from './types';\nimport { Subscriber } from './Subscriber';\nimport { Subscription } from './Subscription';\nimport { dateTimestampProvider } from './scheduler/dateTimestampProvider';\n\n/**\n * A variant of {@link Subject} that \"replays\" old values to new subscribers by emitting them when they first subscribe.\n *\n * `ReplaySubject` has an internal buffer that will store a specified number of values that it has observed. Like `Subject`,\n * `ReplaySubject` \"observes\" values by having them passed to its `next` method. 
When it observes a value, it will store that\n * value for a time determined by the configuration of the `ReplaySubject`, as passed to its constructor.\n *\n * When a new subscriber subscribes to the `ReplaySubject` instance, it will synchronously emit all values in its buffer in\n * a First-In-First-Out (FIFO) manner. The `ReplaySubject` will also complete, if it has observed completion; and it will\n * error if it has observed an error.\n *\n * There are two main configuration items to be concerned with:\n *\n * 1. `bufferSize` - This will determine how many items are stored in the buffer, defaults to infinite.\n * 2. `windowTime` - The amount of time to hold a value in the buffer before removing it from the buffer.\n *\n * Both configurations may exist simultaneously. So if you would like to buffer a maximum of 3 values, as long as the values\n * are less than 2 seconds old, you could do so with a `new ReplaySubject(3, 2000)`.\n *\n * ### Differences with BehaviorSubject\n *\n * `BehaviorSubject` is similar to `new ReplaySubject(1)`, with a couple of exceptions:\n *\n * 1. `BehaviorSubject` comes \"primed\" with a single value upon construction.\n * 2. `ReplaySubject` will replay values, even after observing an error, where `BehaviorSubject` will not.\n *\n * @see {@link Subject}\n * @see {@link BehaviorSubject}\n * @see {@link shareReplay}\n */\nexport class ReplaySubject extends Subject {\n private _buffer: (T | number)[] = [];\n private _infiniteTimeWindow = true;\n\n /**\n * @param bufferSize The size of the buffer to replay on subscription\n * @param windowTime The amount of time the buffered items will stay buffered\n * @param timestampProvider An object with a `now()` method that provides the current timestamp. 
This is used to\n * calculate the amount of time something has been buffered.\n */\n constructor(\n private _bufferSize = Infinity,\n private _windowTime = Infinity,\n private _timestampProvider: TimestampProvider = dateTimestampProvider\n ) {\n super();\n this._infiniteTimeWindow = _windowTime === Infinity;\n this._bufferSize = Math.max(1, _bufferSize);\n this._windowTime = Math.max(1, _windowTime);\n }\n\n next(value: T): void {\n const { isStopped, _buffer, _infiniteTimeWindow, _timestampProvider, _windowTime } = this;\n if (!isStopped) {\n _buffer.push(value);\n !_infiniteTimeWindow && _buffer.push(_timestampProvider.now() + _windowTime);\n }\n this._trimBuffer();\n super.next(value);\n }\n\n /** @internal */\n protected _subscribe(subscriber: Subscriber): Subscription {\n this._throwIfClosed();\n this._trimBuffer();\n\n const subscription = this._innerSubscribe(subscriber);\n\n const { _infiniteTimeWindow, _buffer } = this;\n // We use a copy here, so reentrant code does not mutate our array while we're\n // emitting it to a new subscriber.\n const copy = _buffer.slice();\n for (let i = 0; i < copy.length && !subscriber.closed; i += _infiniteTimeWindow ? 1 : 2) {\n subscriber.next(copy[i] as T);\n }\n\n this._checkFinalizedStatuses(subscriber);\n\n return subscription;\n }\n\n private _trimBuffer() {\n const { _bufferSize, _timestampProvider, _buffer, _infiniteTimeWindow } = this;\n // If we don't have an infinite buffer size, and we're over the length,\n // use splice to truncate the old buffer values off. Note that we have to\n // double the size for instances where we're not using an infinite time window\n // because we're storing the values and the timestamps in the same array.\n const adjustedBufferSize = (_infiniteTimeWindow ? 
1 : 2) * _bufferSize;\n _bufferSize < Infinity && adjustedBufferSize < _buffer.length && _buffer.splice(0, _buffer.length - adjustedBufferSize);\n\n // Now, if we're not in an infinite time window, remove all values where the time is\n // older than what is allowed.\n if (!_infiniteTimeWindow) {\n const now = _timestampProvider.now();\n let last = 0;\n // Search the array for the first timestamp that isn't expired and\n // truncate the buffer up to that point.\n for (let i = 1; i < _buffer.length && (_buffer[i] as number) <= now; i += 2) {\n last = i;\n }\n last && _buffer.splice(0, last + 1);\n }\n }\n}\n", "import { Scheduler } from '../Scheduler';\nimport { Subscription } from '../Subscription';\nimport { SchedulerAction } from '../types';\n\n/**\n * A unit of work to be executed in a `scheduler`. An action is typically\n * created from within a {@link SchedulerLike} and an RxJS user does not need to concern\n * themselves about creating and manipulating an Action.\n *\n * ```ts\n * class Action extends Subscription {\n * new (scheduler: Scheduler, work: (state?: T) => void);\n * schedule(state?: T, delay: number = 0): Subscription;\n * }\n * ```\n *\n * @class Action\n */\nexport class Action extends Subscription {\n constructor(scheduler: Scheduler, work: (this: SchedulerAction, state?: T) => void) {\n super();\n }\n /**\n * Schedules this action on its parent {@link SchedulerLike} for execution. May be passed\n * some context object, `state`. 
May happen at some point in the future,\n * according to the `delay` parameter, if specified.\n * @param {T} [state] Some contextual data that the `work` function uses when\n * called by the Scheduler.\n * @param {number} [delay] Time to wait before executing the work, where the\n * time unit is implicit and defined by the Scheduler.\n * @return {void}\n */\n public schedule(state?: T, delay: number = 0): Subscription {\n return this;\n }\n}\n", "import type { TimerHandle } from './timerHandle';\ntype SetIntervalFunction = (handler: () => void, timeout?: number, ...args: any[]) => TimerHandle;\ntype ClearIntervalFunction = (handle: TimerHandle) => void;\n\ninterface IntervalProvider {\n setInterval: SetIntervalFunction;\n clearInterval: ClearIntervalFunction;\n delegate:\n | {\n setInterval: SetIntervalFunction;\n clearInterval: ClearIntervalFunction;\n }\n | undefined;\n}\n\nexport const intervalProvider: IntervalProvider = {\n // When accessing the delegate, use the variable rather than `this` so that\n // the functions can be called without being bound to the provider.\n setInterval(handler: () => void, timeout?: number, ...args) {\n const { delegate } = intervalProvider;\n if (delegate?.setInterval) {\n return delegate.setInterval(handler, timeout, ...args);\n }\n return setInterval(handler, timeout, ...args);\n },\n clearInterval(handle) {\n const { delegate } = intervalProvider;\n return (delegate?.clearInterval || clearInterval)(handle as any);\n },\n delegate: undefined,\n};\n", "import { Action } from './Action';\nimport { SchedulerAction } from '../types';\nimport { Subscription } from '../Subscription';\nimport { AsyncScheduler } from './AsyncScheduler';\nimport { intervalProvider } from './intervalProvider';\nimport { arrRemove } from '../util/arrRemove';\nimport { TimerHandle } from './timerHandle';\n\nexport class AsyncAction extends Action {\n public id: TimerHandle | undefined;\n public state?: T;\n // @ts-ignore: Property has no initializer and is 
not definitely assigned\n public delay: number;\n protected pending: boolean = false;\n\n constructor(protected scheduler: AsyncScheduler, protected work: (this: SchedulerAction, state?: T) => void) {\n super(scheduler, work);\n }\n\n public schedule(state?: T, delay: number = 0): Subscription {\n if (this.closed) {\n return this;\n }\n\n // Always replace the current state with the new state.\n this.state = state;\n\n const id = this.id;\n const scheduler = this.scheduler;\n\n //\n // Important implementation note:\n //\n // Actions only execute once by default, unless rescheduled from within the\n // scheduled callback. This allows us to implement single and repeat\n // actions via the same code path, without adding API surface area, as well\n // as mimic traditional recursion but across asynchronous boundaries.\n //\n // However, JS runtimes and timers distinguish between intervals achieved by\n // serial `setTimeout` calls vs. a single `setInterval` call. An interval of\n // serial `setTimeout` calls can be individually delayed, which delays\n // scheduling the next `setTimeout`, and so on. `setInterval` attempts to\n // guarantee the interval callback will be invoked more precisely to the\n // interval period, regardless of load.\n //\n // Therefore, we use `setInterval` to schedule single and repeat actions.\n // If the action reschedules itself with the same delay, the interval is not\n // canceled. If the action doesn't reschedule, or reschedules with a\n // different delay, the interval will be canceled after scheduled callback\n // execution.\n //\n if (id != null) {\n this.id = this.recycleAsyncId(scheduler, id, delay);\n }\n\n // Set the pending flag indicating that this action has been scheduled, or\n // has recursively rescheduled itself.\n this.pending = true;\n\n this.delay = delay;\n // If this action has already an async Id, don't request a new one.\n this.id = this.id ?? 
this.requestAsyncId(scheduler, this.id, delay);\n\n return this;\n }\n\n protected requestAsyncId(scheduler: AsyncScheduler, _id?: TimerHandle, delay: number = 0): TimerHandle {\n return intervalProvider.setInterval(scheduler.flush.bind(scheduler, this), delay);\n }\n\n protected recycleAsyncId(_scheduler: AsyncScheduler, id?: TimerHandle, delay: number | null = 0): TimerHandle | undefined {\n // If this action is rescheduled with the same delay time, don't clear the interval id.\n if (delay != null && this.delay === delay && this.pending === false) {\n return id;\n }\n // Otherwise, if the action's delay time is different from the current delay,\n // or the action has been rescheduled before it's executed, clear the interval id\n if (id != null) {\n intervalProvider.clearInterval(id);\n }\n\n return undefined;\n }\n\n /**\n * Immediately executes this action and the `work` it contains.\n * @return {any}\n */\n public execute(state: T, delay: number): any {\n if (this.closed) {\n return new Error('executing a cancelled action');\n }\n\n this.pending = false;\n const error = this._execute(state, delay);\n if (error) {\n return error;\n } else if (this.pending === false && this.id != null) {\n // Dequeue if the action didn't reschedule itself. Don't call\n // unsubscribe(), because the action could reschedule later.\n // For example:\n // ```\n // scheduler.schedule(function doWork(counter) {\n // /* ... I'm a busy worker bee ... 
*/\n // var originalAction = this;\n // /* wait 100ms before rescheduling the action */\n // setTimeout(function () {\n // originalAction.schedule(counter + 1);\n // }, 100);\n // }, 1000);\n // ```\n this.id = this.recycleAsyncId(this.scheduler, this.id, null);\n }\n }\n\n protected _execute(state: T, _delay: number): any {\n let errored: boolean = false;\n let errorValue: any;\n try {\n this.work(state);\n } catch (e) {\n errored = true;\n // HACK: Since code elsewhere is relying on the \"truthiness\" of the\n // return here, we can't have it return \"\" or 0 or false.\n // TODO: Clean this up when we refactor schedulers mid-version-8 or so.\n errorValue = e ? e : new Error('Scheduled action threw falsy error');\n }\n if (errored) {\n this.unsubscribe();\n return errorValue;\n }\n }\n\n unsubscribe() {\n if (!this.closed) {\n const { id, scheduler } = this;\n const { actions } = scheduler;\n\n this.work = this.state = this.scheduler = null!;\n this.pending = false;\n\n arrRemove(actions, this);\n if (id != null) {\n this.id = this.recycleAsyncId(scheduler, id, null);\n }\n\n this.delay = null!;\n super.unsubscribe();\n }\n }\n}\n", "import { Action } from './scheduler/Action';\nimport { Subscription } from './Subscription';\nimport { SchedulerLike, SchedulerAction } from './types';\nimport { dateTimestampProvider } from './scheduler/dateTimestampProvider';\n\n/**\n * An execution context and a data structure to order tasks and schedule their\n * execution. Provides a notion of (potentially virtual) time, through the\n * `now()` getter method.\n *\n * Each unit of work in a Scheduler is called an `Action`.\n *\n * ```ts\n * class Scheduler {\n * now(): number;\n * schedule(work, delay?, state?): Subscription;\n * }\n * ```\n *\n * @class Scheduler\n * @deprecated Scheduler is an internal implementation detail of RxJS, and\n * should not be used directly. Rather, create your own class and implement\n * {@link SchedulerLike}. 
Will be made internal in v8.\n */\nexport class Scheduler implements SchedulerLike {\n public static now: () => number = dateTimestampProvider.now;\n\n constructor(private schedulerActionCtor: typeof Action, now: () => number = Scheduler.now) {\n this.now = now;\n }\n\n /**\n * A getter method that returns a number representing the current time\n * (at the time this function was called) according to the scheduler's own\n * internal clock.\n * @return {number} A number that represents the current time. May or may not\n * have a relation to wall-clock time. May or may not refer to a time unit\n * (e.g. milliseconds).\n */\n public now: () => number;\n\n /**\n * Schedules a function, `work`, for execution. May happen at some point in\n * the future, according to the `delay` parameter, if specified. May be passed\n * some context object, `state`, which will be passed to the `work` function.\n *\n * The given arguments will be processed an stored as an Action object in a\n * queue of actions.\n *\n * @param {function(state: ?T): ?Subscription} work A function representing a\n * task, or some unit of work to be executed by the Scheduler.\n * @param {number} [delay] Time to wait before executing the work, where the\n * time unit is implicit and defined by the Scheduler itself.\n * @param {T} [state] Some contextual data that the `work` function uses when\n * called by the Scheduler.\n * @return {Subscription} A subscription in order to be able to unsubscribe\n * the scheduled work.\n */\n public schedule(work: (this: SchedulerAction, state?: T) => void, delay: number = 0, state?: T): Subscription {\n return new this.schedulerActionCtor(this, work).schedule(state, delay);\n }\n}\n", "import { Scheduler } from '../Scheduler';\nimport { Action } from './Action';\nimport { AsyncAction } from './AsyncAction';\nimport { TimerHandle } from './timerHandle';\n\nexport class AsyncScheduler extends Scheduler {\n public actions: Array> = [];\n /**\n * A flag to indicate whether the 
Scheduler is currently executing a batch of\n * queued actions.\n * @type {boolean}\n * @internal\n */\n public _active: boolean = false;\n /**\n * An internal ID used to track the latest asynchronous task such as those\n * coming from `setTimeout`, `setInterval`, `requestAnimationFrame`, and\n * others.\n * @type {any}\n * @internal\n */\n public _scheduled: TimerHandle | undefined;\n\n constructor(SchedulerAction: typeof Action, now: () => number = Scheduler.now) {\n super(SchedulerAction, now);\n }\n\n public flush(action: AsyncAction): void {\n const { actions } = this;\n\n if (this._active) {\n actions.push(action);\n return;\n }\n\n let error: any;\n this._active = true;\n\n do {\n if ((error = action.execute(action.state, action.delay))) {\n break;\n }\n } while ((action = actions.shift()!)); // exhaust the scheduler queue\n\n this._active = false;\n\n if (error) {\n while ((action = actions.shift()!)) {\n action.unsubscribe();\n }\n throw error;\n }\n }\n}\n", "import { AsyncAction } from './AsyncAction';\nimport { AsyncScheduler } from './AsyncScheduler';\n\n/**\n *\n * Async Scheduler\n *\n * Schedule task as if you used setTimeout(task, duration)\n *\n * `async` scheduler schedules tasks asynchronously, by putting them on the JavaScript\n * event loop queue. 
It is best used to delay tasks in time or to schedule tasks repeating\n * in intervals.\n *\n * If you just want to \"defer\" task, that is to perform it right after currently\n * executing synchronous code ends (commonly achieved by `setTimeout(deferredTask, 0)`),\n * better choice will be the {@link asapScheduler} scheduler.\n *\n * ## Examples\n * Use async scheduler to delay task\n * ```ts\n * import { asyncScheduler } from 'rxjs';\n *\n * const task = () => console.log('it works!');\n *\n * asyncScheduler.schedule(task, 2000);\n *\n * // After 2 seconds logs:\n * // \"it works!\"\n * ```\n *\n * Use async scheduler to repeat task in intervals\n * ```ts\n * import { asyncScheduler } from 'rxjs';\n *\n * function task(state) {\n * console.log(state);\n * this.schedule(state + 1, 1000); // `this` references currently executing Action,\n * // which we reschedule with new state and delay\n * }\n *\n * asyncScheduler.schedule(task, 3000, 0);\n *\n * // Logs:\n * // 0 after 3s\n * // 1 after 4s\n * // 2 after 5s\n * // 3 after 6s\n * ```\n */\n\nexport const asyncScheduler = new AsyncScheduler(AsyncAction);\n\n/**\n * @deprecated Renamed to {@link asyncScheduler}. Will be removed in v8.\n */\nexport const async = asyncScheduler;\n", "import { AsyncAction } from './AsyncAction';\nimport { Subscription } from '../Subscription';\nimport { QueueScheduler } from './QueueScheduler';\nimport { SchedulerAction } from '../types';\nimport { TimerHandle } from './timerHandle';\n\nexport class QueueAction extends AsyncAction {\n constructor(protected scheduler: QueueScheduler, protected work: (this: SchedulerAction, state?: T) => void) {\n super(scheduler, work);\n }\n\n public schedule(state?: T, delay: number = 0): Subscription {\n if (delay > 0) {\n return super.schedule(state, delay);\n }\n this.delay = delay;\n this.state = state;\n this.scheduler.flush(this);\n return this;\n }\n\n public execute(state: T, delay: number): any {\n return delay > 0 || this.closed ? 
super.execute(state, delay) : this._execute(state, delay);\n }\n\n protected requestAsyncId(scheduler: QueueScheduler, id?: TimerHandle, delay: number = 0): TimerHandle {\n // If delay exists and is greater than 0, or if the delay is null (the\n // action wasn't rescheduled) but was originally scheduled as an async\n // action, then recycle as an async action.\n\n if ((delay != null && delay > 0) || (delay == null && this.delay > 0)) {\n return super.requestAsyncId(scheduler, id, delay);\n }\n\n // Otherwise flush the scheduler starting with this action.\n scheduler.flush(this);\n\n // HACK: In the past, this was returning `void`. However, `void` isn't a valid\n // `TimerHandle`, and generally the return value here isn't really used. So the\n // compromise is to return `0` which is both \"falsy\" and a valid `TimerHandle`,\n // as opposed to refactoring every other instanceo of `requestAsyncId`.\n return 0;\n }\n}\n", "import { AsyncScheduler } from './AsyncScheduler';\n\nexport class QueueScheduler extends AsyncScheduler {\n}\n", "import { QueueAction } from './QueueAction';\nimport { QueueScheduler } from './QueueScheduler';\n\n/**\n *\n * Queue Scheduler\n *\n * Put every next task on a queue, instead of executing it immediately\n *\n * `queue` scheduler, when used with delay, behaves the same as {@link asyncScheduler} scheduler.\n *\n * When used without delay, it schedules given task synchronously - executes it right when\n * it is scheduled. 
However when called recursively, that is when inside the scheduled task,\n * another task is scheduled with queue scheduler, instead of executing immediately as well,\n * that task will be put on a queue and wait for current one to finish.\n *\n * This means that when you execute task with `queue` scheduler, you are sure it will end\n * before any other task scheduled with that scheduler will start.\n *\n * ## Examples\n * Schedule recursively first, then do something\n * ```ts\n * import { queueScheduler } from 'rxjs';\n *\n * queueScheduler.schedule(() => {\n * queueScheduler.schedule(() => console.log('second')); // will not happen now, but will be put on a queue\n *\n * console.log('first');\n * });\n *\n * // Logs:\n * // \"first\"\n * // \"second\"\n * ```\n *\n * Reschedule itself recursively\n * ```ts\n * import { queueScheduler } from 'rxjs';\n *\n * queueScheduler.schedule(function(state) {\n * if (state !== 0) {\n * console.log('before', state);\n * this.schedule(state - 1); // `this` references currently executing Action,\n * // which we reschedule with new state\n * console.log('after', state);\n * }\n * }, 0, 3);\n *\n * // In scheduler that runs recursively, you would expect:\n * // \"before\", 3\n * // \"before\", 2\n * // \"before\", 1\n * // \"after\", 1\n * // \"after\", 2\n * // \"after\", 3\n *\n * // But with queue it logs:\n * // \"before\", 3\n * // \"after\", 3\n * // \"before\", 2\n * // \"after\", 2\n * // \"before\", 1\n * // \"after\", 1\n * ```\n */\n\nexport const queueScheduler = new QueueScheduler(QueueAction);\n\n/**\n * @deprecated Renamed to {@link queueScheduler}. 
Will be removed in v8.\n */\nexport const queue = queueScheduler;\n", "import { AsyncAction } from './AsyncAction';\nimport { AnimationFrameScheduler } from './AnimationFrameScheduler';\nimport { SchedulerAction } from '../types';\nimport { animationFrameProvider } from './animationFrameProvider';\nimport { TimerHandle } from './timerHandle';\n\nexport class AnimationFrameAction extends AsyncAction {\n constructor(protected scheduler: AnimationFrameScheduler, protected work: (this: SchedulerAction, state?: T) => void) {\n super(scheduler, work);\n }\n\n protected requestAsyncId(scheduler: AnimationFrameScheduler, id?: TimerHandle, delay: number = 0): TimerHandle {\n // If delay is greater than 0, request as an async action.\n if (delay !== null && delay > 0) {\n return super.requestAsyncId(scheduler, id, delay);\n }\n // Push the action to the end of the scheduler queue.\n scheduler.actions.push(this);\n // If an animation frame has already been requested, don't request another\n // one. If an animation frame hasn't been requested yet, request one. Return\n // the current animation frame request id.\n return scheduler._scheduled || (scheduler._scheduled = animationFrameProvider.requestAnimationFrame(() => scheduler.flush(undefined)));\n }\n\n protected recycleAsyncId(scheduler: AnimationFrameScheduler, id?: TimerHandle, delay: number = 0): TimerHandle | undefined {\n // If delay exists and is greater than 0, or if the delay is null (the\n // action wasn't rescheduled) but was originally scheduled as an async\n // action, then recycle as an async action.\n if (delay != null ? 
delay > 0 : this.delay > 0) {\n return super.recycleAsyncId(scheduler, id, delay);\n }\n // If the scheduler queue has no remaining actions with the same async id,\n // cancel the requested animation frame and set the scheduled flag to\n // undefined so the next AnimationFrameAction will request its own.\n const { actions } = scheduler;\n if (id != null && actions[actions.length - 1]?.id !== id) {\n animationFrameProvider.cancelAnimationFrame(id as number);\n scheduler._scheduled = undefined;\n }\n // Return undefined so the action knows to request a new async id if it's rescheduled.\n return undefined;\n }\n}\n", "import { AsyncAction } from './AsyncAction';\nimport { AsyncScheduler } from './AsyncScheduler';\n\nexport class AnimationFrameScheduler extends AsyncScheduler {\n public flush(action?: AsyncAction): void {\n this._active = true;\n // The async id that effects a call to flush is stored in _scheduled.\n // Before executing an action, it's necessary to check the action's async\n // id to determine whether it's supposed to be executed in the current\n // flush.\n // Previous implementations of this method used a count to determine this,\n // but that was unsound, as actions that are unsubscribed - i.e. 
cancelled -\n // are removed from the actions array and that can shift actions that are\n // scheduled to be executed in a subsequent flush into positions at which\n // they are executed within the current flush.\n const flushId = this._scheduled;\n this._scheduled = undefined;\n\n const { actions } = this;\n let error: any;\n action = action || actions.shift()!;\n\n do {\n if ((error = action.execute(action.state, action.delay))) {\n break;\n }\n } while ((action = actions[0]) && action.id === flushId && actions.shift());\n\n this._active = false;\n\n if (error) {\n while ((action = actions[0]) && action.id === flushId && actions.shift()) {\n action.unsubscribe();\n }\n throw error;\n }\n }\n}\n", "import { AnimationFrameAction } from './AnimationFrameAction';\nimport { AnimationFrameScheduler } from './AnimationFrameScheduler';\n\n/**\n *\n * Animation Frame Scheduler\n *\n * Perform task when `window.requestAnimationFrame` would fire\n *\n * When `animationFrame` scheduler is used with delay, it will fall back to {@link asyncScheduler} scheduler\n * behaviour.\n *\n * Without delay, `animationFrame` scheduler can be used to create smooth browser animations.\n * It makes sure scheduled task will happen just before next browser content repaint,\n * thus performing animations as efficiently as possible.\n *\n * ## Example\n * Schedule div height animation\n * ```ts\n * // html:
\n * import { animationFrameScheduler } from 'rxjs';\n *\n * const div = document.querySelector('div');\n *\n * animationFrameScheduler.schedule(function(height) {\n * div.style.height = height + \"px\";\n *\n * this.schedule(height + 1); // `this` references currently executing Action,\n * // which we reschedule with new state\n * }, 0, 0);\n *\n * // You will see a div element growing in height\n * ```\n */\n\nexport const animationFrameScheduler = new AnimationFrameScheduler(AnimationFrameAction);\n\n/**\n * @deprecated Renamed to {@link animationFrameScheduler}. Will be removed in v8.\n */\nexport const animationFrame = animationFrameScheduler;\n", "import { Observable } from '../Observable';\nimport { SchedulerLike } from '../types';\n\n/**\n * A simple Observable that emits no items to the Observer and immediately\n * emits a complete notification.\n *\n * Just emits 'complete', and nothing else.\n *\n * ![](empty.png)\n *\n * A simple Observable that only emits the complete notification. It can be used\n * for composing with other Observables, such as in a {@link mergeMap}.\n *\n * ## Examples\n *\n * Log complete notification\n *\n * ```ts\n * import { EMPTY } from 'rxjs';\n *\n * EMPTY.subscribe({\n * next: () => console.log('Next'),\n * complete: () => console.log('Complete!')\n * });\n *\n * // Outputs\n * // Complete!\n * ```\n *\n * Emit the number 7, then complete\n *\n * ```ts\n * import { EMPTY, startWith } from 'rxjs';\n *\n * const result = EMPTY.pipe(startWith(7));\n * result.subscribe(x => console.log(x));\n *\n * // Outputs\n * // 7\n * ```\n *\n * Map and flatten only odd numbers to the sequence `'a'`, `'b'`, `'c'`\n *\n * ```ts\n * import { interval, mergeMap, of, EMPTY } from 'rxjs';\n *\n * const interval$ = interval(1000);\n * const result = interval$.pipe(\n * mergeMap(x => x % 2 === 1 ? 
of('a', 'b', 'c') : EMPTY),\n * );\n * result.subscribe(x => console.log(x));\n *\n * // Results in the following to the console:\n * // x is equal to the count on the interval, e.g. (0, 1, 2, 3, ...)\n * // x will occur every 1000ms\n * // if x % 2 is equal to 1, print a, b, c (each on its own)\n * // if x % 2 is not equal to 1, nothing will be output\n * ```\n *\n * @see {@link Observable}\n * @see {@link NEVER}\n * @see {@link of}\n * @see {@link throwError}\n */\nexport const EMPTY = new Observable((subscriber) => subscriber.complete());\n\n/**\n * @param scheduler A {@link SchedulerLike} to use for scheduling\n * the emission of the complete notification.\n * @deprecated Replaced with the {@link EMPTY} constant or {@link scheduled} (e.g. `scheduled([], scheduler)`). Will be removed in v8.\n */\nexport function empty(scheduler?: SchedulerLike) {\n return scheduler ? emptyScheduled(scheduler) : EMPTY;\n}\n\nfunction emptyScheduled(scheduler: SchedulerLike) {\n return new Observable((subscriber) => scheduler.schedule(() => subscriber.complete()));\n}\n", "import { SchedulerLike } from '../types';\nimport { isFunction } from './isFunction';\n\nexport function isScheduler(value: any): value is SchedulerLike {\n return value && isFunction(value.schedule);\n}\n", "import { SchedulerLike } from '../types';\nimport { isFunction } from './isFunction';\nimport { isScheduler } from './isScheduler';\n\nfunction last(arr: T[]): T | undefined {\n return arr[arr.length - 1];\n}\n\nexport function popResultSelector(args: any[]): ((...args: unknown[]) => unknown) | undefined {\n return isFunction(last(args)) ? args.pop() : undefined;\n}\n\nexport function popScheduler(args: any[]): SchedulerLike | undefined {\n return isScheduler(last(args)) ? args.pop() : undefined;\n}\n\nexport function popNumber(args: any[], defaultValue: number): number {\n return typeof last(args) === 'number' ? args.pop()! 
: defaultValue;\n}\n", "export const isArrayLike = ((x: any): x is ArrayLike => x && typeof x.length === 'number' && typeof x !== 'function');", "import { isFunction } from \"./isFunction\";\n\n/**\n * Tests to see if the object is \"thennable\".\n * @param value the object to test\n */\nexport function isPromise(value: any): value is PromiseLike {\n return isFunction(value?.then);\n}\n", "import { InteropObservable } from '../types';\nimport { observable as Symbol_observable } from '../symbol/observable';\nimport { isFunction } from './isFunction';\n\n/** Identifies an input as being Observable (but not necessary an Rx Observable) */\nexport function isInteropObservable(input: any): input is InteropObservable {\n return isFunction(input[Symbol_observable]);\n}\n", "import { isFunction } from './isFunction';\n\nexport function isAsyncIterable(obj: any): obj is AsyncIterable {\n return Symbol.asyncIterator && isFunction(obj?.[Symbol.asyncIterator]);\n}\n", "/**\n * Creates the TypeError to throw if an invalid object is passed to `from` or `scheduled`.\n * @param input The object that was passed.\n */\nexport function createInvalidObservableTypeError(input: any) {\n // TODO: We should create error codes that can be looked up, so this can be less verbose.\n return new TypeError(\n `You provided ${\n input !== null && typeof input === 'object' ? 'an invalid object' : `'${input}'`\n } where a stream was expected. 
You can provide an Observable, Promise, ReadableStream, Array, AsyncIterable, or Iterable.`\n );\n}\n", "export function getSymbolIterator(): symbol {\n if (typeof Symbol !== 'function' || !Symbol.iterator) {\n return '@@iterator' as any;\n }\n\n return Symbol.iterator;\n}\n\nexport const iterator = getSymbolIterator();\n", "import { iterator as Symbol_iterator } from '../symbol/iterator';\nimport { isFunction } from './isFunction';\n\n/** Identifies an input as being an Iterable */\nexport function isIterable(input: any): input is Iterable {\n return isFunction(input?.[Symbol_iterator]);\n}\n", "import { ReadableStreamLike } from '../types';\nimport { isFunction } from './isFunction';\n\nexport async function* readableStreamLikeToAsyncGenerator(readableStream: ReadableStreamLike): AsyncGenerator {\n const reader = readableStream.getReader();\n try {\n while (true) {\n const { value, done } = await reader.read();\n if (done) {\n return;\n }\n yield value!;\n }\n } finally {\n reader.releaseLock();\n }\n}\n\nexport function isReadableStreamLike(obj: any): obj is ReadableStreamLike {\n // We don't want to use instanceof checks because they would return\n // false for instances from another Realm, like an ' ) + } + else if ( linkText.match( /vimeo/ ) ) { + let vimeoID = replace.split( '/' ).slice(-1)[0]; + aLink.push( '
' ) + } + else { + aLink.push( '
' + linkText + '' ); + } + text = text.split( linksFound[i] ).map(item => { return aLink[i].includes('iframe') ? item.trim() : item } ).join( aLink[i] ); + } + return text; + + } + else { + return input; + } + } \ No newline at end of file diff --git a/docs/js/katex.js b/docs/js/katex.js new file mode 100644 index 00000000..841e35ad --- /dev/null +++ b/docs/js/katex.js @@ -0,0 +1,10 @@ +document$.subscribe(({ body }) => { + renderMathInElement(body, { + delimiters: [ + { left: "$$", right: "$$", display: true }, + { left: "$", right: "$", display: false }, + { left: "\\(", right: "\\)", display: false }, + { left: "\\[", right: "\\]", display: true } + ], + }) +}) \ No newline at end of file diff --git a/docs/js/tsparticles.js b/docs/js/tsparticles.js new file mode 100644 index 00000000..bf96e09b --- /dev/null +++ b/docs/js/tsparticles.js @@ -0,0 +1,2 @@ +/*! For license information please see tsparticles.bundle.min.js.LICENSE.txt */ +!function(t,e){if("object"==typeof exports&&"object"==typeof module)module.exports=e();else if("function"==typeof define&&define.amd)define([],e);else{var i=e();for(var s in i)("object"==typeof exports?exports:t)[s]=i[s]}}(this,(()=>(()=>{"use strict";var t={d:(e,i)=>{for(var s in i)t.o(i,s)&&!t.o(e,s)&&Object.defineProperty(e,s,{enumerable:!0,get:i[s]})},o:(t,e)=>Object.prototype.hasOwnProperty.call(t,e),r:t=>{"undefined"!=typeof 
Symbol&&Symbol.toStringTag&&Object.defineProperty(t,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(t,"__esModule",{value:!0})}},e={};t.r(e),t.d(e,{AnimatableColor:()=>Se,AnimationOptions:()=>Me,AnimationValueWithRandom:()=>Ee,Background:()=>le,BackgroundMask:()=>de,BackgroundMaskCover:()=>he,Circle:()=>yi,ClickEvent:()=>pe,Collisions:()=>Fe,CollisionsAbsorb:()=>De,CollisionsOverlap:()=>Te,ColorAnimation:()=>Pe,DivEvent:()=>fe,Events:()=>ge,ExternalInteractorBase:()=>Si,FullScreen:()=>ue,HoverEvent:()=>ye,HslAnimation:()=>Oe,HslColorManager:()=>Pi,Interactivity:()=>we,ManualParticle:()=>xe,Modes:()=>be,Move:()=>Xe,MoveAngle:()=>qe,MoveAttract:()=>He,MoveCenter:()=>Ve,MoveGravity:()=>Ue,MovePath:()=>We,MoveTrail:()=>je,Opacity:()=>Ze,OpacityAnimation:()=>Ye,Options:()=>li,OptionsColor:()=>ce,OutModes:()=>Ge,Parallax:()=>ve,ParticlesBounce:()=>Ae,ParticlesBounceFactor:()=>Le,ParticlesDensity:()=>Qe,ParticlesInteractorBase:()=>Di,ParticlesNumber:()=>Ke,ParticlesNumberLimit:()=>Je,ParticlesOptions:()=>ai,Point:()=>pi,Range:()=>fi,RangedAnimationOptions:()=>Ce,RangedAnimationValueWithRandom:()=>Ie,Rectangle:()=>vi,ResizeEvent:()=>me,Responsive:()=>_e,RgbColorManager:()=>Oi,Shadow:()=>ti,Shape:()=>ei,Size:()=>si,SizeAnimation:()=>ii,Spin:()=>Ne,Stroke:()=>oi,Theme:()=>ze,ThemeDefault:()=>ke,ValueWithRandom:()=>Re,Vector:()=>y,Vector3d:()=>v,ZIndex:()=>ni,addColorManager:()=>Pt,addEasing:()=>b,alterHsl:()=>se,areBoundsInside:()=>et,arrayRandomIndex:()=>J,calcExactPositionOrRandomFromSize:()=>B,calcExactPositionOrRandomFromSizeRanged:()=>q,calcPositionFromSize:()=>L,calcPositionOrRandomFromSize:()=>A,calcPositionOrRandomFromSizeRanged:()=>F,calculateBounds:()=>it,circleBounce:()=>lt,circleBounceDataFromParticle:()=>ct,clamp:()=>k,clear:()=>Zt,collisionVelocity:()=>I,colorMix:()=>Vt,colorToHsl:()=>Tt,colorToRgb:()=>Dt,deepExtend:()=>st,divMode:()=>rt,divModeExecute:()=>nt,drawEffect:()=>Jt,drawLine:()=>Nt,drawParticle:()=>Qt,drawParticlePlugin:()=>ie,drawPlugin:()
=>ee,drawShape:()=>Kt,drawShapeAfterDraw:()=>te,errorPrefix:()=>f,executeOnSingleOrMultiple:()=>dt,findItemFromSingleOrMultiple:()=>pt,generatedAttribute:()=>i,getDistance:()=>T,getDistances:()=>D,getEasing:()=>w,getHslAnimationFromHsl:()=>jt,getHslFromAnimation:()=>$t,getLinkColor:()=>Ut,getLinkRandomColor:()=>Wt,getLogger:()=>W,getParticleBaseVelocity:()=>E,getParticleDirectionAngle:()=>R,getPosition:()=>yt,getRandom:()=>_,getRandomRgbColor:()=>Bt,getRangeMax:()=>O,getRangeMin:()=>P,getRangeValue:()=>C,getSize:()=>mt,getStyleFromHsl:()=>Ht,getStyleFromRgb:()=>qt,hasMatchMedia:()=>G,hslToRgb:()=>At,hslaToRgba:()=>Ft,initParticleNumericAnimationValue:()=>ft,isArray:()=>kt,isBoolean:()=>gt,isDivModeEnabled:()=>ot,isFunction:()=>xt,isInArray:()=>Z,isNumber:()=>wt,isObject:()=>_t,isPointInside:()=>tt,isSsr:()=>j,isString:()=>bt,itemFromArray:()=>K,itemFromSingleOrMultiple:()=>ut,loadFont:()=>Q,loadFull:()=>gn,loadOptions:()=>ri,loadParticlesOptions:()=>ci,loadSlim:()=>an,mix:()=>z,mouseDownEvent:()=>s,mouseLeaveEvent:()=>n,mouseMoveEvent:()=>r,mouseOutEvent:()=>a,mouseUpEvent:()=>o,paintBase:()=>Xt,paintImage:()=>Yt,parseAlpha:()=>H,randomInRange:()=>M,rangeColorToHsl:()=>Rt,rangeColorToRgb:()=>St,rectBounce:()=>ht,resizeEvent:()=>u,rgbToHsl:()=>Et,safeIntersectionObserver:()=>X,safeMatchMedia:()=>N,safeMutationObserver:()=>Y,setLogger:()=>U,setRandom:()=>x,setRangeValue:()=>S,singleDivModeExecute:()=>at,stringToAlpha:()=>It,stringToRgb:()=>Lt,touchCancelEvent:()=>d,touchEndEvent:()=>l,touchMoveEvent:()=>h,touchStartEvent:()=>c,tsParticles:()=>Ti,visibilityChangeEvent:()=>p});const i="generated",s="pointerdown",o="pointerup",n="pointerleave",a="pointerout",r="pointermove",c="touchstart",l="touchend",h="touchmove",d="touchcancel",u="resize",p="visibilitychange",f="tsParticles - Error";class v{constructor(t,e,i){if(this._updateFromAngle=(t,e)=>{this.x=Math.cos(t)*e,this.y=Math.sin(t)*e},!wt(t)&&t){this.x=t.x,this.y=t.y;const e=t;this.z=e.z?e.z:0}else{if(void 0===t||void 
0===e)throw new Error(`${f} Vector3d not initialized correctly`);this.x=t,this.y=e,this.z=i??0}}static get origin(){return v.create(0,0,0)}get angle(){return Math.atan2(this.y,this.x)}set angle(t){this._updateFromAngle(t,this.length)}get length(){return Math.sqrt(this.getLengthSq())}set length(t){this._updateFromAngle(this.angle,t)}static clone(t){return v.create(t.x,t.y,t.z)}static create(t,e,i){return new v(t,e,i)}add(t){return v.create(this.x+t.x,this.y+t.y,this.z+t.z)}addTo(t){this.x+=t.x,this.y+=t.y,this.z+=t.z}copy(){return v.clone(this)}distanceTo(t){return this.sub(t).length}distanceToSq(t){return this.sub(t).getLengthSq()}div(t){return v.create(this.x/t,this.y/t,this.z/t)}divTo(t){this.x/=t,this.y/=t,this.z/=t}getLengthSq(){return this.x**2+this.y**2}mult(t){return v.create(this.x*t,this.y*t,this.z*t)}multTo(t){this.x*=t,this.y*=t,this.z*=t}normalize(){const t=this.length;0!=t&&this.multTo(1/t)}rotate(t){return v.create(this.x*Math.cos(t)-this.y*Math.sin(t),this.x*Math.sin(t)+this.y*Math.cos(t),0)}setTo(t){this.x=t.x,this.y=t.y;const e=t;this.z=e.z?e.z:0}sub(t){return v.create(this.x-t.x,this.y-t.y,this.z-t.z)}subFrom(t){this.x-=t.x,this.y-=t.y,this.z-=t.z}}class y extends v{constructor(t,e){super(t,e,0)}static get origin(){return y.create(0,0)}static clone(t){return y.create(t.x,t.y)}static create(t,e){return new y(t,e)}}let m=Math.random;const g=new Map;function b(t,e){g.get(t)||g.set(t,e)}function w(t){return g.get(t)||(t=>t)}function x(t=Math.random){m=t}function _(){return k(m(),0,1-1e-16)}function k(t,e,i){return Math.min(Math.max(t,e),i)}function z(t,e,i,s){return Math.floor((t*i+e*s)/(i+s))}function M(t){const e=O(t);let i=P(t);return e===i&&(i=0),_()*(e-i)+i}function C(t){return wt(t)?t:M(t)}function P(t){return wt(t)?t:t.min}function O(t){return wt(t)?t:t.max}function S(t,e){if(t===e||void 0===e&&wt(t))return t;const i=P(t),s=O(t);return void 0!==e?{min:Math.min(i,e),max:Math.max(s,e)}:S(i,s)}function D(t,e){const 
i=t.x-e.x,s=t.y-e.y;return{dx:i,dy:s,distance:Math.sqrt(i**2+s**2)}}function T(t,e){return D(t,e).distance}function R(t,e,i){if(wt(t))return t*Math.PI/180;switch(t){case"top":return.5*-Math.PI;case"top-right":return.25*-Math.PI;case"right":return 0;case"bottom-right":return.25*Math.PI;case"bottom":return.5*Math.PI;case"bottom-left":return.75*Math.PI;case"left":return Math.PI;case"top-left":return.75*-Math.PI;case"inside":return Math.atan2(i.y-e.y,i.x-e.x);case"outside":return Math.atan2(e.y-i.y,e.x-i.x);default:return _()*Math.PI*2}}function E(t){const e=y.origin;return e.length=1,e.angle=t,e}function I(t,e,i,s){return y.create(t.x*(i-s)/(i+s)+2*e.x*s/(i+s),t.y)}function L(t){return t.position&&void 0!==t.position.x&&void 0!==t.position.y?{x:t.position.x*t.size.width/100,y:t.position.y*t.size.height/100}:void 0}function A(t){return{x:(t.position?.x??100*_())*t.size.width/100,y:(t.position?.y??100*_())*t.size.height/100}}function F(t){const e={x:void 0!==t.position?.x?C(t.position.x):void 0,y:void 0!==t.position?.y?C(t.position.y):void 0};return A({size:t.size,position:e})}function B(t){return{x:t.position?.x??_()*t.size.width,y:t.position?.y??_()*t.size.height}}function q(t){const e={x:void 0!==t.position?.x?C(t.position.x):void 0,y:void 0!==t.position?.y?C(t.position.y):void 0};return B({size:t.size,position:e})}function H(t){return t?t.endsWith("%")?parseFloat(t)/100:parseFloat(t):1}const V={debug:console.debug,error:console.error,info:console.info,log:console.log,verbose:console.log,warning:console.warn};function U(t){V.debug=t.debug||V.debug,V.error=t.error||V.error,V.info=t.info||V.info,V.log=t.log||V.log,V.verbose=t.verbose||V.verbose,V.warning=t.warning||V.warning}function W(){return V}function $(t){const e={bounced:!1},{pSide:i,pOtherSide:s,rectSide:o,rectOtherSide:n,velocity:a,factor:r}=t;return s.minn.max||s.maxn.max||(i.max>=o.min&&i.max<=.5*(o.max+o.min)&&a>0||i.min<=o.max&&i.min>.5*(o.max+o.min)&&a<0)&&(e.velocity=a*-r,e.bounced=!0),e}function 
j(){return"undefined"==typeof window||!window||void 0===window.document||!window.document}function G(){return!j()&&"undefined"!=typeof matchMedia}function N(t){if(G())return matchMedia(t)}function X(t){if(!j()&&"undefined"!=typeof IntersectionObserver)return new IntersectionObserver(t)}function Y(t){if(!j()&&"undefined"!=typeof MutationObserver)return new MutationObserver(t)}function Z(t,e){return t===e||kt(e)&&e.indexOf(t)>-1}async function Q(t,e){try{await document.fonts.load(`${e??"400"} 36px '${t??"Verdana"}'`)}catch{}}function J(t){return Math.floor(_()*t.length)}function K(t,e,i=!0){return t[void 0!==e&&i?e%t.length:J(t)]}function tt(t,e,i,s,o){return et(it(t,s??0),e,i,o)}function et(t,e,i,s){let o=!0;return s&&"bottom"!==s||(o=t.topi.x),!o||s&&"right"!==s||(o=t.lefti.y),o}function it(t,e){return{bottom:t.y+e,left:t.x-e,right:t.x+e,top:t.y-e}}function st(t,...e){for(const i of e){if(null==i)continue;if(!_t(i)){t=i;continue}const e=Array.isArray(i);!e||!_t(t)&&t&&Array.isArray(t)?e||!_t(t)&&t&&!Array.isArray(t)||(t={}):t=[];for(const e in i){if("__proto__"===e)continue;const s=i[e],o=t;o[e]=_t(s)&&Array.isArray(s)?s.map((t=>st(o[e],t))):st(o[e],s)}}return t}function ot(t,e){return!!pt(e,(e=>e.enable&&Z(t,e.mode)))}function nt(t,e,i){dt(e,(e=>{const s=e.mode;e.enable&&Z(t,s)&&at(e,i)}))}function at(t,e){dt(t.selectors,(i=>{e(i,t)}))}function rt(t,e){if(e&&t)return pt(t,(t=>function(t,e){const i=dt(e,(e=>t.matches(e)));return kt(i)?i.some((t=>t)):i}(e,t.selectors)))}function ct(t){return{position:t.getPosition(),radius:t.getRadius(),mass:t.getMass(),velocity:t.velocity,factor:y.create(C(t.options.bounce.horizontal.value),C(t.options.bounce.vertical.value))}}function lt(t,e){const{x:i,y:s}=t.velocity.sub(e.velocity),[o,n]=[t.position,e.position],{dx:a,dy:r}=D(n,o);if(i*a+s*r<0)return;const 
c=-Math.atan2(r,a),l=t.mass,h=e.mass,d=t.velocity.rotate(c),u=e.velocity.rotate(c),p=I(d,u,l,h),f=I(u,d,l,h),v=p.rotate(-c),y=f.rotate(-c);t.velocity.x=v.x*t.factor.x,t.velocity.y=v.y*t.factor.y,e.velocity.x=y.x*e.factor.x,e.velocity.y=y.y*e.factor.y}function ht(t,e){const i=it(t.getPosition(),t.getRadius()),s=t.options.bounce,o=$({pSide:{min:i.left,max:i.right},pOtherSide:{min:i.top,max:i.bottom},rectSide:{min:e.left,max:e.right},rectOtherSide:{min:e.top,max:e.bottom},velocity:t.velocity.x,factor:C(s.horizontal.value)});o.bounced&&(void 0!==o.velocity&&(t.velocity.x=o.velocity),void 0!==o.position&&(t.position.x=o.position));const n=$({pSide:{min:i.top,max:i.bottom},pOtherSide:{min:i.left,max:i.right},rectSide:{min:e.top,max:e.bottom},rectOtherSide:{min:e.left,max:e.right},velocity:t.velocity.y,factor:C(s.vertical.value)});n.bounced&&(void 0!==n.velocity&&(t.velocity.y=n.velocity),void 0!==n.position&&(t.position.y=n.position))}function dt(t,e){return kt(t)?t.map(((t,i)=>e(t,i))):e(t,0)}function ut(t,e,i){return kt(t)?K(t,e,i):t}function pt(t,e){return kt(t)?t.find(((t,i)=>e(t,i))):e(t,0)?t:void 0}function ft(t,e){const i=t.value,s=t.animation,o={delayTime:1e3*C(s.delay),enable:s.enable,value:C(t.value)*e,max:O(i)*e,min:P(i)*e,loops:0,maxLoops:C(s.count),time:0};if(s.enable){switch(o.decay=1-C(s.decay),s.mode){case"increase":o.status="increasing";break;case"decrease":o.status="decreasing";break;case"random":o.status=_()>=.5?"increasing":"decreasing"}const t="auto"===s.mode;switch(s.startValue){case"min":o.value=o.min,t&&(o.status="increasing");break;case"max":o.value=o.max,t&&(o.status="decreasing");break;default:o.value=M(o),t&&(o.status=_()>=.5?"increasing":"decreasing")}}return o.initialValue=o.value,o}function vt(t,e){if(!("percent"===t.mode)){const{mode:e,...i}=t;return i}return"x"in t?{x:t.x/100*e.width,y:t.y/100*e.height}:{width:t.width/100*e.width,height:t.height/100*e.height}}function yt(t,e){return vt(t,e)}function mt(t,e){return vt(t,e)}function 
gt(t){return"boolean"==typeof t}function bt(t){return"string"==typeof t}function wt(t){return"number"==typeof t}function xt(t){return"function"==typeof t}function _t(t){return"object"==typeof t&&null!==t}function kt(t){return Array.isArray(t)}const zt="random",Mt="mid",Ct=new Map;function Pt(t){Ct.set(t.key,t)}function Ot(t){for(const[,e]of Ct)if(t.startsWith(e.stringPrefix))return e.parseString(t);const e=t.replace(/^#?([a-f\d])([a-f\d])([a-f\d])([a-f\d])?$/i,((t,e,i,s,o)=>e+e+i+i+s+s+(void 0!==o?o+o:""))),i=/^#?([a-f\d]{2})([a-f\d]{2})([a-f\d]{2})([a-f\d]{2})?$/i.exec(e);return i?{a:void 0!==i[4]?parseInt(i[4],16)/255:1,b:parseInt(i[3],16),g:parseInt(i[2],16),r:parseInt(i[1],16)}:void 0}function St(t,e,i=!0){if(!t)return;const s=bt(t)?{value:t}:t;if(bt(s.value))return Dt(s.value,e,i);if(kt(s.value))return St({value:K(s.value,e,i)});for(const[,t]of Ct){const e=t.handleRangeColor(s);if(e)return e}}function Dt(t,e,i=!0){if(!t)return;const s=bt(t)?{value:t}:t;if(bt(s.value))return s.value===zt?Bt():Lt(s.value);if(kt(s.value))return Dt({value:K(s.value,e,i)});for(const[,t]of Ct){const e=t.handleColor(s);if(e)return e}}function Tt(t,e,i=!0){const s=Dt(t,e,i);return s?Et(s):void 0}function Rt(t,e,i=!0){const s=St(t,e,i);return s?Et(s):void 0}function Et(t){const e=t.r/255,i=t.g/255,s=t.b/255,o=Math.max(e,i,s),n=Math.min(e,i,s),a={h:0,l:.5*(o+n),s:0};return o!==n&&(a.s=a.l<.5?(o-n)/(o+n):(o-n)/(2-o-n),a.h=e===o?(i-s)/(o-n):a.h=i===o?2+(s-e)/(o-n):4+(e-i)/(o-n)),a.l*=100,a.s*=100,a.h*=60,a.h<0&&(a.h+=360),a.h>=360&&(a.h-=360),a}function It(t){return Ot(t)?.a}function Lt(t){return Ot(t)}function At(t){const e=(t.h%360+360)%360,i=Math.max(0,Math.min(100,t.s)),s=e/360,o=i/100,n=Math.max(0,Math.min(100,t.l))/100;if(0===i){const t=Math.round(255*n);return{r:t,g:t,b:t}}const 
a=(t,e,i)=>(i<0&&(i+=1),i>1&&(i-=1),6*i<1?t+6*(e-t)*i:2*i<1?e:3*i<2?t+(e-t)*(2/3-i)*6:t),r=n<.5?n*(1+o):n+o-n*o,c=2*n-r,l=Math.min(255,255*a(c,r,s+1/3)),h=Math.min(255,255*a(c,r,s)),d=Math.min(255,255*a(c,r,s-1/3));return{r:Math.round(l),g:Math.round(h),b:Math.round(d)}}function Ft(t){const e=At(t);return{a:t.a,b:e.b,g:e.g,r:e.r}}function Bt(t){const e=t??0;return{b:Math.floor(M(S(e,256))),g:Math.floor(M(S(e,256))),r:Math.floor(M(S(e,256)))}}function qt(t,e){return`rgba(${t.r}, ${t.g}, ${t.b}, ${e??1})`}function Ht(t,e){return`hsla(${t.h}, ${t.s}%, ${t.l}%, ${e??1})`}function Vt(t,e,i,s){let o=t,n=e;return void 0===o.r&&(o=At(t)),void 0===n.r&&(n=At(e)),{b:z(o.b,n.b,i,s),g:z(o.g,n.g,i,s),r:z(o.r,n.r,i,s)}}function Ut(t,e,i){if(i===zt)return Bt();if(i!==Mt)return i;{const i=t.getFillColor()??t.getStrokeColor(),s=e?.getFillColor()??e?.getStrokeColor();if(i&&s&&e)return Vt(i,s,t.getRadius(),e.getRadius());{const t=i??s;if(t)return At(t)}}}function Wt(t,e,i){const s=bt(t)?t:t.value;return s===zt?i?St({value:s}):e?zt:Mt:s===Mt?Mt:St({value:s})}function $t(t){return void 0!==t?{h:t.h.value,s:t.s.value,l:t.l.value}:void 0}function jt(t,e,i){const s={h:{enable:!1,value:t.h},s:{enable:!1,value:t.s},l:{enable:!1,value:t.l}};return e&&(Gt(s.h,e.h,i),Gt(s.s,e.s,i),Gt(s.l,e.l,i)),s}function Gt(t,e,i){t.enable=e.enable,t.enable?(t.velocity=C(e.speed)/100*i,t.decay=1-C(e.decay),t.status="increasing",t.loops=0,t.maxLoops=C(e.count),t.time=0,t.delayTime=1e3*C(e.delay),e.sync||(t.velocity*=_(),t.value*=_()),t.initialValue=t.value):t.velocity=0}function Nt(t,e,i){t.beginPath(),t.moveTo(e.x,e.y),t.lineTo(i.x,i.y),t.closePath()}function Xt(t,e,i){t.fillStyle=i??"rgba(0,0,0,0)",t.fillRect(0,0,e.width,e.height)}function Yt(t,e,i,s){i&&(t.globalAlpha=s,t.drawImage(i,0,0,e.width,e.height),t.globalAlpha=1)}function Zt(t,e){t.clearRect(0,0,e.width,e.height)}function 
Qt(t){const{container:e,context:i,particle:s,delta:o,colorStyles:n,backgroundMask:a,composite:r,radius:c,opacity:l,shadow:h,transform:d}=t,u=s.getPosition(),p=s.rotation+(s.pathRotation?s.velocity.angle:0),f=Math.sin(p),v=Math.cos(p),y={a:v*(d.a??1),b:f*(d.b??1),c:-f*(d.c??1),d:v*(d.d??1)};i.setTransform(y.a,y.b,y.c,y.d,u.x,u.y),a&&(i.globalCompositeOperation=r);const m=s.shadowColor;h.enable&&m&&(i.shadowBlur=h.blur,i.shadowColor=qt(m),i.shadowOffsetX=h.offset.x,i.shadowOffsetY=h.offset.y),n.fill&&(i.fillStyle=n.fill);const g=s.strokeWidth??0;i.lineWidth=g,n.stroke&&(i.strokeStyle=n.stroke);const b={container:e,context:i,particle:s,radius:c,opacity:l,delta:o,transformData:y};i.beginPath(),Kt(b),s.shapeClose&&i.closePath(),g>0&&i.stroke(),s.shapeFill&&i.fill(),te(b),Jt(b),i.globalCompositeOperation="source-over",i.setTransform(1,0,0,1,0,0)}function Jt(t){const{container:e,context:i,particle:s,radius:o,opacity:n,delta:a,transformData:r}=t;if(!s.effect)return;const c=e.effectDrawers.get(s.effect);c&&c.draw({context:i,particle:s,radius:o,opacity:n,delta:a,pixelRatio:e.retina.pixelRatio,transformData:{...r}})}function Kt(t){const{container:e,context:i,particle:s,radius:o,opacity:n,delta:a,transformData:r}=t;if(!s.shape)return;const c=e.shapeDrawers.get(s.shape);c&&c.draw({context:i,particle:s,radius:o,opacity:n,delta:a,pixelRatio:e.retina.pixelRatio,transformData:{...r}})}function te(t){const{container:e,context:i,particle:s,radius:o,opacity:n,delta:a,transformData:r}=t;if(!s.shape)return;const c=e.shapeDrawers.get(s.shape);c&&c.afterDraw&&c.afterDraw({context:i,particle:s,radius:o,opacity:n,delta:a,pixelRatio:e.retina.pixelRatio,transformData:{...r}})}function ee(t,e,i){e.draw&&e.draw(t,i)}function ie(t,e,i,s){e.drawParticle&&e.drawParticle(t,i,s)}function se(t,e,i){return{h:t.h,s:t.s,l:t.l+("darken"===e?-1:1)*i}}function oe(t,e,i){const s=e[i];void 0!==s&&(t[i]=(t[i]??1)*s)}class ne{constructor(t){this.container=t,this._applyPostDrawUpdaters=t=>{for(const e of 
this._postDrawUpdaters)e.afterDraw&&e.afterDraw(t)},this._applyPreDrawUpdaters=(t,e,i,s,o,n)=>{for(const a of this._preDrawUpdaters){if(a.getColorStyles){const{fill:n,stroke:r}=a.getColorStyles(e,t,i,s);n&&(o.fill=n),r&&(o.stroke=r)}if(a.getTransformValues){const t=a.getTransformValues(e);for(const e in t)oe(n,t,e)}a.beforeDraw&&a.beforeDraw(e)}},this._applyResizePlugins=()=>{for(const t of this._resizePlugins)t.resize&&t.resize()},this._getPluginParticleColors=t=>{let e,i;for(const s of this._colorPlugins)if(!e&&s.particleFillColor&&(e=Rt(s.particleFillColor(t))),!i&&s.particleStrokeColor&&(i=Rt(s.particleStrokeColor(t))),e&&i)break;return[e,i]},this._initCover=()=>{const t=this.container.actualOptions.backgroundMask.cover,e=St(t.color);if(e){const i={...e,a:t.opacity};this._coverColorStyle=qt(i,i.a)}},this._initStyle=()=>{const t=this.element,e=this.container.actualOptions;if(t){this._fullScreen?(this._originalStyle=st({},t.style),this._setFullScreenStyle()):this._resetOriginalStyle();for(const i in e.style){if(!i||!e.style)continue;const s=e.style[i];s&&t.style.setProperty(i,s,"important")}}},this._initTrail=async()=>{const t=this.container.actualOptions,e=t.particles.move.trail,i=e.fill;if(e.enable)if(i.color){const e=St(i.color);if(!e)return;const s=t.particles.move.trail;this._trailFill={color:{...e},opacity:1/s.length}}else await new Promise(((t,s)=>{if(!i.image)return;const o=document.createElement("img");o.addEventListener("load",(()=>{this._trailFill={image:o,opacity:1/e.length},t()})),o.addEventListener("error",(t=>{s(t.error)})),o.src=i.image}))},this._paintBase=t=>{this.draw((e=>Xt(e,this.size,t)))},this._paintImage=(t,e)=>{this.draw((i=>Yt(i,this.size,t,e)))},this._repairStyle=()=>{const t=this.element;t&&(this._safeMutationObserver((t=>t.disconnect())),this._initStyle(),this.initBackground(),this._safeMutationObserver((e=>e.observe(t,{attributes:!0}))))},this._resetOriginalStyle=()=>{const t=this.element,e=this._originalStyle;if(!t||!e)return;const 
i=t.style;i.position=e.position,i.zIndex=e.zIndex,i.top=e.top,i.left=e.left,i.width=e.width,i.height=e.height},this._safeMutationObserver=t=>{this._mutationObserver&&t(this._mutationObserver)},this._setFullScreenStyle=()=>{const t=this.element;if(!t)return;const e="important",i=t.style;i.setProperty("position","fixed",e),i.setProperty("z-index",this.container.actualOptions.fullScreen.zIndex.toString(10),e),i.setProperty("top","0",e),i.setProperty("left","0",e),i.setProperty("width","100%",e),i.setProperty("height","100%",e)},this.size={height:0,width:0},this._context=null,this._generated=!1,this._preDrawUpdaters=[],this._postDrawUpdaters=[],this._resizePlugins=[],this._colorPlugins=[]}get _fullScreen(){return this.container.actualOptions.fullScreen.enable}clear(){const t=this.container.actualOptions,e=t.particles.move.trail,i=this._trailFill;t.backgroundMask.enable?this.paint():e.enable&&e.length>0&&i?i.color?this._paintBase(qt(i.color,i.opacity)):i.image&&this._paintImage(i.image,i.opacity):t.clear&&this.draw((t=>{Zt(t,this.size)}))}destroy(){if(this.stop(),this._generated){const t=this.element;t&&t.remove()}else this._resetOriginalStyle();this._preDrawUpdaters=[],this._postDrawUpdaters=[],this._resizePlugins=[],this._colorPlugins=[]}draw(t){const e=this._context;if(e)return t(e)}drawParticle(t,e){if(t.spawning||t.destroyed)return;const i=t.getRadius();if(i<=0)return;const s=t.getFillColor(),o=t.getStrokeColor()??s;let[n,a]=this._getPluginParticleColors(t);n||(n=s),a||(a=o),(n||a)&&this.draw((s=>{const o=this.container,r=o.actualOptions,c=t.options.zIndex,l=(1-t.zIndexFactor)**c.opacityRate,h=t.bubble.opacity??t.opacity?.value??1,d=h*l,u=(t.strokeOpacity??h)*l,p={},f={fill:n?Ht(n,d):void 
0};f.stroke=a?Ht(a,u):f.fill,this._applyPreDrawUpdaters(s,t,i,d,f,p),Qt({container:o,context:s,particle:t,delta:e,colorStyles:f,backgroundMask:r.backgroundMask.enable,composite:r.backgroundMask.composite,radius:i*(1-t.zIndexFactor)**c.sizeRate,opacity:d,shadow:t.options.shadow,transform:p}),this._applyPostDrawUpdaters(t)}))}drawParticlePlugin(t,e,i){this.draw((s=>ie(s,t,e,i)))}drawPlugin(t,e){this.draw((i=>ee(i,t,e)))}async init(){this._safeMutationObserver((t=>t.disconnect())),this._mutationObserver=Y((t=>{for(const e of t)"attributes"===e.type&&"style"===e.attributeName&&this._repairStyle()})),this.resize(),this._initStyle(),this._initCover();try{await this._initTrail()}catch(t){W().error(t)}this.initBackground(),this._safeMutationObserver((t=>{this.element&&t.observe(this.element,{attributes:!0})})),this.initUpdaters(),this.initPlugins(),this.paint()}initBackground(){const t=this.container.actualOptions.background,e=this.element;if(!e)return;const i=e.style;if(i){if(t.color){const e=St(t.color);i.backgroundColor=e?qt(e,t.opacity):""}else i.backgroundColor="";i.backgroundImage=t.image||"",i.backgroundPosition=t.position||"",i.backgroundRepeat=t.repeat||"",i.backgroundSize=t.size||""}}initPlugins(){this._resizePlugins=[];for(const[,t]of this.container.plugins)t.resize&&this._resizePlugins.push(t),(t.particleFillColor||t.particleStrokeColor)&&this._colorPlugins.push(t)}initUpdaters(){this._preDrawUpdaters=[],this._postDrawUpdaters=[];for(const t of this.container.particles.updaters)t.afterDraw&&this._postDrawUpdaters.push(t),(t.getColorStyles||t.getTransformValues||t.beforeDraw)&&this._preDrawUpdaters.push(t)}loadCanvas(t){this._generated&&this.element&&this.element.remove(),this._generated=t.dataset&&i in 
t.dataset?"true"===t.dataset[i]:this._generated,this.element=t,this.element.ariaHidden="true",this._originalStyle=st({},this.element.style),this.size.height=t.offsetHeight,this.size.width=t.offsetWidth,this._context=this.element.getContext("2d"),this._safeMutationObserver((t=>{this.element&&t.observe(this.element,{attributes:!0})})),this.container.retina.init(),this.initBackground()}paint(){const t=this.container.actualOptions;this.draw((e=>{t.backgroundMask.enable&&t.backgroundMask.cover?(Zt(e,this.size),this._paintBase(this._coverColorStyle)):this._paintBase()}))}resize(){if(!this.element)return!1;const t=this.container,e=t.retina.pixelRatio,i=t.canvas.size,s=this.element.offsetWidth*e,o=this.element.offsetHeight*e;if(o===i.height&&s===i.width&&o===this.element.height&&s===this.element.width)return!1;const n={...i};return this.element.width=i.width=this.element.offsetWidth*e,this.element.height=i.height=this.element.offsetHeight*e,this.container.started&&t.particles.setResizeFactor({width:i.width/n.width,height:i.height/n.height}),!0}stop(){this._safeMutationObserver((t=>t.disconnect())),this._mutationObserver=void 0,this.draw((t=>Zt(t,this.size)))}async windowResize(){if(!this.element||!this.resize())return;const t=this.container,e=t.updateActualOptions();t.particles.setDensity(),this._applyResizePlugins(),e&&await t.refresh()}}function ae(t,e,i,s,o){if(s){let s={passive:!0};gt(o)?s.capture=o:void 0!==o&&(s=o),t.addEventListener(e,i,s)}else{const s=o;t.removeEventListener(e,i,s)}}class re{constructor(t){this.container=t,this._doMouseTouchClick=t=>{const e=this.container,i=e.actualOptions;if(this._canPush){const t=e.interactivity.mouse,s=t.position;if(!s)return;t.clickPosition={...s},t.clickTime=(new Date).getTime();dt(i.interactivity.events.onClick.mode,(t=>this.container.handleClickMode(t)))}"touchend"===t.type&&setTimeout((()=>this._mouseTouchFinish()),500)},this._handleThemeChange=t=>{const 
e=t,i=this.container,s=i.options,o=s.defaultThemes,n=e.matches?o.dark:o.light,a=s.themes.find((t=>t.name===n));a&&a.default.auto&&i.loadTheme(n)},this._handleVisibilityChange=()=>{const t=this.container,e=t.actualOptions;this._mouseTouchFinish(),e.pauseOnBlur&&(document&&document.hidden?(t.pageHidden=!0,t.pause()):(t.pageHidden=!1,t.getAnimationStatus()?t.play(!0):t.draw(!0)))},this._handleWindowResize=async()=>{this._resizeTimeout&&(clearTimeout(this._resizeTimeout),delete this._resizeTimeout),this._resizeTimeout=setTimeout((async()=>{const t=this.container.canvas;t&&await t.windowResize()}),1e3*this.container.actualOptions.interactivity.events.resize.delay)},this._manageInteractivityListeners=(t,e)=>{const i=this._handlers,n=this.container,a=n.actualOptions,u=n.interactivity.element;if(!u)return;const p=u,f=n.canvas.element;f&&(f.style.pointerEvents=p===f?"initial":"none"),(a.interactivity.events.onHover.enable||a.interactivity.events.onClick.enable)&&(ae(u,r,i.mouseMove,e),ae(u,c,i.touchStart,e),ae(u,h,i.touchMove,e),a.interactivity.events.onClick.enable?(ae(u,l,i.touchEndClick,e),ae(u,o,i.mouseUp,e),ae(u,s,i.mouseDown,e)):ae(u,l,i.touchEnd,e),ae(u,t,i.mouseLeave,e),ae(u,d,i.touchCancel,e))},this._manageListeners=t=>{const e=this._handlers,i=this.container,s=i.actualOptions.interactivity.detectsOn,o=i.canvas.element;let r=n;"window"===s?(i.interactivity.element=window,r=a):i.interactivity.element="parent"===s&&o?o.parentElement??o.parentNode:o,this._manageMediaMatch(t),this._manageResize(t),this._manageInteractivityListeners(r,t),document&&ae(document,p,e.visibilityChange,t,!1)},this._manageMediaMatch=t=>{const e=this._handlers,i=N("(prefers-color-scheme: dark)");i&&(void 0===i.addEventListener?void 0!==i.addListener&&(t?i.addListener(e.oldThemeChange):i.removeListener(e.oldThemeChange)):ae(i,"change",e.themeChange,t))},this._manageResize=t=>{const e=this._handlers,i=this.container;if(!i.actualOptions.interactivity.events.resize)return;if("undefined"==typeof 
ResizeObserver)return void ae(window,u,e.resize,t);const s=i.canvas.element;this._resizeObserver&&!t?(s&&this._resizeObserver.unobserve(s),this._resizeObserver.disconnect(),delete this._resizeObserver):!this._resizeObserver&&t&&s&&(this._resizeObserver=new ResizeObserver((async t=>{t.find((t=>t.target===s))&&await this._handleWindowResize()})),this._resizeObserver.observe(s))},this._mouseDown=()=>{const{interactivity:t}=this.container;if(!t)return;const{mouse:e}=t;e.clicking=!0,e.downPosition=e.position},this._mouseTouchClick=t=>{const e=this.container,i=e.actualOptions,{mouse:s}=e.interactivity;s.inside=!0;let o=!1;const n=s.position;if(n&&i.interactivity.events.onClick.enable){for(const[,t]of e.plugins)if(t.clickPositionValid&&(o=t.clickPositionValid(n),o))break;o||this._doMouseTouchClick(t),s.clicking=!1}},this._mouseTouchFinish=()=>{const t=this.container.interactivity;if(!t)return;const e=t.mouse;delete e.position,delete e.clickPosition,delete e.downPosition,t.status=n,e.inside=!1,e.clicking=!1},this._mouseTouchMove=t=>{const e=this.container,i=e.actualOptions,s=e.interactivity,o=e.canvas.element;if(!s||!s.element)return;let n;if(s.mouse.inside=!0,t.type.startsWith("pointer")){this._canPush=!0;const e=t;if(s.element===window){if(o){const t=o.getBoundingClientRect();n={x:e.clientX-t.left,y:e.clientY-t.top}}}else if("parent"===i.interactivity.detectsOn){const t=e.target,i=e.currentTarget;if(t&&i&&o){const s=t.getBoundingClientRect(),a=i.getBoundingClientRect(),r=o.getBoundingClientRect();n={x:e.offsetX+2*s.left-(a.left+r.left),y:e.offsetY+2*s.top-(a.top+r.top)}}else n={x:e.offsetX??e.clientX,y:e.offsetY??e.clientY}}else e.target===o&&(n={x:e.offsetX??e.clientX,y:e.offsetY??e.clientY})}else if(this._canPush="touchmove"!==t.type,o){const e=t,i=e.touches[e.touches.length-1],s=o.getBoundingClientRect();n={x:i.clientX-(s.left??0),y:i.clientY-(s.top??0)}}const a=e.retina.pixelRatio;n&&(n.x*=a,n.y*=a),s.mouse.position=n,s.status=r},this._touchEnd=t=>{const 
e=t,i=Array.from(e.changedTouches);for(const t of i)this._touches.delete(t.identifier);this._mouseTouchFinish()},this._touchEndClick=t=>{const e=t,i=Array.from(e.changedTouches);for(const t of i)this._touches.delete(t.identifier);this._mouseTouchClick(t)},this._touchStart=t=>{const e=t,i=Array.from(e.changedTouches);for(const t of i)this._touches.set(t.identifier,performance.now());this._mouseTouchMove(t)},this._canPush=!0,this._touches=new Map,this._handlers={mouseDown:()=>this._mouseDown(),mouseLeave:()=>this._mouseTouchFinish(),mouseMove:t=>this._mouseTouchMove(t),mouseUp:t=>this._mouseTouchClick(t),touchStart:t=>this._touchStart(t),touchMove:t=>this._mouseTouchMove(t),touchEnd:t=>this._touchEnd(t),touchCancel:t=>this._touchEnd(t),touchEndClick:t=>this._touchEndClick(t),visibilityChange:()=>this._handleVisibilityChange(),themeChange:t=>this._handleThemeChange(t),oldThemeChange:t=>this._handleThemeChange(t),resize:()=>{this._handleWindowResize()}}}addListeners(){this._manageListeners(!0)}removeListeners(){this._manageListeners(!1)}}class ce{constructor(){this.value=""}static create(t,e){const i=new ce;return i.load(t),void 0!==e&&(bt(e)||kt(e)?i.load({value:e}):i.load(e)),i}load(t){void 0!==t?.value&&(this.value=t.value)}}class le{constructor(){this.color=new ce,this.color.value="",this.image="",this.position="",this.repeat="",this.size="",this.opacity=1}load(t){t&&(void 0!==t.color&&(this.color=ce.create(this.color,t.color)),void 0!==t.image&&(this.image=t.image),void 0!==t.position&&(this.position=t.position),void 0!==t.repeat&&(this.repeat=t.repeat),void 0!==t.size&&(this.size=t.size),void 0!==t.opacity&&(this.opacity=t.opacity))}}class he{constructor(){this.color=new ce,this.color.value="#fff",this.opacity=1}load(t){t&&(void 0!==t.color&&(this.color=ce.create(this.color,t.color)),void 0!==t.opacity&&(this.opacity=t.opacity))}}class de{constructor(){this.composite="destination-out",this.cover=new he,this.enable=!1}load(t){if(t){if(void 
0!==t.composite&&(this.composite=t.composite),void 0!==t.cover){const e=t.cover,i=bt(t.cover)?{color:t.cover}:t.cover;this.cover.load(void 0!==e.color?e:{color:i})}void 0!==t.enable&&(this.enable=t.enable)}}}class ue{constructor(){this.enable=!0,this.zIndex=0}load(t){t&&(void 0!==t.enable&&(this.enable=t.enable),void 0!==t.zIndex&&(this.zIndex=t.zIndex))}}class pe{constructor(){this.enable=!1,this.mode=[]}load(t){t&&(void 0!==t.enable&&(this.enable=t.enable),void 0!==t.mode&&(this.mode=t.mode))}}class fe{constructor(){this.selectors=[],this.enable=!1,this.mode=[],this.type="circle"}load(t){t&&(void 0!==t.selectors&&(this.selectors=t.selectors),void 0!==t.enable&&(this.enable=t.enable),void 0!==t.mode&&(this.mode=t.mode),void 0!==t.type&&(this.type=t.type))}}class ve{constructor(){this.enable=!1,this.force=2,this.smooth=10}load(t){t&&(void 0!==t.enable&&(this.enable=t.enable),void 0!==t.force&&(this.force=t.force),void 0!==t.smooth&&(this.smooth=t.smooth))}}class ye{constructor(){this.enable=!1,this.mode=[],this.parallax=new ve}load(t){t&&(void 0!==t.enable&&(this.enable=t.enable),void 0!==t.mode&&(this.mode=t.mode),this.parallax.load(t.parallax))}}class me{constructor(){this.delay=.5,this.enable=!0}load(t){void 0!==t&&(void 0!==t.delay&&(this.delay=t.delay),void 0!==t.enable&&(this.enable=t.enable))}}class ge{constructor(){this.onClick=new pe,this.onDiv=new fe,this.onHover=new ye,this.resize=new me}load(t){if(!t)return;this.onClick.load(t.onClick);const e=t.onDiv;void 0!==e&&(this.onDiv=dt(e,(t=>{const e=new fe;return e.load(t),e}))),this.onHover.load(t.onHover),this.resize.load(t.resize)}}class be{constructor(t,e){this._engine=t,this._container=e}load(t){if(!t)return;if(!this._container)return;const e=this._engine.interactors.get(this._container);if(e)for(const i of e)i.loadModeOptions&&i.loadModeOptions(this,t)}}class we{constructor(t,e){this.detectsOn="window",this.events=new ge,this.modes=new be(t,e)}load(t){if(!t)return;const e=t.detectsOn;void 
0!==e&&(this.detectsOn=e),this.events.load(t.events),this.modes.load(t.modes)}}class xe{load(t){t&&(t.position&&(this.position={x:t.position.x??50,y:t.position.y??50,mode:t.position.mode??"percent"}),t.options&&(this.options=st({},t.options)))}}class _e{constructor(){this.maxWidth=1/0,this.options={},this.mode="canvas"}load(t){t&&(void 0!==t.maxWidth&&(this.maxWidth=t.maxWidth),void 0!==t.mode&&("screen"===t.mode?this.mode="screen":this.mode="canvas"),void 0!==t.options&&(this.options=st({},t.options)))}}class ke{constructor(){this.auto=!1,this.mode="any",this.value=!1}load(t){t&&(void 0!==t.auto&&(this.auto=t.auto),void 0!==t.mode&&(this.mode=t.mode),void 0!==t.value&&(this.value=t.value))}}class ze{constructor(){this.name="",this.default=new ke}load(t){t&&(void 0!==t.name&&(this.name=t.name),this.default.load(t.default),void 0!==t.options&&(this.options=st({},t.options)))}}class Me{constructor(){this.count=0,this.enable=!1,this.speed=1,this.decay=0,this.delay=0,this.sync=!1}load(t){t&&(void 0!==t.count&&(this.count=S(t.count)),void 0!==t.enable&&(this.enable=t.enable),void 0!==t.speed&&(this.speed=S(t.speed)),void 0!==t.decay&&(this.decay=S(t.decay)),void 0!==t.delay&&(this.delay=S(t.delay)),void 0!==t.sync&&(this.sync=t.sync))}}class Ce extends Me{constructor(){super(),this.mode="auto",this.startValue="random"}load(t){super.load(t),t&&(void 0!==t.mode&&(this.mode=t.mode),void 0!==t.startValue&&(this.startValue=t.startValue))}}class Pe extends Me{constructor(){super(),this.offset=0,this.sync=!0}load(t){super.load(t),t&&void 0!==t.offset&&(this.offset=S(t.offset))}}class Oe{constructor(){this.h=new Pe,this.s=new Pe,this.l=new Pe}load(t){t&&(this.h.load(t.h),this.s.load(t.s),this.l.load(t.l))}}class Se extends ce{constructor(){super(),this.animation=new Oe}static create(t,e){const i=new Se;return i.load(t),void 0!==e&&(bt(e)||kt(e)?i.load({value:e}):i.load(e)),i}load(t){if(super.load(t),!t)return;const e=t.animation;void 0!==e&&(void 
0!==e.enable?this.animation.h.load(e):this.animation.load(t.animation))}}class De{constructor(){this.speed=2}load(t){t&&void 0!==t.speed&&(this.speed=t.speed)}}class Te{constructor(){this.enable=!0,this.retries=0}load(t){t&&(void 0!==t.enable&&(this.enable=t.enable),void 0!==t.retries&&(this.retries=t.retries))}}class Re{constructor(){this.value=0}load(t){t&&void 0!==t.value&&(this.value=S(t.value))}}class Ee extends Re{constructor(){super(),this.animation=new Me}load(t){if(super.load(t),!t)return;const e=t.animation;void 0!==e&&this.animation.load(e)}}class Ie extends Ee{constructor(){super(),this.animation=new Ce}load(t){super.load(t)}}class Le extends Re{constructor(){super(),this.value=1}}class Ae{constructor(){this.horizontal=new Le,this.vertical=new Le}load(t){t&&(this.horizontal.load(t.horizontal),this.vertical.load(t.vertical))}}class Fe{constructor(){this.absorb=new De,this.bounce=new Ae,this.enable=!1,this.maxSpeed=50,this.mode="bounce",this.overlap=new Te}load(t){t&&(this.absorb.load(t.absorb),this.bounce.load(t.bounce),void 0!==t.enable&&(this.enable=t.enable),void 0!==t.maxSpeed&&(this.maxSpeed=S(t.maxSpeed)),void 0!==t.mode&&(this.mode=t.mode),this.overlap.load(t.overlap))}}class Be{constructor(){this.close=!0,this.fill=!0,this.options={},this.type=[]}load(t){if(!t)return;const e=t.options;if(void 0!==e)for(const t in e){const i=e[t];i&&(this.options[t]=st(this.options[t]??{},i))}void 0!==t.close&&(this.close=t.close),void 0!==t.fill&&(this.fill=t.fill),void 0!==t.type&&(this.type=t.type)}}class qe{constructor(){this.offset=0,this.value=90}load(t){t&&(void 0!==t.offset&&(this.offset=S(t.offset)),void 0!==t.value&&(this.value=S(t.value)))}}class He{constructor(){this.distance=200,this.enable=!1,this.rotate={x:3e3,y:3e3}}load(t){if(t&&(void 0!==t.distance&&(this.distance=S(t.distance)),void 0!==t.enable&&(this.enable=t.enable),t.rotate)){const e=t.rotate.x;void 0!==e&&(this.rotate.x=e);const i=t.rotate.y;void 0!==i&&(this.rotate.y=i)}}}class 
Ve{constructor(){this.x=50,this.y=50,this.mode="percent",this.radius=0}load(t){t&&(void 0!==t.x&&(this.x=t.x),void 0!==t.y&&(this.y=t.y),void 0!==t.mode&&(this.mode=t.mode),void 0!==t.radius&&(this.radius=t.radius))}}class Ue{constructor(){this.acceleration=9.81,this.enable=!1,this.inverse=!1,this.maxSpeed=50}load(t){t&&(void 0!==t.acceleration&&(this.acceleration=S(t.acceleration)),void 0!==t.enable&&(this.enable=t.enable),void 0!==t.inverse&&(this.inverse=t.inverse),void 0!==t.maxSpeed&&(this.maxSpeed=S(t.maxSpeed)))}}class We{constructor(){this.clamp=!0,this.delay=new Re,this.enable=!1,this.options={}}load(t){t&&(void 0!==t.clamp&&(this.clamp=t.clamp),this.delay.load(t.delay),void 0!==t.enable&&(this.enable=t.enable),this.generator=t.generator,t.options&&(this.options=st(this.options,t.options)))}}class $e{load(t){t&&(void 0!==t.color&&(this.color=ce.create(this.color,t.color)),void 0!==t.image&&(this.image=t.image))}}class je{constructor(){this.enable=!1,this.length=10,this.fill=new $e}load(t){t&&(void 0!==t.enable&&(this.enable=t.enable),void 0!==t.fill&&this.fill.load(t.fill),void 0!==t.length&&(this.length=t.length))}}class Ge{constructor(){this.default="out"}load(t){t&&(void 0!==t.default&&(this.default=t.default),this.bottom=t.bottom??t.default,this.left=t.left??t.default,this.right=t.right??t.default,this.top=t.top??t.default)}}class Ne{constructor(){this.acceleration=0,this.enable=!1}load(t){t&&(void 0!==t.acceleration&&(this.acceleration=S(t.acceleration)),void 0!==t.enable&&(this.enable=t.enable),t.position&&(this.position=st({},t.position)))}}class Xe{constructor(){this.angle=new qe,this.attract=new He,this.center=new Ve,this.decay=0,this.distance={},this.direction="none",this.drift=0,this.enable=!1,this.gravity=new Ue,this.path=new We,this.outModes=new Ge,this.random=!1,this.size=!1,this.speed=2,this.spin=new Ne,this.straight=!1,this.trail=new 
je,this.vibrate=!1,this.warp=!1}load(t){if(!t)return;this.angle.load(wt(t.angle)?{value:t.angle}:t.angle),this.attract.load(t.attract),this.center.load(t.center),void 0!==t.decay&&(this.decay=S(t.decay)),void 0!==t.direction&&(this.direction=t.direction),void 0!==t.distance&&(this.distance=wt(t.distance)?{horizontal:t.distance,vertical:t.distance}:{...t.distance}),void 0!==t.drift&&(this.drift=S(t.drift)),void 0!==t.enable&&(this.enable=t.enable),this.gravity.load(t.gravity);const e=t.outModes;void 0!==e&&(_t(e)?this.outModes.load(e):this.outModes.load({default:e})),this.path.load(t.path),void 0!==t.random&&(this.random=t.random),void 0!==t.size&&(this.size=t.size),void 0!==t.speed&&(this.speed=S(t.speed)),this.spin.load(t.spin),void 0!==t.straight&&(this.straight=t.straight),this.trail.load(t.trail),void 0!==t.vibrate&&(this.vibrate=t.vibrate),void 0!==t.warp&&(this.warp=t.warp)}}class Ye extends Ce{constructor(){super(),this.destroy="none",this.speed=2}load(t){super.load(t),t&&void 0!==t.destroy&&(this.destroy=t.destroy)}}class Ze extends Ie{constructor(){super(),this.animation=new Ye,this.value=1}load(t){if(!t)return;super.load(t);const e=t.animation;void 0!==e&&this.animation.load(e)}}class Qe{constructor(){this.enable=!1,this.width=1920,this.height=1080}load(t){if(!t)return;void 0!==t.enable&&(this.enable=t.enable);const e=t.width;void 0!==e&&(this.width=e);const i=t.height;void 0!==i&&(this.height=i)}}class Je{constructor(){this.mode="delete",this.value=0}load(t){t&&(void 0!==t.mode&&(this.mode=t.mode),void 0!==t.value&&(this.value=t.value))}}class Ke{constructor(){this.density=new Qe,this.limit=new Je,this.value=0}load(t){t&&(this.density.load(t.density),this.limit.load(t.limit),void 0!==t.value&&(this.value=t.value))}}class ti{constructor(){this.blur=0,this.color=new ce,this.enable=!1,this.offset={x:0,y:0},this.color.value="#000"}load(t){t&&(void 0!==t.blur&&(this.blur=t.blur),this.color=ce.create(this.color,t.color),void 
0!==t.enable&&(this.enable=t.enable),void 0!==t.offset&&(void 0!==t.offset.x&&(this.offset.x=t.offset.x),void 0!==t.offset.y&&(this.offset.y=t.offset.y)))}}class ei{constructor(){this.close=!0,this.fill=!0,this.options={},this.type="circle"}load(t){if(!t)return;const e=t.options;if(void 0!==e)for(const t in e){const i=e[t];i&&(this.options[t]=st(this.options[t]??{},i))}void 0!==t.close&&(this.close=t.close),void 0!==t.fill&&(this.fill=t.fill),void 0!==t.type&&(this.type=t.type)}}class ii extends Ce{constructor(){super(),this.destroy="none",this.speed=5}load(t){super.load(t),t&&void 0!==t.destroy&&(this.destroy=t.destroy)}}class si extends Ie{constructor(){super(),this.animation=new ii,this.value=3}load(t){if(super.load(t),!t)return;const e=t.animation;void 0!==e&&this.animation.load(e)}}class oi{constructor(){this.width=0}load(t){t&&(void 0!==t.color&&(this.color=Se.create(this.color,t.color)),void 0!==t.width&&(this.width=S(t.width)),void 0!==t.opacity&&(this.opacity=S(t.opacity)))}}class ni extends Re{constructor(){super(),this.opacityRate=1,this.sizeRate=1,this.velocityRate=1}load(t){super.load(t),t&&(void 0!==t.opacityRate&&(this.opacityRate=t.opacityRate),void 0!==t.sizeRate&&(this.sizeRate=t.sizeRate),void 0!==t.velocityRate&&(this.velocityRate=t.velocityRate))}}class ai{constructor(t,e){this._engine=t,this._container=e,this.bounce=new Ae,this.collisions=new Fe,this.color=new Se,this.color.value="#fff",this.effect=new Be,this.groups={},this.move=new Xe,this.number=new Ke,this.opacity=new Ze,this.reduceDuplicates=!1,this.shadow=new ti,this.shape=new ei,this.size=new si,this.stroke=new oi,this.zIndex=new ni}load(t){if(!t)return;if(void 0!==t.groups)for(const e of Object.keys(t.groups)){if(!Object.hasOwn(t.groups,e))continue;const i=t.groups[e];void 0!==i&&(this.groups[e]=st(this.groups[e]??{},i))}void 
0!==t.reduceDuplicates&&(this.reduceDuplicates=t.reduceDuplicates),this.bounce.load(t.bounce),this.color.load(Se.create(this.color,t.color)),this.effect.load(t.effect),this.move.load(t.move),this.number.load(t.number),this.opacity.load(t.opacity),this.shape.load(t.shape),this.size.load(t.size),this.shadow.load(t.shadow),this.zIndex.load(t.zIndex),this.collisions.load(t.collisions),void 0!==t.interactivity&&(this.interactivity=st({},t.interactivity));const e=t.stroke;if(e&&(this.stroke=dt(e,(t=>{const e=new oi;return e.load(t),e}))),this._container){const e=this._engine.updaters.get(this._container);if(e)for(const i of e)i.loadOptions&&i.loadOptions(this,t);const i=this._engine.interactors.get(this._container);if(i)for(const e of i)e.loadParticlesOptions&&e.loadParticlesOptions(this,t)}}}function ri(t,...e){for(const i of e)t.load(i)}function ci(t,e,...i){const s=new ai(t,e);return ri(s,...i),s}class li{constructor(t,e){this._findDefaultTheme=t=>this.themes.find((e=>e.default.value&&e.default.mode===t))??this.themes.find((t=>t.default.value&&"any"===t.default.mode)),this._importPreset=t=>{this.load(this._engine.getPreset(t))},this._engine=t,this._container=e,this.autoPlay=!0,this.background=new le,this.backgroundMask=new de,this.clear=!0,this.defaultThemes={},this.delay=0,this.fullScreen=new ue,this.detectRetina=!0,this.duration=0,this.fpsLimit=120,this.interactivity=new we(t,e),this.manualParticles=[],this.particles=ci(this._engine,this._container),this.pauseOnBlur=!0,this.pauseOnOutsideViewport=!0,this.responsive=[],this.smooth=!1,this.style={},this.themes=[],this.zLayers=100}load(t){if(!t)return;void 0!==t.preset&&dt(t.preset,(t=>this._importPreset(t))),void 0!==t.autoPlay&&(this.autoPlay=t.autoPlay),void 0!==t.clear&&(this.clear=t.clear),void 0!==t.name&&(this.name=t.name),void 0!==t.delay&&(this.delay=S(t.delay));const e=t.detectRetina;void 0!==e&&(this.detectRetina=e),void 0!==t.duration&&(this.duration=S(t.duration));const i=t.fpsLimit;void 
0!==i&&(this.fpsLimit=i),void 0!==t.pauseOnBlur&&(this.pauseOnBlur=t.pauseOnBlur),void 0!==t.pauseOnOutsideViewport&&(this.pauseOnOutsideViewport=t.pauseOnOutsideViewport),void 0!==t.zLayers&&(this.zLayers=t.zLayers),this.background.load(t.background);const s=t.fullScreen;gt(s)?this.fullScreen.enable=s:this.fullScreen.load(s),this.backgroundMask.load(t.backgroundMask),this.interactivity.load(t.interactivity),t.manualParticles&&(this.manualParticles=t.manualParticles.map((t=>{const e=new xe;return e.load(t),e}))),this.particles.load(t.particles),this.style=st(this.style,t.style),this._engine.loadOptions(this,t),void 0!==t.smooth&&(this.smooth=t.smooth);const o=this._engine.interactors.get(this._container);if(o)for(const e of o)e.loadOptions&&e.loadOptions(this,t);if(void 0!==t.responsive)for(const e of t.responsive){const t=new _e;t.load(e),this.responsive.push(t)}if(this.responsive.sort(((t,e)=>t.maxWidth-e.maxWidth)),void 0!==t.themes)for(const e of t.themes){const t=this.themes.find((t=>t.name===e.name));if(t)t.load(e);else{const t=new ze;t.load(e),this.themes.push(t)}}this.defaultThemes.dark=this._findDefaultTheme("dark")?.name,this.defaultThemes.light=this._findDefaultTheme("light")?.name}setResponsive(t,e,i){this.load(i);const s=this.responsive.find((i=>"screen"===i.mode&&screen?i.maxWidth>screen.availWidth:i.maxWidth*e>t));return this.load(s?.options),s?.maxWidth}setTheme(t){if(t){const e=this.themes.find((e=>e.name===t));e&&this.load(e.options)}else{const t=N("(prefers-color-scheme: dark)"),e=t&&t.matches,i=this._findDefaultTheme(e?"dark":"light");i&&this.load(i.options)}}}class hi{constructor(t,e){this.container=e,this._engine=t,this._interactors=t.getInteractors(this.container,!0),this._externalInteractors=[],this._particleInteractors=[]}async externalInteract(t){for(const e of this._externalInteractors)e.isEnabled()&&await e.interact(t)}handleClickMode(t){for(const e of 
this._externalInteractors)e.handleClickMode&&e.handleClickMode(t)}init(){this._externalInteractors=[],this._particleInteractors=[];for(const t of this._interactors){switch(t.type){case"external":this._externalInteractors.push(t);break;case"particles":this._particleInteractors.push(t)}t.init()}}async particlesInteract(t,e){for(const i of this._externalInteractors)i.clear(t,e);for(const i of this._particleInteractors)i.isEnabled(t)&&await i.interact(t,e)}async reset(t){for(const e of this._externalInteractors)e.isEnabled()&&e.reset(t);for(const e of this._particleInteractors)e.isEnabled(t)&&e.reset(t)}}function di(t){if(!Z(t.outMode,t.checkModes))return;const e=2*t.radius;t.coord>t.maxCoord-e?t.setCb(-t.radius):t.coord{for(const[,s]of t.plugins){const t=void 0!==s.particlePosition?s.particlePosition(e,this):void 0;if(t)return v.create(t.x,t.y,i)}const o=B({size:t.canvas.size,position:e}),n=v.create(o.x,o.y,i),a=this.getRadius(),r=this.options.move.outModes,c=e=>{di({outMode:e,checkModes:["bounce","bounce-horizontal"],coord:n.x,maxCoord:t.canvas.size.width,setCb:t=>n.x+=t,radius:a})},l=e=>{di({outMode:e,checkModes:["bounce","bounce-vertical"],coord:n.y,maxCoord:t.canvas.size.height,setCb:t=>n.y+=t,radius:a})};return c(r.left??r.default),c(r.right??r.default),l(r.top??r.default),l(r.bottom??r.default),this._checkOverlap(n,s)?this._calcPosition(t,void 0,i,s+1):n},this._calculateVelocity=()=>{const t=E(this.direction).copy(),e=this.options.move;if("inside"===e.direction||"outside"===e.direction)return t;const i=Math.PI/180*C(e.angle.value),s=Math.PI/180*C(e.angle.offset),o={left:s-.5*i,right:s+.5*i};return e.straight||(t.angle+=M(S(o.left,o.right))),e.random&&"number"==typeof e.speed&&(t.length*=_()),t},this._checkOverlap=(t,e=0)=>{const i=this.options.collisions,s=this.getRadius();if(!i.enable)return!1;const o=i.overlap;if(o.enable)return!1;const n=o.retries;if(n>=0&&e>n)throw new Error(`${f} particle is overlapping and can't be 
placed`);return!!this.container.particles.find((e=>T(t,e.position){if(!t||!this.roll||!this.backColor&&!this.roll.alter)return t;const e=this.roll.horizontal&&this.roll.vertical?2:1,i=this.roll.horizontal?.5*Math.PI:0;return Math.floor(((this.roll.angle??0)+i)/(Math.PI/e))%2?this.backColor?this.backColor:this.roll.alter?se(t,this.roll.alter.type,this.roll.alter.value):t:t},this._initPosition=t=>{const e=this.container,i=C(this.options.zIndex.value);this.position=this._calcPosition(e,t,k(i,0,e.zLayers)),this.initialPosition=this.position.copy();const s=e.canvas.size;switch(this.moveCenter={...yt(this.options.move.center,s),radius:this.options.move.center.radius??0,mode:this.options.move.center.mode??"percent"},this.direction=R(this.options.move.direction,this.position,this.moveCenter),this.options.move.direction){case"inside":this.outType="inside";break;case"outside":this.outType="outside"}this.offset=y.origin},this._engine=t,this.init(e,s,o,n)}destroy(t){if(this.unbreakable||this.destroyed)return;this.destroyed=!0,this.bubble.inRange=!1,this.slow.inRange=!1;const e=this.container,i=this.pathGenerator,s=e.shapeDrawers.get(this.shape);s&&s.particleDestroy&&s.particleDestroy(this);for(const[,i]of e.plugins)i.particleDestroyed&&i.particleDestroyed(this,t);for(const i of e.particles.updaters)i.particleDestroyed&&i.particleDestroyed(this,t);i&&i.reset(this),this._engine.dispatchEvent("particleDestroyed",{container:this.container,data:{particle:this}})}draw(t){const e=this.container,i=e.canvas;for(const[,s]of e.plugins)i.drawParticlePlugin(s,this,t);i.drawParticle(this,t)}getFillColor(){return this._getRollColor(this.bubble.color??$t(this.color))}getMass(){return this.getRadius()**2*Math.PI*.5}getPosition(){return{x:this.position.x+this.offset.x,y:this.position.y+this.offset.y,z:this.position.z}}getRadius(){return this.bubble.radius??this.size.value}getStrokeColor(){return this._getRollColor(this.bubble.color??$t(this.strokeColor))}init(t,e,i,s){const 
o=this.container,n=this._engine;this.id=t,this.group=s,this.effectClose=!0,this.effectFill=!0,this.shapeClose=!0,this.shapeFill=!0,this.pathRotation=!1,this.lastPathTime=0,this.destroyed=!1,this.unbreakable=!1,this.rotation=0,this.misplaced=!1,this.retina={maxDistance:{}},this.outType="normal",this.ignoresResizeRatio=!0;const a=o.retina.pixelRatio,r=o.actualOptions,c=ci(this._engine,o,r.particles),l=c.effect.type,h=c.shape.type,{reduceDuplicates:d}=c;this.effect=ut(l,this.id,d),this.shape=ut(h,this.id,d);const u=c.effect,p=c.shape;if(i){if(i.effect&&i.effect.type){const t=ut(i.effect.type,this.id,d);t&&(this.effect=t,u.load(i.effect))}if(i.shape&&i.shape.type){const t=ut(i.shape.type,this.id,d);t&&(this.shape=t,p.load(i.shape))}}this.effectData=function(t,e,i,s){const o=e.options[t];if(o)return st({close:e.close,fill:e.fill},ut(o,i,s))}(this.effect,u,this.id,d),this.shapeData=function(t,e,i,s){const o=e.options[t];if(o)return st({close:e.close,fill:e.fill},ut(o,i,s))}(this.shape,p,this.id,d),c.load(i);const f=this.effectData;f&&c.load(f.particles);const v=this.shapeData;v&&c.load(v.particles);const y=new we(n,o);y.load(o.actualOptions.interactivity),y.load(c.interactivity),this.interactivity=y,this.effectFill=f?.fill??c.effect.fill,this.effectClose=f?.close??c.effect.close,this.shapeFill=v?.fill??c.shape.fill,this.shapeClose=v?.close??c.shape.close,this.options=c;const m=this.options.move.path;this.pathDelay=1e3*C(m.delay.value),m.generator&&(this.pathGenerator=this._engine.getPathGenerator(m.generator),this.pathGenerator&&o.addPath(m.generator,this.pathGenerator)&&this.pathGenerator.init(o)),o.retina.initParticle(this),this.size=ft(this.options.size,a),this.bubble={inRange:!1},this.slow={inRange:!1,factor:1},this._initPosition(e),this.initialVelocity=this._calculateVelocity(),this.velocity=this.initialVelocity.copy(),this.moveDecay=1-C(this.options.move.decay);const 
g=o.particles;g.setLastZIndex(this.position.z),this.zIndexFactor=this.position.z/o.zLayers,this.sides=24;let b=o.effectDrawers.get(this.effect);b||(b=this._engine.getEffectDrawer(this.effect),b&&o.effectDrawers.set(this.effect,b)),b&&b.loadEffect&&b.loadEffect(this);let w=o.shapeDrawers.get(this.shape);w||(w=this._engine.getShapeDrawer(this.shape),w&&o.shapeDrawers.set(this.shape,w)),w&&w.loadShape&&w.loadShape(this);const x=w?.getSidesCount;x&&(this.sides=x(this)),this.spawning=!1,this.shadowColor=St(this.options.shadow.color);for(const t of g.updaters)t.init(this);for(const t of g.movers)t.init&&t.init(this);b&&b.particleInit&&b.particleInit(o,this),w&&w.particleInit&&w.particleInit(o,this);for(const[,t]of o.plugins)t.particleCreated&&t.particleCreated(this)}isInsideCanvas(){const t=this.getRadius(),e=this.container.canvas.size,i=this.position;return i.x>=-t&&i.y>=-t&&i.y<=e.height+t&&i.x<=e.width+t}isVisible(){return!this.destroyed&&!this.spawning&&this.isInsideCanvas()}reset(){for(const t of this.container.particles.updaters)t.reset&&t.reset(this)}}class pi{constructor(t,e){this.position=t,this.particle=e}}class fi{constructor(t,e){this.position={x:t,y:e}}}class vi extends fi{constructor(t,e,i,s){super(t,e),this.size={height:s,width:i}}contains(t){const e=this.size.width,i=this.size.height,s=this.position;return t.x>=s.x&&t.x<=s.x+e&&t.y>=s.y&&t.y<=s.y+i}intersects(t){t instanceof yi&&t.intersects(this);const e=this.size.width,i=this.size.height,s=this.position,o=t.position,n=t instanceof vi?t.size:{width:0,height:0},a=n.width,r=n.height;return o.xs.x&&o.ys.y}}class yi extends fi{constructor(t,e,i){super(t,e),this.radius=i}contains(t){return T(t,this.position)<=this.radius}intersects(t){const e=this.position,i=t.position,s=Math.abs(i.x-e.x),o=Math.abs(i.y-e.y),n=this.radius;if(t instanceof yi){return n+t.radius>Math.sqrt(s**2+o**2)}if(t instanceof vi){const{width:e,height:i}=t.size;return 
Math.pow(s-e,2)+Math.pow(o-i,2)<=n**2||s<=n+e&&o<=n+i||s<=e||o<=i}return!1}}class mi{constructor(t,e){this.rectangle=t,this.capacity=e,this._subdivide=()=>{const{x:t,y:e}=this.rectangle.position,{width:i,height:s}=this.rectangle.size,{capacity:o}=this;for(let n=0;n<4;n++)this._subs.push(new mi(new vi(t+.5*i*(n%2),e+.5*s*(Math.round(.5*n)-n%2),.5*i,.5*s),o));this._divided=!0},this._points=[],this._divided=!1,this._subs=[]}insert(t){return!!this.rectangle.contains(t.position)&&(this._points.lengthe.insert(t)))))}query(t,e,i){const s=i||[];if(!t.intersects(this.rectangle))return[];for(const i of this._points)!t.contains(i.position)&&T(t.position,i.position)>i.particle.getRadius()&&(!e||e(i.particle))||s.push(i.particle);if(this._divided)for(const i of this._subs)i.query(t,e,s);return s}queryCircle(t,e,i){return this.query(new yi(t.x,t.y,e),i)}queryRectangle(t,e,i){return this.query(new vi(t.x,t.y,e.width,e.height),i)}}const gi=t=>{const{height:e,width:i}=t;return new vi(-.25*i,-.25*e,1.5*i,1.5*e)};class bi{constructor(t,e){this._addToPool=(...t)=>{for(const e of t)this._pool.push(e)},this._applyDensity=(t,e,i)=>{const s=t.number;if(!t.number.density?.enable)return void(void 0===i?this._limit=s.limit.value:s.limit&&this._groupLimits.set(i,s.limit.value));const o=this._initDensityFactor(s.density),n=s.value,a=s.limit.value>0?s.limit.value:n,r=Math.min(n,a)*o+e,c=Math.min(this.count,this.filter((t=>t.group===i)).length);void 0===i?this._limit=s.limit.value*o:this._groupLimits.set(i,s.limit.value*o),cr&&this.removeQuantity(c-r,i)},this._initDensityFactor=t=>{const e=this._container;if(!e.canvas.element||!t.enable)return 1;const i=e.canvas.element,s=e.retina.pixelRatio;return i.width*i.height/(t.height*t.width*s**2)},this._pushParticle=(t,e,i,s)=>{try{let o=this._pool.pop();o?o.init(this._nextId,t,e,i):o=new ui(this._engine,this._nextId,this._container,t,e,i);let n=!0;if(s&&(n=s(o)),!n)return;return 
this._array.push(o),this._zArray.push(o),this._nextId++,this._engine.dispatchEvent("particleAdded",{container:this._container,data:{particle:o}}),o}catch(t){return void W().warning(`${f} adding particle: ${t}`)}},this._removeParticle=(t,e,i)=>{const s=this._array[t];if(!s||s.group!==e)return!1;const o=this._zArray.indexOf(s);return this._array.splice(t,1),this._zArray.splice(o,1),s.destroy(i),this._engine.dispatchEvent("particleRemoved",{container:this._container,data:{particle:s}}),this._addToPool(s),!0},this._engine=t,this._container=e,this._nextId=0,this._array=[],this._zArray=[],this._pool=[],this._limit=0,this._groupLimits=new Map,this._needsSort=!1,this._lastZIndex=0,this._interactionManager=new hi(t,e);const i=e.canvas.size;this.quadTree=new mi(gi(i),4),this.movers=this._engine.getMovers(e,!0),this.updaters=this._engine.getUpdaters(e,!0)}get count(){return this._array.length}addManualParticles(){const t=this._container,e=t.actualOptions;for(const i of e.manualParticles)this.addParticle(i.position?yt(i.position,t.canvas.size):void 0,i.options)}addParticle(t,e,i,s){const o=this._container.actualOptions.particles.number.limit,n=void 0===i?this._limit:this._groupLimits.get(i)??this._limit,a=this.count;if(n>0)if("delete"===o.mode){const t=a+1-n;t>0&&this.removeQuantity(t)}else if("wait"===o.mode&&a>=n)return;return this._pushParticle(t,e,i,s)}clear(){this._array=[],this._zArray=[]}destroy(){this._array=[],this._zArray=[],this.movers=[],this.updaters=[]}async draw(t){const e=this._container,i=e.canvas;i.clear(),await this.update(t);for(const[,s]of e.plugins)i.drawPlugin(s,t);for(const e of this._zArray)e.draw(t)}filter(t){return this._array.filter(t)}find(t){return this._array.find(t)}get(t){return this._array[t]}handleClickMode(t){this._interactionManager.handleClickMode(t)}init(){const t=this._container,e=t.actualOptions;this._lastZIndex=0,this._needsSort=!1;let i=!1;this.updaters=this._engine.getUpdaters(t,!0),this._interactionManager.init();for(const[,e]of 
t.plugins)if(void 0!==e.particlesInitialization&&(i=e.particlesInitialization()),i)break;this._interactionManager.init();for(const[,e]of t.pathGenerators)e.init(t);if(this.addManualParticles(),!i){const t=e.particles,i=t.groups;for(const e in i){const s=i[e];for(let i=this.count,o=0;othis.count)return;let o=0;for(let n=t;o!i.has(t);this._array=this.filter(t),this._zArray=this._zArray.filter(t);for(const t of i)this._engine.dispatchEvent("particleRemoved",{container:this._container,data:{particle:t}});this._addToPool(...i)}await this._interactionManager.externalInteract(t);for(const e of this._array){for(const i of this.updaters)i.update(e,t);e.destroyed||e.spawning||await this._interactionManager.particlesInteract(e,t)}if(delete this._resizeFactor,this._needsSort){const t=this._zArray;t.sort(((t,e)=>e.position.z-t.position.z||t.id-e.id)),this._lastZIndex=t[t.length-1].position.z,this._needsSort=!1}}}class wi{constructor(t){this.container=t,this.pixelRatio=1,this.reduceFactor=1}init(){const t=this.container,e=t.actualOptions;this.pixelRatio=!e.detectRetina||j()?1:window.devicePixelRatio,this.reduceFactor=1;const i=this.pixelRatio,s=t.canvas;if(s.element){const t=s.element;s.size.width=t.offsetWidth*i,s.size.height=t.offsetHeight*i}const o=e.particles,n=o.move;this.maxSpeed=C(n.gravity.maxSpeed)*i,this.sizeAnimationSpeed=C(o.size.animation.speed)*i}initParticle(t){const e=t.options,i=this.pixelRatio,s=e.move,o=s.distance,n=t.retina;n.moveDrift=C(s.drift)*i,n.moveSpeed=C(s.speed)*i,n.sizeAnimationSpeed=C(e.size.animation.speed)*i;const a=n.maxDistance;a.horizontal=void 0!==o.horizontal?o.horizontal*i:void 0,a.vertical=void 0!==o.vertical?o.vertical*i:void 0,n.maxSpeed=C(s.gravity.maxSpeed)*i}}function xi(t){return t&&!t.destroyed}function _i(t,e,...i){const s=new li(t,e);return ri(s,...i),s}class ki{constructor(t,e,i){this._intersectionManager=t=>{if(xi(this)&&this.actualOptions.pauseOnOutsideViewport)for(const e of 
t)e.target===this.interactivity.element&&(e.isIntersecting?this.play:this.pause)()},this._nextFrame=async t=>{try{if(!this._smooth&&void 0!==this._lastFrameTime&&t1e3)return void this.draw(!1);if(await this.particles.draw(e),!this.alive())return void this.destroy();this.getAnimationStatus()&&this.draw(!1)}catch(t){W().error(`${f} in animation loop`,t)}},this._engine=t,this.id=Symbol(e),this.fpsLimit=120,this._smooth=!1,this._delay=0,this._duration=0,this._lifeTime=0,this._firstStart=!0,this.started=!1,this.destroyed=!1,this._paused=!0,this._lastFrameTime=0,this.zLayers=100,this.pageHidden=!1,this._sourceOptions=i,this._initialSourceOptions=i,this.retina=new wi(this),this.canvas=new ne(this),this.particles=new bi(this._engine,this),this.pathGenerators=new Map,this.interactivity={mouse:{clicking:!1,inside:!1}},this.plugins=new Map,this.effectDrawers=new Map,this.shapeDrawers=new Map,this._options=_i(this._engine,this),this.actualOptions=_i(this._engine,this),this._eventListeners=new re(this),this._intersectionObserver=X((t=>this._intersectionManager(t))),this._engine.dispatchEvent("containerBuilt",{container:this})}get options(){return this._options}get sourceOptions(){return this._sourceOptions}addClickHandler(t){if(!xi(this))return;const e=this.interactivity.element;if(!e)return;const i=(e,i,s)=>{if(!xi(this))return;const o=this.retina.pixelRatio,n={x:i.x*o,y:i.y*o},a=this.particles.quadTree.queryCircle(n,s*o);t(e,a)};let s=!1,o=!1;e.addEventListener("click",(t=>{if(!xi(this))return;const e=t,s={x:e.offsetX||e.clientX,y:e.offsetY||e.clientY};i(t,s,1)})),e.addEventListener("touchstart",(()=>{xi(this)&&(s=!0,o=!1)})),e.addEventListener("touchmove",(()=>{xi(this)&&(o=!0)})),e.addEventListener("touchend",(t=>{if(xi(this)){if(s&&!o){const e=t;let s=e.touches[e.touches.length-1];if(!s&&(s=e.changedTouches[e.changedTouches.length-1],!s))return;const o=this.canvas.element,n=o?o.getBoundingClientRect():void 
0,a={x:s.clientX-(n?n.left:0),y:s.clientY-(n?n.top:0)};i(t,a,Math.max(s.radiusX,s.radiusY))}s=!1,o=!1}})),e.addEventListener("touchcancel",(()=>{xi(this)&&(s=!1,o=!1)}))}addLifeTime(t){this._lifeTime+=t}addPath(t,e,i=!1){return!(!xi(this)||!i&&this.pathGenerators.has(t))&&(this.pathGenerators.set(t,e),!0)}alive(){return!this._duration||this._lifeTime<=this._duration}destroy(){if(!xi(this))return;this.stop(),this.particles.destroy(),this.canvas.destroy();for(const[,t]of this.effectDrawers)t.destroy&&t.destroy(this);for(const[,t]of this.shapeDrawers)t.destroy&&t.destroy(this);for(const t of this.effectDrawers.keys())this.effectDrawers.delete(t);for(const t of this.shapeDrawers.keys())this.shapeDrawers.delete(t);this._engine.clearPlugins(this),this.destroyed=!0;const t=this._engine.dom(),e=t.findIndex((t=>t===this));e>=0&&t.splice(e,1),this._engine.dispatchEvent("containerDestroyed",{container:this})}draw(t){if(!xi(this))return;let e=t;this._drawAnimationFrame=requestAnimationFrame((async t=>{e&&(this._lastFrameTime=void 0,e=!1),await this._nextFrame(t)}))}async export(t,e={}){for(const[,i]of this.plugins){if(!i.export)continue;const s=await i.export(t,e);if(s.supported)return s.blob}W().error(`${f} - Export plugin with type ${t} not found`)}getAnimationStatus(){return!this._paused&&!this.pageHidden&&xi(this)}handleClickMode(t){if(xi(this)){this.particles.handleClickMode(t);for(const[,e]of this.plugins)e.handleClickMode&&e.handleClickMode(t)}}async init(){if(!xi(this))return;const t=this._engine.getSupportedEffects();for(const e of t){const t=this._engine.getEffectDrawer(e);t&&this.effectDrawers.set(e,t)}const e=this._engine.getSupportedShapes();for(const t of e){const e=this._engine.getShapeDrawer(t);e&&this.shapeDrawers.set(t,e)}this._options=_i(this._engine,this,this._initialSourceOptions,this.sourceOptions),this.actualOptions=_i(this._engine,this,this._options);const i=this._engine.getAvailablePlugins(this);for(const[t,e]of 
i)this.plugins.set(t,e);this.retina.init(),await this.canvas.init(),this.updateActualOptions(),this.canvas.initBackground(),this.canvas.resize(),this.zLayers=this.actualOptions.zLayers,this._duration=1e3*C(this.actualOptions.duration),this._delay=1e3*C(this.actualOptions.delay),this._lifeTime=0,this.fpsLimit=this.actualOptions.fpsLimit>0?this.actualOptions.fpsLimit:120,this._smooth=this.actualOptions.smooth;for(const[,t]of this.effectDrawers)t.init&&await t.init(this);for(const[,t]of this.shapeDrawers)t.init&&await t.init(this);for(const[,t]of this.plugins)t.init&&await t.init();this._engine.dispatchEvent("containerInit",{container:this}),this.particles.init(),this.particles.setDensity();for(const[,t]of this.plugins)t.particlesSetup&&t.particlesSetup();this._engine.dispatchEvent("particlesSetup",{container:this})}async loadTheme(t){xi(this)&&(this._currentTheme=t,await this.refresh())}pause(){if(xi(this)&&(void 0!==this._drawAnimationFrame&&(cancelAnimationFrame(this._drawAnimationFrame),delete this._drawAnimationFrame),!this._paused)){for(const[,t]of this.plugins)t.pause&&t.pause();this.pageHidden||(this._paused=!0),this._engine.dispatchEvent("containerPaused",{container:this})}}play(t){if(!xi(this))return;const e=this._paused||t;if(!this._firstStart||this.actualOptions.autoPlay){if(this._paused&&(this._paused=!1),e)for(const[,t]of this.plugins)t.play&&t.play();this._engine.dispatchEvent("containerPlay",{container:this}),this.draw(e||!1)}else this._firstStart=!1}async refresh(){if(xi(this))return this.stop(),this.start()}async reset(){if(xi(this))return this._initialSourceOptions=void 0,this._options=_i(this._engine,this),this.actualOptions=_i(this._engine,this,this._options),this.refresh()}async start(){xi(this)&&!this.started&&(await this.init(),this.started=!0,await new Promise((t=>{this._delayTimeout=setTimeout((async()=>{this._eventListeners.addListeners(),this.interactivity.element instanceof 
HTMLElement&&this._intersectionObserver&&this._intersectionObserver.observe(this.interactivity.element);for(const[,t]of this.plugins)t.start&&await t.start();this._engine.dispatchEvent("containerStarted",{container:this}),this.play(),t()}),this._delay)})))}stop(){if(xi(this)&&this.started){this._delayTimeout&&(clearTimeout(this._delayTimeout),delete this._delayTimeout),this._firstStart=!0,this.started=!1,this._eventListeners.removeListeners(),this.pause(),this.particles.clear(),this.canvas.stop(),this.interactivity.element instanceof HTMLElement&&this._intersectionObserver&&this._intersectionObserver.unobserve(this.interactivity.element);for(const[,t]of this.plugins)t.stop&&t.stop();for(const t of this.plugins.keys())this.plugins.delete(t);this._sourceOptions=this._options,this._engine.dispatchEvent("containerStopped",{container:this})}}updateActualOptions(){this.actualOptions.responsive=[];const t=this.actualOptions.setResponsive(this.canvas.size.width,this.retina.pixelRatio,this._options);return this.actualOptions.setTheme(this._currentTheme),this._responsiveMaxWidth!==t&&(this._responsiveMaxWidth=t,!0)}}class zi{constructor(){this._listeners=new Map}addEventListener(t,e){this.removeEventListener(t,e);let i=this._listeners.get(t);i||(i=[],this._listeners.set(t,i)),i.push(e)}dispatchEvent(t,e){const i=this._listeners.get(t);i&&i.forEach((t=>t(e)))}hasEventListener(t){return!!this._listeners.get(t)}removeAllEventListeners(t){t?this._listeners.delete(t):this._listeners=new Map}removeEventListener(t,e){const i=this._listeners.get(t);if(!i)return;const s=i.length,o=i.indexOf(e);o<0||(1===s?this._listeners.delete(t):i.splice(o,1))}}function Mi(t,e,i,s=!1){let o=e.get(t);return o&&!s||(o=[...i.values()].map((e=>e(t))),e.set(t,o)),o}class Ci{constructor(){this._configs=new Map,this._domArray=[],this._eventDispatcher=new zi,this._initialized=!1,this.plugins=[],this._initializers={interactors:new Map,movers:new Map,updaters:new Map},this.interactors=new Map,this.movers=new 
Map,this.updaters=new Map,this.presets=new Map,this.effectDrawers=new Map,this.shapeDrawers=new Map,this.pathGenerators=new Map}get configs(){const t={};for(const[e,i]of this._configs)t[e]=i;return t}get version(){return"3.0.2"}addConfig(t){const e=t.name??"default";this._configs.set(e,t),this._eventDispatcher.dispatchEvent("configAdded",{data:{name:e,config:t}})}async addEffect(t,e,i=!0){dt(t,(t=>{!this.getEffectDrawer(t)&&this.effectDrawers.set(t,e)})),await this.refresh(i)}addEventListener(t,e){this._eventDispatcher.addEventListener(t,e)}async addInteractor(t,e,i=!0){this._initializers.interactors.set(t,e),await this.refresh(i)}async addMover(t,e,i=!0){this._initializers.movers.set(t,e),await this.refresh(i)}async addParticleUpdater(t,e,i=!0){this._initializers.updaters.set(t,e),await this.refresh(i)}async addPathGenerator(t,e,i=!0){!this.getPathGenerator(t)&&this.pathGenerators.set(t,e),await this.refresh(i)}async addPlugin(t,e=!0){!this.getPlugin(t.id)&&this.plugins.push(t),await this.refresh(e)}async addPreset(t,e,i=!1,s=!0){(i||!this.getPreset(t))&&this.presets.set(t,e),await this.refresh(s)}async addShape(t,e,i=!0){dt(t,(t=>{!this.getShapeDrawer(t)&&this.shapeDrawers.set(t,e)})),await this.refresh(i)}clearPlugins(t){this.updaters.delete(t),this.movers.delete(t),this.interactors.delete(t)}dispatchEvent(t,e){this._eventDispatcher.dispatchEvent(t,e)}dom(){return this._domArray}domItem(t){const e=this.dom(),i=e[t];if(i&&!i.destroyed)return i;e.splice(t,1)}getAvailablePlugins(t){const e=new Map;for(const i of this.plugins)i.needsPlugin(t.actualOptions)&&e.set(i.id,i.getPlugin(t));return e}getEffectDrawer(t){return this.effectDrawers.get(t)}getInteractors(t,e=!1){return Mi(t,this.interactors,this._initializers.interactors,e)}getMovers(t,e=!1){return Mi(t,this.movers,this._initializers.movers,e)}getPathGenerator(t){return this.pathGenerators.get(t)}getPlugin(t){return this.plugins.find((e=>e.id===t))}getPreset(t){return this.presets.get(t)}getShapeDrawer(t){return 
this.shapeDrawers.get(t)}getSupportedEffects(){return this.effectDrawers.keys()}getSupportedShapes(){return this.shapeDrawers.keys()}getUpdaters(t,e=!1){return Mi(t,this.updaters,this._initializers.updaters,e)}init(){this._initialized||(this._initialized=!0)}async load(t){const e=t.id??`tsparticles${Math.floor(1e4*_())}`,{index:s,url:o}=t,n=o?await async function(t){const e=ut(t.url,t.index);if(!e)return t.fallback;const i=await fetch(e);return i.ok?i.json():(W().error(`${f} ${i.status} while retrieving config file`),t.fallback)}({fallback:t.options,url:o,index:s}):t.options;let a=t.element??document.getElementById(e);a||(a=document.createElement("div"),a.id=e,document.body.append(a));const r=ut(n,s),c=this.dom(),l=c.findIndex((t=>t.id.description===e));if(l>=0){const t=this.domItem(l);t&&!t.destroyed&&(t.destroy(),c.splice(l,1))}let h;if("canvas"===a.tagName.toLowerCase())h=a,h.dataset[i]="false";else{const t=a.getElementsByTagName("canvas");t.length?(h=t[0],h.dataset[i]="false"):(h=document.createElement("canvas"),h.dataset[i]="true",a.appendChild(h))}h.style.width||(h.style.width="100%"),h.style.height||(h.style.height="100%");const d=new ki(this,e,r);return l>=0?c.splice(l,0,d):c.push(d),d.canvas.loadCanvas(h),await d.start(),d}loadOptions(t,e){for(const i of this.plugins)i.loadOptions(t,e)}loadParticlesOptions(t,e,...i){const s=this.updaters.get(t);if(s)for(const t of s)t.loadOptions&&t.loadOptions(e,...i)}async refresh(t=!0){t&&this.dom().forEach((t=>t.refresh()))}removeEventListener(t,e){this._eventDispatcher.removeEventListener(t,e)}setOnClickHandler(t){const e=this.dom();if(!e.length)throw new Error(`${f} can only set click handlers after calling tsParticles.load()`);for(const i of e)i.addClickHandler(t)}}class Pi{constructor(){this.key="hsl",this.stringPrefix="hsl"}handleColor(t){const e=t.value.hsl??t.value;if(void 0!==e.h&&void 0!==e.s&&void 0!==e.l)return At(e)}handleRangeColor(t){const e=t.value.hsl??t.value;if(void 0!==e.h&&void 0!==e.l)return 
At({h:C(e.h),l:C(e.l),s:C(e.s)})}parseString(t){if(!t.startsWith("hsl"))return;const e=/hsla?\(\s*(\d+)\s*,\s*(\d+)%\s*,\s*(\d+)%\s*(,\s*([\d.%]+)\s*)?\)/i.exec(t);return e?Ft({a:e.length>4?H(e[5]):1,h:parseInt(e[1],10),l:parseInt(e[3],10),s:parseInt(e[2],10)}):void 0}}class Oi{constructor(){this.key="rgb",this.stringPrefix="rgb"}handleColor(t){const e=t.value.rgb??t.value;if(void 0!==e.r)return e}handleRangeColor(t){const e=t.value.rgb??t.value;if(void 0!==e.r)return{r:C(e.r),g:C(e.g),b:C(e.b)}}parseString(t){if(!t.startsWith(this.stringPrefix))return;const e=/rgba?\(\s*(\d+)\s*,\s*(\d+)\s*,\s*(\d+)\s*(,\s*([\d.%]+)\s*)?\)/i.exec(t);return e?{a:e.length>4?H(e[5]):1,b:parseInt(e[3],10),g:parseInt(e[2],10),r:parseInt(e[1],10)}:void 0}}class Si{constructor(t){this.container=t,this.type="external"}}class Di{constructor(t){this.container=t,this.type="particles"}}const Ti=function(){const t=new Oi,e=new Pi;Pt(t),Pt(e);const i=new Ci;return i.init(),i}();j()||(window.tsParticles=Ti);class Ri{constructor(){this.radius=0,this.mass=0}load(t){t&&(void 0!==t.mass&&(this.mass=t.mass),void 0!==t.radius&&(this.radius=t.radius))}}class Ei extends Re{constructor(){super(),this.density=5,this.value=50,this.limit=new Ri}load(t){t&&(super.load(t),void 0!==t.density&&(this.density=t.density),wt(t.limit)?this.limit.radius=t.limit:this.limit.load(t.limit))}}class Ii{constructor(){this.color=new ce,this.color.value="#000000",this.draggable=!1,this.opacity=1,this.destroy=!0,this.orbits=!1,this.size=new Ei}load(t){void 0!==t&&(void 0!==t.color&&(this.color=ce.create(this.color,t.color)),void 0!==t.draggable&&(this.draggable=t.draggable),this.name=t.name,void 0!==t.opacity&&(this.opacity=t.opacity),void 0!==t.position&&(this.position={},void 0!==t.position.x&&(this.position.x=S(t.position.x)),void 0!==t.position.y&&(this.position.y=S(t.position.y))),void 0!==t.size&&this.size.load(t.size),void 0!==t.destroy&&(this.destroy=t.destroy),void 0!==t.orbits&&(this.orbits=t.orbits))}}class 
Li{constructor(t,e,i,s){this.absorbers=t,this.container=e,this._calcPosition=()=>{const t=F({size:this.container.canvas.size,position:this.options.position});return y.create(t.x,t.y)},this._updateParticlePosition=(t,e)=>{if(t.destroyed)return;const i=this.container,s=i.canvas.size;if(t.needsNewPosition){const e=A({size:s});t.position.setTo(e),t.velocity.setTo(t.initialVelocity),t.absorberOrbit=void 0,t.needsNewPosition=!1}if(this.options.orbits){if(void 0===t.absorberOrbit&&(t.absorberOrbit=y.create(0,0),t.absorberOrbit.length=T(t.getPosition(),this.position),t.absorberOrbit.angle=_()*Math.PI*2),t.absorberOrbit.length<=this.size&&!this.options.destroy){const e=Math.min(s.width,s.height);t.absorberOrbit.length=e*(.2*_()-.1+1)}void 0===t.absorberOrbitDirection&&(t.absorberOrbitDirection=t.velocity.x>=0?"clockwise":"counter-clockwise");const o=t.absorberOrbit.length,n=t.absorberOrbit.angle,a=t.absorberOrbitDirection;t.velocity.setTo(y.origin);const r={x:"clockwise"===a?Math.cos:Math.sin,y:"clockwise"===a?Math.sin:Math.cos};t.position.x=this.position.x+o*r.x(n),t.position.y=this.position.y+o*r.y(n),t.absorberOrbit.length-=e.length,t.absorberOrbit.angle+=(t.retina.moveSpeed??0)*i.retina.pixelRatio/100*i.retina.reduceFactor}else{const i=y.origin;i.length=e.length,i.angle=e.angle,t.velocity.addTo(i)}},this.initialPosition=s?y.create(s.x,s.y):void 0,i instanceof Ii?this.options=i:(this.options=new Ii,this.options.load(i)),this.dragging=!1,this.name=this.options.name,this.opacity=this.options.opacity,this.size=C(this.options.size.value)*e.retina.pixelRatio,this.mass=this.size*this.options.size.density*e.retina.reduceFactor;const o=this.options.size.limit;this.limit={radius:o.radius*e.retina.pixelRatio*e.retina.reduceFactor,mass:o.mass},this.color=St(this.options.color)??{b:0,g:0,r:0},this.position=this.initialPosition?.copy()??this._calcPosition()}attract(t){const e=this.container,i=this.options;if(i.draggable){const 
t=e.interactivity.mouse;if(t.clicking&&t.downPosition){T(this.position,t.downPosition)<=this.size&&(this.dragging=!0)}else this.dragging=!1;this.dragging&&t.position&&(this.position.x=t.position.x,this.position.y=t.position.y)}const s=t.getPosition(),{dx:o,dy:n,distance:a}=D(this.position,s),r=y.create(o,n);if(r.length=this.mass/Math.pow(a,2)*e.retina.reduceFactor,at.getRadius()&&avoid 0===t||wt(t)?this.array[t||0]:this.array.find((e=>e.name===t)),t.addAbsorber=(t,e)=>this.addAbsorber(t,e)}addAbsorber(t,e){const i=new Li(this,this.container,t,e);return this.array.push(i),i}draw(t){for(const e of this.array)e.draw(t)}handleClickMode(t){const e=this.absorbers,i=this.interactivityAbsorbers;if("absorber"===t){const t=ut(i)??ut(e),s=this.container.interactivity.mouse.clickPosition;this.addAbsorber(t,s)}}async init(){this.absorbers=this.container.actualOptions.absorbers,this.interactivityAbsorbers=this.container.actualOptions.interactivity.modes.absorbers,dt(this.absorbers,(t=>{this.addAbsorber(t)}))}particleUpdate(t){for(const e of this.array)if(e.attract(t),t.destroyed)break}removeAbsorber(t){const e=this.array.indexOf(t);e>=0&&this.array.splice(e,1)}resize(){for(const t of this.array)t.resize()}stop(){this.array=[]}}class Fi{constructor(){this.id="absorbers"}getPlugin(t){return new Ai(t)}loadOptions(t,e){(this.needsPlugin(t)||this.needsPlugin(e))&&(e?.absorbers&&(t.absorbers=dt(e.absorbers,(t=>{const e=new Ii;return e.load(t),e}))),t.interactivity.modes.absorbers=dt(e?.interactivity?.modes?.absorbers,(t=>{const e=new Ii;return e.load(t),e})))}needsPlugin(t){if(!t)return!1;const e=t.absorbers;return kt(e)?!!e.length:!!e||!(!t.interactivity?.events?.onClick?.mode||!Z("absorber",t.interactivity.events.onClick.mode))}}class Bi{load(t){t&&(void 0!==t.bottom&&(this.bottom=S(t.bottom)),void 0!==t.left&&(this.left=S(t.left)),void 0!==t.right&&(this.right=S(t.right)),void 0!==t.top&&(this.top=S(t.top)))}}class qi extends Re{constructor(){super(),this.value=3}}class Hi extends 
Re{constructor(){super(),this.value={min:4,max:9}}}class Vi{constructor(){this.count=1,this.factor=new qi,this.rate=new Hi,this.sizeOffset=!0}load(t){t&&(void 0!==t.color&&(this.color=ce.create(this.color,t.color)),void 0!==t.count&&(this.count=t.count),this.factor.load(t.factor),this.rate.load(t.rate),this.particles=dt(t.particles,(t=>st({},t))),void 0!==t.sizeOffset&&(this.sizeOffset=t.sizeOffset),t.colorOffset&&(this.colorOffset=this.colorOffset??{},void 0!==t.colorOffset.h&&(this.colorOffset.h=t.colorOffset.h),void 0!==t.colorOffset.s&&(this.colorOffset.s=t.colorOffset.s),void 0!==t.colorOffset.l&&(this.colorOffset.l=t.colorOffset.l)))}}class Ui{constructor(){this.bounds=new Bi,this.mode="none",this.split=new Vi}load(t){t&&(t.mode&&(this.mode=t.mode),t.bounds&&this.bounds.load(t.bounds),this.split.load(t.split))}}function Wi(t,e,i,s){const o=i.options.destroy;if(!o)return;const n=o.split,a=ci(t,e,i.options),r=C(n.factor.value),c=i.getFillColor();n.color?a.color.load(n.color):n.colorOffset&&c?a.color.load({value:{hsl:{h:c.h+C(n.colorOffset.h??0),s:c.s+C(n.colorOffset.s??0),l:c.l+C(n.colorOffset.l??0)}}}):a.color.load({value:{hsl:i.getFillColor()}}),a.move.load({center:{x:i.position.x,y:i.position.y,mode:"precise"}}),wt(a.size.value)?a.size.value/=r:(a.size.value.min/=r,a.size.value.max/=r),a.load(s);const l=n.sizeOffset?S(-i.size.value,i.size.value):0,h={x:i.position.x+M(l),y:i.position.y+M(l)};return e.particles.addParticle(h,a,i.group,(t=>!(t.size.value<.5)&&(t.velocity.length=M(S(i.velocity.length,t.velocity.length)),t.splitCount=(i.splitCount??0)+1,t.unbreakable=!0,setTimeout((()=>{t.unbreakable=!1}),500),!0)))}class $i{constructor(t,e){this.engine=t,this.container=e}init(t){const e=this.container,i=t.options.destroy;if(!i)return;t.splitCount=0;const 
s=i.bounds;t.destroyBounds||(t.destroyBounds={});const{bottom:o,left:n,right:a,top:r}=s,{destroyBounds:c}=t,l=e.canvas.size;o&&(c.bottom=C(o)*l.height/100),n&&(c.left=C(n)*l.width/100),a&&(c.right=C(a)*l.width/100),r&&(c.top=C(r)*l.height/100)}isEnabled(t){return!t.destroyed}loadOptions(t,...e){t.destroy||(t.destroy=new Ui);for(const i of e)t.destroy.load(i?.destroy)}particleDestroyed(t,e){if(e)return;const i=t.options.destroy;i&&"split"===i.mode&&function(t,e,i){const s=i.options.destroy;if(!s)return;const o=s.split;if(o.count>=0&&(void 0===i.splitCount||i.splitCount++>o.count))return;const n=C(o.rate.value),a=ut(o.particles);for(let s=0;s=i.bottom||void 0!==i.left&&e.x<=i.left||void 0!==i.right&&e.x>=i.right||void 0!==i.top&&e.y<=i.top)&&t.destroy()}}class ji{constructor(){this.wait=!1}load(t){t&&(void 0!==t.count&&(this.count=t.count),void 0!==t.delay&&(this.delay=S(t.delay)),void 0!==t.duration&&(this.duration=S(t.duration)),void 0!==t.wait&&(this.wait=t.wait))}}class Gi{constructor(){this.quantity=1,this.delay=.1}load(t){void 0!==t&&(void 0!==t.quantity&&(this.quantity=S(t.quantity)),void 0!==t.delay&&(this.delay=S(t.delay)))}}class Ni{constructor(){this.color=!1,this.opacity=!1}load(t){t&&(void 0!==t.color&&(this.color=t.color),void 0!==t.opacity&&(this.opacity=t.opacity))}}class Xi{constructor(){this.options={},this.replace=new Ni,this.type="square"}load(t){t&&(void 0!==t.options&&(this.options=st({},t.options??{})),this.replace.load(t.replace),void 0!==t.type&&(this.type=t.type))}}class Yi{constructor(){this.mode="percent",this.height=0,this.width=0}load(t){void 0!==t&&(void 0!==t.mode&&(this.mode=t.mode),void 0!==t.height&&(this.height=t.height),void 0!==t.width&&(this.width=t.width))}}class Zi{constructor(){this.autoPlay=!0,this.fill=!0,this.life=new ji,this.rate=new Gi,this.shape=new Xi,this.startCount=0}load(t){t&&(void 0!==t.autoPlay&&(this.autoPlay=t.autoPlay),void 0!==t.size&&(this.size||(this.size=new Yi),this.size.load(t.size)),void 
0!==t.direction&&(this.direction=t.direction),this.domId=t.domId,void 0!==t.fill&&(this.fill=t.fill),this.life.load(t.life),this.name=t.name,this.particles=dt(t.particles,(t=>st({},t))),this.rate.load(t.rate),this.shape.load(t.shape),void 0!==t.position&&(this.position={},void 0!==t.position.x&&(this.position.x=S(t.position.x)),void 0!==t.position.y&&(this.position.y=S(t.position.y))),void 0!==t.spawnColor&&(void 0===this.spawnColor&&(this.spawnColor=new Se),this.spawnColor.load(t.spawnColor)),void 0!==t.startCount&&(this.startCount=t.startCount))}}function Qi(t,e){t.color?t.color.value=e:t.color={value:e}}class Ji{constructor(t,e,i,s,o){this.emitters=e,this.container=i,this._destroy=()=>{this._mutationObserver?.disconnect(),this._mutationObserver=void 0,this._resizeObserver?.disconnect(),this._resizeObserver=void 0,this.emitters.removeEmitter(this),this._engine.dispatchEvent("emitterDestroyed",{container:this.container,data:{emitter:this}})},this._prepareToDie=()=>{if(this._paused)return;const t=void 0!==this.options.life?.duration?C(this.options.life.duration):void 0;this.container.retina.reduceFactor&&(this._lifeCount>0||this._immortal)&&void 0!==t&&t>0&&(this._duration=1e3*t)},this._setColorAnimation=(t,e,i)=>{const s=this.container;if(!t.enable)return e;const o=M(t.offset),n=1e3*C(this.options.rate.delay)/s.retina.reduceFactor;return(e+C(t.speed??0)*s.fpsLimit/n+3.6*o)%i},this._engine=t,this._currentDuration=0,this._currentEmitDelay=0,this._currentSpawnDelay=0,this._initialPosition=o,s instanceof Zi?this.options=s:(this.options=new Zi,this.options.load(s)),this._spawnDelay=1e3*C(this.options.life.delay??0)/this.container.retina.reduceFactor,this.position=this._initialPosition??this._calcPosition(),this.name=this.options.name,this.fill=this.options.fill,this._firstSpawn=!this.options.life.wait,this._startParticlesAdded=!1;let 
n=st({},this.options.particles);if(n??={},n.move??={},n.move.direction??=this.options.direction,this.options.spawnColor&&(this.spawnColor=Rt(this.options.spawnColor)),this._paused=!this.options.autoPlay,this._particlesOptions=n,this._size=this._calcSize(),this.size=mt(this._size,this.container.canvas.size),this._lifeCount=this.options.life.count??-1,this._immortal=this._lifeCount<=0,this.options.domId){const t=document.getElementById(this.options.domId);t&&(this._mutationObserver=new MutationObserver((()=>{this.resize()})),this._resizeObserver=new ResizeObserver((()=>{this.resize()})),this._mutationObserver.observe(t,{attributes:!0,attributeFilter:["style","width","height"]}),this._resizeObserver.observe(t))}const a=this.options.shape,r=this._engine.emitterShapeManager?.getShapeGenerator(a.type);r&&(this._shape=r.generate(this.position,this.size,this.fill,a.options)),this._engine.dispatchEvent("emitterCreated",{container:i,data:{emitter:this}}),this.play()}externalPause(){this._paused=!0,this.pause()}externalPlay(){this._paused=!1,this.play()}async init(){await(this._shape?.init())}pause(){this._paused||delete this._emitDelay}play(){if(!this._paused&&this.container.retina.reduceFactor&&(this._lifeCount>0||this._immortal||!this.options.life.count)&&(this._firstSpawn||this._currentSpawnDelay>=(this._spawnDelay??0))){if(void 0===this._emitDelay){const t=C(this.options.rate.delay);this._emitDelay=1e3*t/this.container.retina.reduceFactor}(this._lifeCount>0||this._immortal)&&this._prepareToDie()}}resize(){const t=this._initialPosition;this.position=t&&tt(t,this.container.canvas.size,y.origin)?t:this._calcPosition(),this._size=this._calcSize(),this.size=mt(this._size,this.container.canvas.size),this._shape?.resize(this.position,this.size)}async update(t){this._paused||(this._firstSpawn&&(this._firstSpawn=!1,this._currentSpawnDelay=this._spawnDelay??0,this._currentEmitDelay=this._emitDelay??0),this._startParticlesAdded||(this._startParticlesAdded=!0,await 
this._emitParticles(this.options.startCount)),void 0!==this._duration&&(this._currentDuration+=t.value,this._currentDuration>=this._duration&&(this.pause(),void 0!==this._spawnDelay&&delete this._spawnDelay,this._immortal||this._lifeCount--,this._lifeCount>0||this._immortal?(this.position=this._calcPosition(),this._shape?.resize(this.position,this.size),this._spawnDelay=1e3*C(this.options.life.delay??0)/this.container.retina.reduceFactor):this._destroy(),this._currentDuration-=this._duration,delete this._duration)),void 0!==this._spawnDelay&&(this._currentSpawnDelay+=t.value,this._currentSpawnDelay>=this._spawnDelay&&(this._engine.dispatchEvent("emitterPlay",{container:this.container}),this.play(),this._currentSpawnDelay-=this._currentSpawnDelay,delete this._spawnDelay)),void 0!==this._emitDelay&&(this._currentEmitDelay+=t.value,this._currentEmitDelay>=this._emitDelay&&(this._emit(),this._currentEmitDelay-=this._emitDelay)))}_calcPosition(){if(this.options.domId){const t=this.container,e=document.getElementById(this.options.domId);if(e){const i=e.getBoundingClientRect();return{x:(i.x+i.width/2)*t.retina.pixelRatio,y:(i.y+i.height/2)*t.retina.pixelRatio}}}return F({size:this.container.canvas.size,position:this.options.position})}_calcSize(){const t=this.container;if(this.options.domId){const e=document.getElementById(this.options.domId);if(e){const i=e.getBoundingClientRect();return{width:i.width*t.retina.pixelRatio,height:i.height*t.retina.pixelRatio,mode:"precise"}}}return this.options.size??(()=>{const t=new Yi;return t.load({height:0,mode:"percent",width:0}),t})()}async _emit(){if(this._paused)return;const t=C(this.options.rate.quantity);await this._emitParticles(t)}async _emitParticles(t){const e=ut(this._particlesOptions);for(let i=0;ivoid 0===t||wt(t)?this.array[t||0]:this.array.find((e=>e.name===t)),e.addEmitter=async(t,e)=>this.addEmitter(t,e),e.removeEmitter=t=>{const i=e.getEmitter(t);i&&this.removeEmitter(i)},e.playEmitter=t=>{const 
i=e.getEmitter(t);i&&i.externalPlay()},e.pauseEmitter=t=>{const i=e.getEmitter(t);i&&i.externalPause()}}async addEmitter(t,e){const i=new Zi;i.load(t);const s=new Ji(this._engine,this,this.container,i,e);return await s.init(),this.array.push(s),s}handleClickMode(t){const e=this.emitters,i=this.interactivityEmitters;if("emitter"!==t)return;let s;if(i&&kt(i.value))if(i.value.length>0&&i.random.enable){s=[];const t=[];for(let e=0;e{this.addEmitter(t,n)}))}async init(){if(this.emitters=this.container.actualOptions.emitters,this.interactivityEmitters=this.container.actualOptions.interactivity.modes.emitters,this.emitters)if(kt(this.emitters))for(const t of this.emitters)await this.addEmitter(t);else await this.addEmitter(this.emitters)}pause(){for(const t of this.array)t.pause()}play(){for(const t of this.array)t.play()}removeEmitter(t){const e=this.array.indexOf(t);e>=0&&this.array.splice(e,1)}resize(){for(const t of this.array)t.resize()}stop(){this.array=[]}async update(t){for(const e of this.array)await e.update(t)}}const ts=new Map;class es{constructor(t){this._engine=t}addShapeGenerator(t,e){this.getShapeGenerator(t)||ts.set(t,e)}getShapeGenerator(t){return ts.get(t)}getSupportedShapeGenerators(){return ts.keys()}}class is{constructor(t,e,i,s){this.position=t,this.size=e,this.fill=i,this.options=s}resize(t,e){this.position=t,this.size=e}}class ss{constructor(t){this._engine=t,this.id="emitters"}getPlugin(t){return new Ki(this._engine,t)}loadOptions(t,e){if(!this.needsPlugin(t)&&!this.needsPlugin(e))return;e?.emitters&&(t.emitters=dt(e.emitters,(t=>{const e=new Zi;return e.load(t),e})));const i=e?.interactivity?.modes?.emitters;if(i)if(kt(i))t.interactivity.modes.emitters={random:{count:1,enable:!0},value:i.map((t=>{const e=new Zi;return e.load(t),e}))};else{const e=i;if(void 0!==e.value)if(kt(e.value))t.interactivity.modes.emitters={random:{count:e.random.count??1,enable:e.random.enable??!1},value:e.value.map((t=>{const e=new Zi;return e.load(t),e}))};else{const 
i=new Zi;i.load(e.value),t.interactivity.modes.emitters={random:{count:e.random.count??1,enable:e.random.enable??!1},value:i}}else{(t.interactivity.modes.emitters={random:{count:1,enable:!1},value:new Zi}).value.load(i)}}}needsPlugin(t){if(!t)return!1;const e=t.emitters;return kt(e)&&!!e.length||void 0!==e||!!t.interactivity?.events?.onClick?.mode&&Z("emitter",t.interactivity.events.onClick.mode)}}class os extends is{constructor(t,e,i,s){super(t,e,i,s)}async init(){}async randomPosition(){const t=this.size,e=this.fill,i=this.position,[s,o]=[t.width/2,t.height/2],n=((t,e)=>{const i=_()/4,s=Math.atan(e/t*Math.tan(2*Math.PI*i)),o=_();return o<.25?s:o<.5?Math.PI-s:o<.75?Math.PI+s:-s})(s,o),a=(h=n,(c=s)*(l=o)/Math.sqrt((l*Math.cos(h))**2+(c*Math.sin(h))**2)),r=e?a*Math.sqrt(_()):a;var c,l,h;return{position:{x:i.x+r*Math.cos(n),y:i.y+r*Math.sin(n)}}}}class ns{generate(t,e,i,s){return new os(t,e,i,s)}}function as(t,e){return t+e*(_()-.5)}class rs extends is{constructor(t,e,i,s){super(t,e,i,s)}async init(){}async randomPosition(){const t=this.fill,e=this.position,i=this.size;if(t)return{position:{x:as(e.x,i.width),y:as(e.y,i.height)}};{const t=i.width/2,s=i.height/2,o=Math.floor(4*_()),n=2*(_()-.5);switch(o){case 0:return{position:{x:e.x+n*t,y:e.y-s}};case 1:return{position:{x:e.x-t,y:e.y+n*s}};case 2:return{position:{x:e.x+n*t,y:e.y+s}};default:return{position:{x:e.x+t,y:e.y+n*s}}}}}}class cs{generate(t,e,i,s){return new rs(t,e,i,s)}}class ls{constructor(){this.delay=1,this.pauseOnStop=!1,this.quantity=1}load(t){t&&(void 0!==t.delay&&(this.delay=t.delay),void 0!==t.quantity&&(this.quantity=t.quantity),void 0!==t.particles&&(this.particles=st({},t.particles)),void 0!==t.pauseOnStop&&(this.pauseOnStop=t.pauseOnStop))}}const hs="trail";class ds extends Si{constructor(t){super(t),this._delay=0}clear(){}init(){}async interact(t){const e=this.container,{interactivity:i}=e;if(!e.retina.reduceFactor)return;const s=e.actualOptions.interactivity.modes.trail;if(!s)return;const 
o=1e3*s.delay/this.container.retina.reduceFactor;if(this._delay=.5?"darken":"enlighten";t.roll.alter={type:i,value:C("darken"===i?e.darken.value:e.enlighten.value)}}else e.darken.enable?t.roll.alter={type:"darken",value:C(e.darken.value)}:e.enlighten.enable&&(t.roll.alter={type:"enlighten",value:C(e.enlighten.value)});else t.roll={enable:!1,horizontal:!1,vertical:!1,angle:0,speed:0}}(t)}isEnabled(t){const e=t.options.roll;return!t.destroyed&&!t.spawning&&!!e?.enable}loadOptions(t,...e){t.roll||(t.roll=new ps);for(const i of e)t.roll.load(i?.roll)}update(t,e){this.isEnabled(t)&&function(t,e){const i=t.options.roll,s=t.roll;if(!s||!i?.enable)return;const o=s.speed*e.factor,n=2*Math.PI;s.angle+=o,s.angle>n&&(s.angle-=n)}(t,e)}}function vs(t,e,i,s,o,n){!function(t,e){const i=t.options,s=i.move.path;if(!s.enable)return;if(t.lastPathTime<=t.pathDelay)return void(t.lastPathTime+=e.value);const o=t.pathGenerator?.generate(t,e);o&&t.velocity.addTo(o);s.clamp&&(t.velocity.x=k(t.velocity.x,-1,1),t.velocity.y=k(t.velocity.y,-1,1));t.lastPathTime-=t.pathDelay}(t,n);const a=t.gravity,r=a?.enable&&a.inverse?-1:1;o&&i&&(t.velocity.x+=o*n.factor/(60*i)),a?.enable&&i&&(t.velocity.y+=r*(a.acceleration*n.factor)/(60*i));const c=t.moveDecay;t.velocity.multTo(c);const l=t.velocity.mult(i);a?.enable&&s>0&&(!a.inverse&&l.y>=0&&l.y>=s||a.inverse&&l.y<=0&&l.y<=-s)&&(l.y=r*s,i&&(t.velocity.y=l.y/i));const h=t.options.zIndex,d=(1-t.zIndexFactor)**h.velocityRate;l.multTo(d);const{position:u}=t;u.addTo(l),e.vibrate&&(u.x+=Math.sin(u.x*Math.cos(u.y)),u.y+=Math.cos(u.y*Math.sin(u.x)))}class ys{constructor(){this._initSpin=t=>{const e=t.container,i=t.options.move.spin;if(!i.enable)return;const 
s=i.position??{x:50,y:50},o={x:.01*s.x*e.canvas.size.width,y:.01*s.y*e.canvas.size.height},n=T(t.getPosition(),o),a=C(i.acceleration);t.retina.spinAcceleration=a*e.retina.pixelRatio,t.spin={center:o,direction:t.velocity.x>=0?"clockwise":"counter-clockwise",angle:t.velocity.angle,radius:n,acceleration:t.retina.spinAcceleration}}}init(t){const e=t.options.move.gravity;t.gravity={enable:e.enable,acceleration:C(e.acceleration),inverse:e.inverse},this._initSpin(t)}isEnabled(t){return!t.destroyed&&t.options.move.enable}move(t,e){const i=t.options,s=i.move;if(!s.enable)return;const o=t.container,n=o.retina.pixelRatio,a=function(t){return t.slow.inRange?t.slow.factor:1}(t),r=(t.retina.moveSpeed??=C(s.speed)*n)*o.retina.reduceFactor,c=t.retina.moveDrift??=C(t.options.move.drift)*n,l=O(i.size.value)*n,h=r*(s.size?t.getRadius()/l:1)*a*(e.factor||1)/2,d=t.retina.maxSpeed??o.retina.maxSpeed;s.spin.enable?function(t,e){const i=t.container;if(!t.spin)return;const s={x:"clockwise"===t.spin.direction?Math.cos:Math.sin,y:"clockwise"===t.spin.direction?Math.sin:Math.cos};t.position.x=t.spin.center.x+t.spin.radius*s.x(t.spin.angle),t.position.y=t.spin.center.y+t.spin.radius*s.y(t.spin.angle),t.spin.radius+=t.spin.acceleration;const o=Math.max(i.canvas.size.width,i.canvas.size.height),n=.5*o;t.spin.radius>n?(t.spin.radius=n,t.spin.acceleration*=-1):t.spin.radius<0&&(t.spin.radius=0,t.spin.acceleration*=-1),t.spin.angle+=.01*e*(1-t.spin.radius/o)}(t,h):vs(t,s,h,d,c,e),function(t){const e=t.initialPosition,{dx:i,dy:s}=D(e,t.position),o=Math.abs(i),n=Math.abs(s),{maxDistance:a}=t.retina,r=a.horizontal,c=a.vertical;if(r||c)if((r&&o>=r||c&&n>=c)&&!t.misplaced)t.misplaced=!!r&&o>r||!!c&&n>c,r&&(t.velocity.x=.5*t.velocity.y-t.velocity.x),c&&(t.velocity.y=.5*t.velocity.x-t.velocity.y);else if((!r||oe.x&&s.x>0)&&(s.x*=-_()),c&&(i.ye.y&&s.y>0)&&(s.y*=-_())}}(t)}}class ms{draw(t){const{context:e,particle:i,radius:s}=t;i.circleRange||(i.circleRange={min:0,max:2*Math.PI});const 
o=i.circleRange;e.arc(0,0,s,o.min,o.max,!1)}getSidesCount(){return 12}particleInit(t,e){const i=e.shapeData,s=i?.angle??{max:360,min:0};e.circleRange=_t(s)?{min:s.min*Math.PI/180,max:s.max*Math.PI/180}:{min:0,max:s*Math.PI/180}}}function gs(t,e,i,s,o){if(!e||!i.enable||(e.maxLoops??0)>0&&(e.loops??0)>(e.maxLoops??0))return;if(e.time||(e.time=0),(e.delayTime??0)>0&&e.time<(e.delayTime??0)&&(e.time+=t.value),(e.delayTime??0)>0&&e.time<(e.delayTime??0))return;const n=M(i.offset),a=(e.velocity??0)*t.factor+3.6*n,r=e.decay??1;o&&"increasing"!==e.status?(e.value-=a,e.value<0&&(e.loops||(e.loops=0),e.loops++,e.status="increasing",e.value+=e.value)):(e.value+=a,e.value>s&&(e.loops||(e.loops=0),e.loops++,o&&(e.status="decreasing",e.value-=e.value%s))),e.velocity&&1!==r&&(e.velocity*=r),e.value>s&&(e.value%=s)}class bs{constructor(t){this.container=t}init(t){const e=Rt(t.options.color,t.id,t.options.reduceDuplicates);e&&(t.color=jt(e,t.options.color.animation,this.container.retina.reduceFactor))}isEnabled(t){const{h:e,s:i,l:s}=t.options.color.animation,{color:o}=t;return!t.destroyed&&!t.spawning&&(void 0!==o?.h.value&&e.enable||void 0!==o?.s.value&&i.enable||void 0!==o?.l.value&&s.enable)}update(t,e){!function(t,e){const{h:i,s,l:o}=t.options.color.animation,{color:n}=t;if(!n)return;const{h:a,s:r,l:c}=n;a&&gs(e,a,i,360,!1),r&&gs(e,r,s,100,!0),c&&gs(e,c,o,100,!0)}(t,e)}}class ws{constructor(t){this.container=t}init(t){const e=t.options.opacity;t.opacity=ft(e,1);const i=e.animation;i.enable&&(t.opacity.velocity=C(i.speed)/100*this.container.retina.reduceFactor,i.sync||(t.opacity.velocity*=_()))}isEnabled(t){return!t.destroyed&&!t.spawning&&!!t.opacity&&t.opacity.enable&&((t.opacity.maxLoops??0)<=0||(t.opacity.maxLoops??0)>0&&(t.opacity.loops??0)<(t.opacity.maxLoops??0))}reset(t){t.opacity&&(t.opacity.time=0,t.opacity.loops=0)}update(t,e){this.isEnabled(t)&&function(t,e){const i=t.opacity;if(t.destroyed||!i?.enable||(i.maxLoops??0)>0&&(i.loops??0)>(i.maxLoops??0))return;const 
s=i.min,o=i.max,n=i.decay??1;if(i.time||(i.time=0),(i.delayTime??0)>0&&i.time<(i.delayTime??0)&&(i.time+=e.value),!((i.delayTime??0)>0&&i.time<(i.delayTime??0))){switch(i.status){case"increasing":i.value>=o?(i.status="decreasing",i.loops||(i.loops=0),i.loops++):i.value+=(i.velocity??0)*e.factor;break;case"decreasing":i.value<=s?(i.status="increasing",i.loops||(i.loops=0),i.loops++):i.value-=(i.velocity??0)*e.factor}i.velocity&&1!==i.decay&&(i.velocity*=n),function(t,e,i,s){switch(t.options.opacity.animation.destroy){case"max":e>=s&&t.destroy();break;case"min":e<=i&&t.destroy()}}(t,i.value,s,o),t.destroyed||(i.value=k(i.value,s,o))}}(t,e)}}class xs{constructor(t){this.container=t,this.modes=["bounce","bounce-vertical","bounce-horizontal","bounceVertical","bounceHorizontal","split"]}update(t,e,i,s){if(!this.modes.includes(s))return;const o=this.container;let n=!1;for(const[,s]of o.plugins)if(void 0!==s.particleBounce&&(n=s.particleBounce(t,i,e)),n)break;if(n)return;const a=t.getPosition(),r=t.offset,c=t.getRadius(),l=it(a,c),h=o.canvas.size;!function(t){if("bounce"!==t.outMode&&"bounce-horizontal"!==t.outMode&&"bounceHorizontal"!==t.outMode&&"split"!==t.outMode||"left"!==t.direction&&"right"!==t.direction)return;t.bounds.right<0&&"left"===t.direction?t.particle.position.x=t.size+t.offset.x:t.bounds.left>t.canvasSize.width&&"right"===t.direction&&(t.particle.position.x=t.canvasSize.width-t.size-t.offset.x);const e=t.particle.velocity.x;let i=!1;if("right"===t.direction&&t.bounds.right>=t.canvasSize.width&&e>0||"left"===t.direction&&t.bounds.left<=0&&e<0){const e=C(t.particle.options.bounce.horizontal.value);t.particle.velocity.x*=-e,i=!0}if(!i)return;const 
s=t.offset.x+t.size;t.bounds.right>=t.canvasSize.width&&"right"===t.direction?t.particle.position.x=t.canvasSize.width-s:t.bounds.left<=0&&"left"===t.direction&&(t.particle.position.x=s),"split"===t.outMode&&t.particle.destroy()}({particle:t,outMode:s,direction:e,bounds:l,canvasSize:h,offset:r,size:c}),function(t){if("bounce"!==t.outMode&&"bounce-vertical"!==t.outMode&&"bounceVertical"!==t.outMode&&"split"!==t.outMode||"bottom"!==t.direction&&"top"!==t.direction)return;t.bounds.bottom<0&&"top"===t.direction?t.particle.position.y=t.size+t.offset.y:t.bounds.top>t.canvasSize.height&&"bottom"===t.direction&&(t.particle.position.y=t.canvasSize.height-t.size-t.offset.y);const e=t.particle.velocity.y;let i=!1;if("bottom"===t.direction&&t.bounds.bottom>=t.canvasSize.height&&e>0||"top"===t.direction&&t.bounds.top<=0&&e<0){const e=C(t.particle.options.bounce.vertical.value);t.particle.velocity.y*=-e,i=!0}if(!i)return;const s=t.offset.y+t.size;t.bounds.bottom>=t.canvasSize.height&&"bottom"===t.direction?t.particle.position.y=t.canvasSize.height-s:t.bounds.top<=0&&"top"===t.direction&&(t.particle.position.y=s),"split"===t.outMode&&t.particle.destroy()}({particle:t,outMode:s,direction:e,bounds:l,canvasSize:h,offset:r,size:c})}}class _s{constructor(t){this.container=t,this.modes=["destroy"]}update(t,e,i,s){if(!this.modes.includes(s))return;const o=this.container;switch(t.outType){case"normal":case"outside":if(tt(t.position,o.canvas.size,y.origin,t.getRadius(),e))return;break;case"inside":{const{dx:e,dy:i}=D(t.position,t.moveCenter),{x:s,y:o}=t.velocity;if(s<0&&e>t.moveCenter.radius||o<0&&i>t.moveCenter.radius||s>=0&&e<-t.moveCenter.radius||o>=0&&i<-t.moveCenter.radius)return;break}}o.particles.remove(t,void 0,!0)}}class ks{constructor(t){this.container=t,this.modes=["none"]}update(t,e,i,s){if(!this.modes.includes(s))return;if(t.options.move.distance.horizontal&&("left"===e||"right"===e)||t.options.move.distance.vertical&&("top"===e||"bottom"===e))return;const 
o=t.options.move.gravity,n=this.container,a=n.canvas.size,r=t.getRadius();if(o.enable){const i=t.position;(!o.inverse&&i.y>a.height+r&&"bottom"===e||o.inverse&&i.y<-r&&"top"===e)&&n.particles.remove(t)}else{if(t.velocity.y>0&&t.position.y<=a.height+r||t.velocity.y<0&&t.position.y>=-r||t.velocity.x>0&&t.position.x<=a.width+r||t.velocity.x<0&&t.position.x>=-r)return;tt(t.position,n.canvas.size,y.origin,r,e)||n.particles.remove(t)}}}class zs{constructor(t){this.container=t,this.modes=["out"]}update(t,e,i,s){if(!this.modes.includes(s))return;const o=this.container;switch(t.outType){case"inside":{const{x:e,y:i}=t.velocity,s=y.origin;s.length=t.moveCenter.radius,s.angle=t.velocity.angle+Math.PI,s.addTo(y.create(t.moveCenter));const{dx:n,dy:a}=D(t.position,s);if(e<=0&&n>=0||i<=0&&a>=0||e>=0&&n<=0||i>=0&&a<=0)return;t.position.x=Math.floor(M({min:0,max:o.canvas.size.width})),t.position.y=Math.floor(M({min:0,max:o.canvas.size.height}));const{dx:r,dy:c}=D(t.position,t.moveCenter);t.direction=Math.atan2(-c,-r),t.velocity.angle=t.direction;break}default:if(tt(t.position,o.canvas.size,y.origin,t.getRadius(),e))return;switch(t.outType){case"outside":{t.position.x=Math.floor(M({min:-t.moveCenter.radius,max:t.moveCenter.radius}))+t.moveCenter.x,t.position.y=Math.floor(M({min:-t.moveCenter.radius,max:t.moveCenter.radius}))+t.moveCenter.y;const{dx:e,dy:i}=D(t.position,t.moveCenter);t.moveCenter.radius&&(t.direction=Math.atan2(i,e),t.velocity.angle=t.direction);break}case"normal":{const 
i=t.options.move.warp,s=o.canvas.size,n={bottom:s.height+t.getRadius()+t.offset.y,left:-t.getRadius()-t.offset.x,right:s.width+t.getRadius()+t.offset.x,top:-t.getRadius()-t.offset.y},a=t.getRadius(),r=it(t.position,a);"right"===e&&r.left>s.width+t.offset.x?(t.position.x=n.left,t.initialPosition.x=t.position.x,i||(t.position.y=_()*s.height,t.initialPosition.y=t.position.y)):"left"===e&&r.right<-t.offset.x&&(t.position.x=n.right,t.initialPosition.x=t.position.x,i||(t.position.y=_()*s.height,t.initialPosition.y=t.position.y)),"bottom"===e&&r.top>s.height+t.offset.y?(i||(t.position.x=_()*s.width,t.initialPosition.x=t.position.x),t.position.y=n.top,t.initialPosition.y=t.position.y):"top"===e&&r.bottom<-t.offset.y&&(i||(t.position.x=_()*s.width,t.initialPosition.x=t.position.x),t.position.y=n.bottom,t.initialPosition.y=t.position.y);break}}}}}class Ms{constructor(t){this.container=t,this._updateOutMode=(t,e,i,s)=>{for(const o of this.updaters)o.update(t,s,e,i)},this.updaters=[new xs(t),new _s(t),new zs(t),new ks(t)]}init(){}isEnabled(t){return!t.destroyed&&!t.spawning}update(t,e){const i=t.options.move.outModes;this._updateOutMode(t,e,i.bottom??i.default,"bottom"),this._updateOutMode(t,e,i.left??i.default,"left"),this._updateOutMode(t,e,i.right??i.default,"right"),this._updateOutMode(t,e,i.top??i.default,"top")}}class Cs{init(t){const e=t.container,i=t.options.size.animation;i.enable&&(t.size.velocity=(t.retina.sizeAnimationSpeed??e.retina.sizeAnimationSpeed)/100*e.retina.reduceFactor,i.sync||(t.size.velocity*=_()))}isEnabled(t){return!t.destroyed&&!t.spawning&&t.size.enable&&((t.size.maxLoops??0)<=0||(t.size.maxLoops??0)>0&&(t.size.loops??0)<(t.size.maxLoops??0))}reset(t){t.size.loops=0}update(t,e){this.isEnabled(t)&&function(t,e){const i=t.size;if(t.destroyed||!i||!i.enable||(i.maxLoops??0)>0&&(i.loops??0)>(i.maxLoops??0))return;const 
s=(i.velocity??0)*e.factor,o=i.min,n=i.max,a=i.decay??1;if(i.time||(i.time=0),(i.delayTime??0)>0&&i.time<(i.delayTime??0)&&(i.time+=e.value),!((i.delayTime??0)>0&&i.time<(i.delayTime??0))){switch(i.status){case"increasing":i.value>=n?(i.status="decreasing",i.loops||(i.loops=0),i.loops++):i.value+=s;break;case"decreasing":i.value<=o?(i.status="increasing",i.loops||(i.loops=0),i.loops++):i.value-=s}i.velocity&&1!==a&&(i.velocity*=a),function(t,e,i,s){switch(t.options.size.animation.destroy){case"max":e>=s&&t.destroy();break;case"min":e<=i&&t.destroy()}}(t,i.value,o,n),t.destroyed||(i.value=k(i.value,o,n))}}(t,e)}}async function Ps(t,e=!0){await async function(t,e=!0){await t.addMover("base",(()=>new ys),e)}(t,!1),await async function(t,e=!0){await t.addShape("circle",new ms,e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("color",(t=>new bs(t)),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("opacity",(t=>new ws(t)),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("outModes",(t=>new Ms(t)),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("size",(()=>new Cs),e)}(t,!1),await t.refresh(e)}const Os=["emoji"],Ss='"Twemoji Mozilla", Apple Color Emoji, "Segoe UI Emoji", "Noto Color Emoji", "EmojiOne Color"';class Ds{constructor(){this._emojiShapeDict=new Map}destroy(){for(const[,t]of this._emojiShapeDict)t instanceof ImageBitmap&&t?.close()}draw(t){const{context:e,particle:i,radius:s,opacity:o}=t,n=i.emojiData;n&&(e.globalAlpha=o,e.drawImage(n,-s,-s,2*s,2*s),e.globalAlpha=1)}async init(t){const e=t.actualOptions;if(Os.find((t=>Z(t,e.particles.shape.type)))){const t=[Q(Ss)],i=Os.map((t=>e.particles.shape.options[t])).find((t=>!!t));i&&dt(i,(e=>{e.font&&t.push(Q(e.font))})),await Promise.all(t)}}particleDestroy(t){delete t.emojiData}particleInit(t,e){if(!e.emojiData){const t=e.shapeData;if(!t?.value)return;const i=ut(t.value,e.randomIndexData),s=t.font??Ss;if(!i)return;const 
o=`${i}_${s}`,n=this._emojiShapeDict.get(o);if(n)return void(e.emojiData=n);const a=2*O(e.size.value);let r;if("undefined"!=typeof OffscreenCanvas){const t=new OffscreenCanvas(a,a),o=t.getContext("2d");if(!o)return;o.font=`400 ${2*O(e.size.value)}px ${s}`,o.textBaseline="middle",o.textAlign="center",o.fillText(i,O(e.size.value),O(e.size.value)),r=t.transferToImageBitmap()}else{const t=document.createElement("canvas");t.width=a,t.height=a;const o=t.getContext("2d");if(!o)return;o.font=`400 ${2*O(e.size.value)}px ${s}`,o.textBaseline="middle",o.textAlign="center",o.fillText(i,O(e.size.value),O(e.size.value)),r=t}this._emojiShapeDict.set(o,r),e.emojiData=r}}}class Ts{constructor(){this.distance=200,this.duration=.4,this.easing="ease-out-quad",this.factor=1,this.maxSpeed=50,this.speed=1}load(t){t&&(void 0!==t.distance&&(this.distance=t.distance),void 0!==t.duration&&(this.duration=t.duration),void 0!==t.easing&&(this.easing=t.easing),void 0!==t.factor&&(this.factor=t.factor),void 0!==t.maxSpeed&&(this.maxSpeed=t.maxSpeed),void 0!==t.speed&&(this.speed=t.speed))}}const Rs="attract";class Es extends Si{constructor(t,e){super(e),this._clickAttract=()=>{const t=this.container;t.attract||(t.attract={particles:[]});const{attract:e}=t;if(e.finish||(e.count||(e.count=0),e.count++,e.count===t.particles.count&&(e.finish=!0)),e.clicking){const e=t.interactivity.mouse.clickPosition,i=t.retina.attractModeDistance;if(!i||i<0||!e)return;this._processAttract(e,i,new yi(e.x,e.y,i))}else!1===e.clicking&&(e.particles=[])},this._hoverAttract=()=>{const t=this.container,e=t.interactivity.mouse.position,i=t.retina.attractModeDistance;!i||i<0||!e||this._processAttract(e,i,new yi(e.x,e.y,i))},this._processAttract=(t,e,i)=>{const s=this.container,o=s.actualOptions.interactivity.modes.attract;if(!o)return;const n=s.particles.quadTree.query(i,(t=>this.isEnabled(t)));for(const i of 
n){const{dx:s,dy:n,distance:a}=D(i.position,t),r=o.speed*o.factor,c=k(w(o.easing)(1-a/e)*r,0,o.maxSpeed),l=y.create(0===a?r:s/a*c,0===a?r:n/a*c);i.position.subFrom(l)}},this._engine=t,e.attract||(e.attract={particles:[]}),this.handleClickMode=t=>{const i=this.container.actualOptions.interactivity.modes.attract;if(i&&t===Rs){e.attract||(e.attract={particles:[]}),e.attract.clicking=!0,e.attract.count=0;for(const t of e.attract.particles)this.isEnabled(t)&&t.velocity.setTo(t.initialVelocity);e.attract.particles=[],e.attract.finish=!1,setTimeout((()=>{e.destroyed||(e.attract||(e.attract={particles:[]}),e.attract.clicking=!1)}),1e3*i.duration)}}}clear(){}init(){const t=this.container,e=t.actualOptions.interactivity.modes.attract;e&&(t.retina.attractModeDistance=e.distance*t.retina.pixelRatio)}async interact(){const t=this.container,e=t.actualOptions,i=t.interactivity.status===r,s=e.interactivity.events,o=s.onHover.enable,n=s.onHover.mode,a=s.onClick.enable,c=s.onClick.mode;i&&o&&Z(Rs,n)?this._hoverAttract():a&&Z(Rs,c)&&this._clickAttract()}isEnabled(t){const e=this.container,i=e.actualOptions,s=e.interactivity.mouse,o=(t?.interactivity??i.interactivity).events;if(!(s.position&&o.onHover.enable||s.clickPosition&&o.onClick.enable))return!1;const n=o.onHover.mode,a=o.onClick.mode;return Z(Rs,n)||Z(Rs,a)}loadModeOptions(t,...e){t.attract||(t.attract=new Ts);for(const i of e)t.attract.load(i?.attract)}reset(){}}class Is{constructor(){this.distance=200}load(t){t&&void 0!==t.distance&&(this.distance=t.distance)}}const Ls="bounce";class As extends Si{constructor(t){super(t),this._processBounce=(t,e,i)=>{const s=this.container.particles.quadTree.query(i,(t=>this.isEnabled(t)));for(const o of s)i instanceof yi?lt(ct(o),{position:t,radius:e,mass:e**2*Math.PI/2,velocity:y.origin,factor:y.origin}):i instanceof vi&&ht(o,it(t,e))},this._processMouseBounce=()=>{const 
t=this.container,e=10*t.retina.pixelRatio,i=t.interactivity.mouse.position,s=t.retina.bounceModeDistance;!s||s<0||!i||this._processBounce(i,s,new yi(i.x,i.y,s+e))},this._singleSelectorBounce=(t,e)=>{const i=this.container,s=document.querySelectorAll(t);s.length&&s.forEach((t=>{const s=t,o=i.retina.pixelRatio,n={x:(s.offsetLeft+s.offsetWidth/2)*o,y:(s.offsetTop+s.offsetHeight/2)*o},a=s.offsetWidth/2*o,r=10*o,c="circle"===e.type?new yi(n.x,n.y,a+r):new vi(s.offsetLeft*o-r,s.offsetTop*o-r,s.offsetWidth*o+2*r,s.offsetHeight*o+2*r);this._processBounce(n,a,c)}))}}clear(){}init(){const t=this.container,e=t.actualOptions.interactivity.modes.bounce;e&&(t.retina.bounceModeDistance=e.distance*t.retina.pixelRatio)}async interact(){const t=this.container,e=t.actualOptions.interactivity.events,i=t.interactivity.status===r,s=e.onHover.enable,o=e.onHover.mode,n=e.onDiv;i&&s&&Z(Ls,o)?this._processMouseBounce():nt(Ls,n,((t,e)=>this._singleSelectorBounce(t,e)))}isEnabled(t){const e=this.container,i=e.actualOptions,s=e.interactivity.mouse,o=(t?.interactivity??i.interactivity).events,n=o.onDiv;return s.position&&o.onHover.enable&&Z(Ls,o.onHover.mode)||ot(Ls,n)}loadModeOptions(t,...e){t.bounce||(t.bounce=new Is);for(const i of e)t.bounce.load(i?.bounce)}reset(){}}class Fs{constructor(){this.distance=200,this.duration=.4,this.mix=!1}load(t){if(t){if(void 0!==t.distance&&(this.distance=t.distance),void 0!==t.duration&&(this.duration=t.duration),void 0!==t.mix&&(this.mix=t.mix),void 0!==t.opacity&&(this.opacity=t.opacity),void 0!==t.color){const e=kt(this.color)?void 0:this.color;this.color=dt(t.color,(t=>ce.create(e,t)))}void 0!==t.size&&(this.size=t.size)}}}class Bs extends Fs{constructor(){super(),this.selectors=[]}load(t){super.load(t),t&&void 0!==t.selectors&&(this.selectors=t.selectors)}}class qs extends Fs{load(t){super.load(t),t&&(this.divs=dt(t.divs,(t=>{const e=new Bs;return e.load(t),e})))}}function Hs(t,e,i,s){if(e>=i){return k(t+(e-i)*s,t,e)}if(e{const 
t=this.container,e=t.actualOptions,i=t.interactivity.mouse.clickPosition,s=e.interactivity.modes.bubble;if(!s||!i)return;t.bubble||(t.bubble={});const o=t.retina.bubbleModeDistance;if(!o||o<0)return;const n=t.particles.quadTree.queryCircle(i,o,(t=>this.isEnabled(t))),{bubble:a}=t;for(const e of n){if(!a.clicking)continue;e.bubble.inRange=!a.durationEnd;const n=T(e.getPosition(),i),r=((new Date).getTime()-(t.interactivity.mouse.clickTime||0))/1e3;r>s.duration&&(a.durationEnd=!0),r>2*s.duration&&(a.clicking=!1,a.durationEnd=!1);const c={bubbleObj:{optValue:t.retina.bubbleModeSize,value:e.bubble.radius},particlesObj:{optValue:O(e.options.size.value)*t.retina.pixelRatio,value:e.size.value},type:"size"};this._process(e,n,r,c);const l={bubbleObj:{optValue:s.opacity,value:e.bubble.opacity},particlesObj:{optValue:O(e.options.opacity.value),value:e.opacity?.value??1},type:"opacity"};this._process(e,n,r,l),!a.durationEnd&&n<=o?this._hoverBubbleColor(e,n):delete e.bubble.color}},this._hoverBubble=()=>{const t=this.container,e=t.interactivity.mouse.position,i=t.retina.bubbleModeDistance;if(!i||i<0||void 0===e)return;const s=t.particles.quadTree.queryCircle(e,i,(t=>this.isEnabled(t)));for(const o of s){o.bubble.inRange=!0;const s=T(o.getPosition(),e),a=1-s/i;s<=i?a>=0&&t.interactivity.status===r&&(this._hoverBubbleSize(o,a),this._hoverBubbleOpacity(o,a),this._hoverBubbleColor(o,a)):this.reset(o),t.interactivity.status===n&&this.reset(o)}},this._hoverBubbleColor=(t,e,i)=>{const s=this.container.actualOptions,o=i??s.interactivity.modes.bubble;if(o){if(!t.bubble.finalColor){const e=o.color;if(!e)return;const i=ut(e);t.bubble.finalColor=Rt(i)}if(t.bubble.finalColor)if(o.mix){t.bubble.color=void 0;const i=t.getFillColor();t.bubble.color=i?Et(Vt(i,t.bubble.finalColor,1-e,e)):t.bubble.finalColor}else t.bubble.color=t.bubble.finalColor}},this._hoverBubbleOpacity=(t,e,i)=>{const s=this.container.actualOptions,o=i?.opacity??s.interactivity.modes.bubble?.opacity;if(!o)return;const 
n=t.options.opacity.value,a=Hs(t.opacity?.value??1,o,O(n),e);void 0!==a&&(t.bubble.opacity=a)},this._hoverBubbleSize=(t,e,i)=>{const s=this.container,o=i?.size?i.size*s.retina.pixelRatio:s.retina.bubbleModeSize;if(void 0===o)return;const n=O(t.options.size.value)*s.retina.pixelRatio,a=Hs(t.size.value,o,n,e);void 0!==a&&(t.bubble.radius=a)},this._process=(t,e,i,s)=>{const o=this.container,n=s.bubbleObj.optValue,a=o.actualOptions.interactivity.modes.bubble;if(!a||void 0===n)return;const r=a.duration,c=o.retina.bubbleModeDistance,l=s.particlesObj.optValue,h=s.bubbleObj.value,d=s.particlesObj.value||0,u=s.type;if(c&&!(c<0)&&n!==l)if(o.bubble||(o.bubble={}),o.bubble.durationEnd)h&&("size"===u&&delete t.bubble.radius,"opacity"===u&&delete t.bubble.opacity);else if(e<=c){if((h??d)!==n){const e=d-i*(d-n)/r;"size"===u&&(t.bubble.radius=e),"opacity"===u&&(t.bubble.opacity=e)}}else"size"===u&&delete t.bubble.radius,"opacity"===u&&delete t.bubble.opacity},this._singleSelectorHover=(t,e,i)=>{const s=this.container,o=document.querySelectorAll(e),n=s.actualOptions.interactivity.modes.bubble;n&&o.length&&o.forEach((e=>{const o=e,a=s.retina.pixelRatio,r={x:(o.offsetLeft+o.offsetWidth/2)*a,y:(o.offsetTop+o.offsetHeight/2)*a},c=o.offsetWidth/2*a,l="circle"===i.type?new yi(r.x,r.y,c):new vi(o.offsetLeft*a,o.offsetTop*a,o.offsetWidth*a,o.offsetHeight*a),h=s.particles.quadTree.query(l,(t=>this.isEnabled(t)));for(const e of h){if(!l.contains(e.getPosition()))continue;e.bubble.inRange=!0;const i=rt(n.divs,o);e.bubble.div&&e.bubble.div===o||(this.clear(e,t,!0),e.bubble.div=o),this._hoverBubbleSize(e,1,i),this._hoverBubbleOpacity(e,1,i),this._hoverBubbleColor(e,1,i)}}))},t.bubble||(t.bubble={}),this.handleClickMode=e=>{e===Vs&&(t.bubble||(t.bubble={}),t.bubble.clicking=!0)}}clear(t,e,i){t.bubble.inRange&&!i||(delete t.bubble.div,delete t.bubble.opacity,delete t.bubble.radius,delete t.bubble.color)}init(){const 
t=this.container,e=t.actualOptions.interactivity.modes.bubble;e&&(t.retina.bubbleModeDistance=e.distance*t.retina.pixelRatio,void 0!==e.size&&(t.retina.bubbleModeSize=e.size*t.retina.pixelRatio))}async interact(t){const e=this.container.actualOptions.interactivity.events,i=e.onHover,s=e.onClick,o=i.enable,n=i.mode,a=s.enable,r=s.mode,c=e.onDiv;o&&Z(Vs,n)?this._hoverBubble():a&&Z(Vs,r)?this._clickBubble():nt(Vs,c,((e,i)=>this._singleSelectorHover(t,e,i)))}isEnabled(t){const e=this.container,i=e.actualOptions,s=e.interactivity.mouse,o=(t?.interactivity??i.interactivity).events,{onClick:n,onDiv:a,onHover:r}=o,c=ot(Vs,a);return!!(c||r.enable&&s.position||n.enable&&s.clickPosition)&&(Z(Vs,r.mode)||Z(Vs,n.mode)||c)}loadModeOptions(t,...e){t.bubble||(t.bubble=new qs);for(const i of e)t.bubble.load(i?.bubble)}reset(t){t.bubble.inRange=!1}}class Ws{constructor(){this.opacity=.5}load(t){t&&void 0!==t.opacity&&(this.opacity=t.opacity)}}class $s{constructor(){this.distance=80,this.links=new Ws,this.radius=60}load(t){t&&(void 0!==t.distance&&(this.distance=t.distance),this.links.load(t.links),void 0!==t.radius&&(this.radius=t.radius))}}function js(t,e,i,s){const o=t.actualOptions.interactivity.modes.connect;if(o)return function(t,e,i,s){const o=Math.floor(i.getRadius()/e.getRadius()),n=e.getFillColor(),a=i.getFillColor();if(!n||!a)return;const r=e.getPosition(),c=i.getPosition(),l=Vt(n,a,e.getRadius(),i.getRadius()),h=t.createLinearGradient(r.x,r.y,c.x,c.y);return h.addColorStop(0,Ht(n,s)),h.addColorStop(o>1?1:o,qt(l,s)),h.addColorStop(1,Ht(a,s)),h}(e,i,s,o.links.opacity)}function Gs(t,e,i){t.canvas.draw((s=>{const o=js(t,s,e,i);if(!o)return;const n=e.getPosition(),a=i.getPosition();!function(t,e,i,s,o){Nt(t,s,o),t.lineWidth=e,t.strokeStyle=i,t.stroke()}(s,e.retina.linksWidth??0,o,n,a)}))}class Ns extends Si{constructor(t){super(t)}clear(){}init(){const 
t=this.container,e=t.actualOptions.interactivity.modes.connect;e&&(t.retina.connectModeDistance=e.distance*t.retina.pixelRatio,t.retina.connectModeRadius=e.radius*t.retina.pixelRatio)}async interact(){const t=this.container;if(t.actualOptions.interactivity.events.onHover.enable&&"pointermove"===t.interactivity.status){const e=t.interactivity.mouse.position;if(!t.retina.connectModeDistance||t.retina.connectModeDistance<0||!t.retina.connectModeRadius||t.retina.connectModeRadius<0||!e)return;const i=Math.abs(t.retina.connectModeRadius),s=t.particles.quadTree.queryCircle(e,i,(t=>this.isEnabled(t)));let o=0;for(const e of s){const i=e.getPosition();for(const n of s.slice(o+1)){const s=n.getPosition(),o=Math.abs(t.retina.connectModeDistance),a=Math.abs(i.x-s.x),r=Math.abs(i.y-s.y);a{const n=e.getPosition();!function(t,e,i,s,o,n){Nt(t,i,s),t.strokeStyle=qt(o,n),t.lineWidth=e,t.stroke()}(t,e.retina.linksWidth??0,n,o,i,s)}))}class Qs extends Si{constructor(t){super(t)}clear(){}init(){const t=this.container,e=t.actualOptions.interactivity.modes.grab;e&&(t.retina.grabModeDistance=e.distance*t.retina.pixelRatio)}async interact(){const t=this.container,e=t.actualOptions.interactivity;if(!e.modes.grab||!e.events.onHover.enable||t.interactivity.status!==r)return;const i=t.interactivity.mouse.position;if(!i)return;const s=t.retina.grabModeDistance;if(!s||s<0)return;const o=t.particles.quadTree.queryCircle(i,s,(t=>this.isEnabled(t)));for(const n of o){const o=T(n.getPosition(),i);if(o>s)continue;const a=e.modes.grab.links,r=a.opacity,c=r-o*r/s;if(c<=0)continue;const l=a.color??n.options.links?.color;if(!t.particles.grabLineColor&&l){const i=e.modes.grab.links;t.particles.grabLineColor=Wt(l,i.blink,i.consent)}const h=Ut(n,void 0,t.particles.grabLineColor);h&&Zs(t,n,h,c,i)}}isEnabled(t){const e=this.container,i=e.interactivity.mouse,s=(t?.interactivity??e.actualOptions.interactivity).events;return 
s.onHover.enable&&!!i.position&&Z("grab",s.onHover.mode)}loadModeOptions(t,...e){t.grab||(t.grab=new Ys);for(const i of e)t.grab.load(i?.grab)}reset(){}}class Js extends Si{constructor(t){super(t),this.handleClickMode=t=>{if("pause"!==t)return;const e=this.container;e.getAnimationStatus()?e.pause():e.play()}}clear(){}init(){}async interact(){}isEnabled(){return!0}reset(){}}class Ks{constructor(){this.default=!0,this.groups=[],this.quantity=4}load(t){if(!t)return;void 0!==t.default&&(this.default=t.default),void 0!==t.groups&&(this.groups=t.groups.map((t=>t))),this.groups.length||(this.default=!0);const e=t.quantity;void 0!==e&&(this.quantity=S(e))}}class to extends Si{constructor(t){super(t),this.handleClickMode=t=>{if("push"!==t)return;const e=this.container,i=e.actualOptions.interactivity.modes.push;if(!i)return;const s=C(i.quantity);if(s<=0)return;const o=K([void 0,...i.groups]),n=void 0!==o?e.actualOptions.particles.groups[o]:void 0;e.particles.push(s,e.interactivity.mouse,n,o)}}clear(){}init(){}async interact(){}isEnabled(){return!0}loadModeOptions(t,...e){t.push||(t.push=new Ks);for(const i of e)t.push.load(i?.push)}reset(){}}class eo{constructor(){this.quantity=2}load(t){if(!t)return;const e=t.quantity;void 0!==e&&(this.quantity=S(e))}}class io extends Si{constructor(t){super(t),this.handleClickMode=t=>{const e=this.container,i=e.actualOptions;if(!i.interactivity.modes.remove||"remove"!==t)return;const s=C(i.interactivity.modes.remove.quantity);e.particles.removeQuantity(s)}}clear(){}init(){}async interact(){}isEnabled(){return!0}loadModeOptions(t,...e){t.remove||(t.remove=new eo);for(const i of e)t.remove.load(i?.remove)}reset(){}}class so{constructor(){this.distance=200,this.duration=.4,this.factor=100,this.speed=1,this.maxSpeed=50,this.easing="ease-out-quad"}load(t){t&&(void 0!==t.distance&&(this.distance=t.distance),void 0!==t.duration&&(this.duration=t.duration),void 0!==t.easing&&(this.easing=t.easing),void 0!==t.factor&&(this.factor=t.factor),void 
0!==t.speed&&(this.speed=t.speed),void 0!==t.maxSpeed&&(this.maxSpeed=t.maxSpeed))}}class oo extends so{constructor(){super(),this.selectors=[]}load(t){super.load(t),t&&void 0!==t.selectors&&(this.selectors=t.selectors)}}class no extends so{load(t){super.load(t),t&&(this.divs=dt(t.divs,(t=>{const e=new oo;return e.load(t),e})))}}const ao="repulse";class ro extends Si{constructor(t,e){super(e),this._clickRepulse=()=>{const t=this.container,e=t.actualOptions.interactivity.modes.repulse;if(!e)return;const i=t.repulse||{particles:[]};if(i.finish||(i.count||(i.count=0),i.count++,i.count===t.particles.count&&(i.finish=!0)),i.clicking){const s=t.retina.repulseModeDistance;if(!s||s<0)return;const o=Math.pow(s/6,3),n=t.interactivity.mouse.clickPosition;if(void 0===n)return;const a=new yi(n.x,n.y,o),r=t.particles.quadTree.query(a,(t=>this.isEnabled(t)));for(const t of r){const{dx:s,dy:a,distance:r}=D(n,t.position),c=r**2,l=-o*e.speed/c;if(c<=o){i.particles.push(t);const e=y.create(s,a);e.length=l,t.velocity.setTo(e)}}}else if(!1===i.clicking){for(const t of i.particles)t.velocity.setTo(t.initialVelocity);i.particles=[]}},this._hoverRepulse=()=>{const t=this.container,e=t.interactivity.mouse.position,i=t.retina.repulseModeDistance;!i||i<0||!e||this._processRepulse(e,i,new yi(e.x,e.y,i))},this._processRepulse=(t,e,i,s)=>{const o=this.container,n=o.particles.quadTree.query(i,(t=>this.isEnabled(t))),a=o.actualOptions.interactivity.modes.repulse;if(!a)return;const{easing:r,speed:c,factor:l,maxSpeed:h}=a,d=w(r),u=(s?.speed??c)*l;for(const i of n){const{dx:s,dy:o,distance:n}=D(i.position,t),a=k(d(1-n/e)*u,0,h),r=y.create(0===n?u:s/n*a,0===n?u:o/n*a);i.position.addTo(r)}},this._singleSelectorRepulse=(t,e)=>{const i=this.container,s=i.actualOptions.interactivity.modes.repulse;if(!s)return;const o=document.querySelectorAll(t);o.length&&o.forEach((t=>{const 
o=t,n=i.retina.pixelRatio,a={x:(o.offsetLeft+o.offsetWidth/2)*n,y:(o.offsetTop+o.offsetHeight/2)*n},r=o.offsetWidth/2*n,c="circle"===e.type?new yi(a.x,a.y,r):new vi(o.offsetLeft*n,o.offsetTop*n,o.offsetWidth*n,o.offsetHeight*n),l=rt(s.divs,o);this._processRepulse(a,r,c,l)}))},this._engine=t,e.repulse||(e.repulse={particles:[]}),this.handleClickMode=t=>{const i=this.container.actualOptions.interactivity.modes.repulse;if(!i||t!==ao)return;e.repulse||(e.repulse={particles:[]});const s=e.repulse;s.clicking=!0,s.count=0;for(const t of e.repulse.particles)this.isEnabled(t)&&t.velocity.setTo(t.initialVelocity);s.particles=[],s.finish=!1,setTimeout((()=>{e.destroyed||(s.clicking=!1)}),1e3*i.duration)}}clear(){}init(){const t=this.container,e=t.actualOptions.interactivity.modes.repulse;e&&(t.retina.repulseModeDistance=e.distance*t.retina.pixelRatio)}async interact(){const t=this.container,e=t.actualOptions,i=t.interactivity.status===r,s=e.interactivity.events,o=s.onHover,n=o.enable,a=o.mode,c=s.onClick,l=c.enable,h=c.mode,d=s.onDiv;i&&n&&Z(ao,a)?this._hoverRepulse():l&&Z(ao,h)?this._clickRepulse():nt(ao,d,((t,e)=>this._singleSelectorRepulse(t,e)))}isEnabled(t){const e=this.container,i=e.actualOptions,s=e.interactivity.mouse,o=(t?.interactivity??i.interactivity).events,n=o.onDiv,a=o.onHover,r=o.onClick,c=ot(ao,n);if(!(c||a.enable&&s.position||r.enable&&s.clickPosition))return!1;const l=a.mode,h=r.mode;return Z(ao,l)||Z(ao,h)||c}loadModeOptions(t,...e){t.repulse||(t.repulse=new no);for(const i of e)t.repulse.load(i?.repulse)}reset(){}}class co{constructor(){this.factor=3,this.radius=200}load(t){t&&(void 0!==t.factor&&(this.factor=t.factor),void 0!==t.radius&&(this.radius=t.radius))}}class lo extends Si{constructor(t){super(t)}clear(t,e,i){t.slow.inRange&&!i||(t.slow.factor=1)}init(){const t=this.container,e=t.actualOptions.interactivity.modes.slow;e&&(t.retina.slowModeRadius=e.radius*t.retina.pixelRatio)}async interact(){}isEnabled(t){const 
e=this.container,i=e.interactivity.mouse,s=(t?.interactivity??e.actualOptions.interactivity).events;return s.onHover.enable&&!!i.position&&Z("slow",s.onHover.mode)}loadModeOptions(t,...e){t.slow||(t.slow=new co);for(const i of e)t.slow.load(i?.slow)}reset(t){t.slow.inRange=!1;const e=this.container,i=e.actualOptions,s=e.interactivity.mouse.position,o=e.retina.slowModeRadius,n=i.interactivity.modes.slow;if(!n||!o||o<0||!s)return;const a=T(s,t.getPosition()),r=a/o,c=n.factor,{slow:l}=t;a>o||(l.inRange=!0,l.factor=r/c)}}const ho=[0,4,2,1],uo=[8,8,4,2];class po{constructor(t){this.pos=0,this.data=new Uint8ClampedArray(t)}getString(t){const e=this.data.slice(this.pos,this.pos+t);return this.pos+=e.length,e.reduce(((t,e)=>t+String.fromCharCode(e)),"")}nextByte(){return this.data[this.pos++]}nextTwoBytes(){return this.pos+=2,this.data[this.pos-2]+(this.data[this.pos-1]<<8)}readSubBlocks(){let t="",e=0;do{e=this.data[this.pos++];for(let i=e;--i>=0;t+=String.fromCharCode(this.data[this.pos++]));}while(0!==e);return t}readSubBlocksBin(){let t=0,e=0;for(let i=0;0!==(t=this.data[this.pos+i]);i+=t+1)e+=t;const i=new Uint8Array(e);for(let e=0;0!==(t=this.data[this.pos++]);)for(let s=t;--s>=0;i[e++]=this.data[this.pos++]);return i}skipSubBlocks(){for(;0!==this.data[this.pos];this.pos+=this.data[this.pos]+1);this.pos++}}function fo(t,e){const i=[];for(let s=0;s>>3;const h=1<<1+(7&r);c&&(a.localColorTable=fo(t,h));const d=t=>{const{r:s,g:n,b:r}=(c?a.localColorTable:e.globalColorTable)[t];return{r:s,g:n,b:r,a:t===o(null)?i?~~((s+n+r)/3):0:255}},u=(()=>{try{return new ImageData(a.width,a.height,{colorSpace:"srgb"})}catch(t){if(t instanceof DOMException&&"IndexSizeError"===t.name)return null;throw t}})();if(null==u)throw new EvalError("GIF frame size is to large");const p=t.nextByte(),f=t.readSubBlocksBin(),v=1<{const i=t>>>3,s=7&t;return(f[i]+(f[i+1]<<8)+(f[i+2]<<16)&(1<>>s};if(l){for(let 
i=0,o=p+1,r=0,c=[[0]],l=0;l<4;l++){if(ho[l]=c.length?c.push(c[s].concat(c[s][0])):s!==v&&c.push(c[s].concat(c[i][0]));for(let s=0;s=a.height))break}n?.(t.pos/(t.data.length-1),s(!1)+1,u,{x:a.left,y:a.top},{width:e.width,height:e.height})}a.image=u,a.bitmap=await createImageBitmap(u)}else{for(let t=0,e=p+1,i=0,s=[[0]],o=-4;;){const n=t;if(t=y(i,e),i+=e,t===v){e=p+1,s.length=v+2;for(let t=0;t=s.length?s.push(s[n].concat(s[n][0])):n!==v&&s.push(s[n].concat(s[t][0]));for(let e=0;e=1<>>5,o.disposalMethod=(28&n)>>>2,o.userInputDelayFlag=2==(2&n);const a=1==(1&n);o.delayTime=10*t.nextTwoBytes();const r=t.nextByte();a&&s(r),t.pos++;break}case 255:{t.pos++;const i={identifier:t.getString(8),authenticationCode:t.getString(3),data:t.readSubBlocksBin()};e.applicationExtensions.push(i);break}case 254:e.comments.push([i(!1),t.readSubBlocks()]);break;case 1:if(0===e.globalColorTable.length)throw new EvalError("plain text extension without global color table");t.pos++,e.frames[i(!1)].plainTextData={left:t.nextTwoBytes(),top:t.nextTwoBytes(),width:t.nextTwoBytes(),height:t.nextTwoBytes(),charSize:{width:t.nextTwoBytes(),height:t.nextTwoBytes()},foregroundColor:t.nextByte(),backgroundColor:t.nextByte(),text:t.readSubBlocks()};break;default:t.skipSubBlocks()}}(t,e,s,o);break;default:throw new EvalError("undefined block found")}return!1}const yo=/(#(?:[0-9a-f]{2}){2,4}|(#[0-9a-f]{3})|(rgb|hsl)a?\((-?\d+%?[,\s]+){2,3}\s*[\d.]+%?\))|currentcolor/gi;async function mo(t){return new Promise((e=>{t.loading=!0;const i=new Image;t.element=i,i.addEventListener("load",(()=>{t.loading=!1,e()})),i.addEventListener("error",(()=>{t.element=void 0,t.error=!0,t.loading=!1,W().error(`${f} loading image: ${t.source}`),e()})),i.src=t.source}))}async function go(t){if("gif"===t.type){t.loading=!0;try{t.gifData=await async function(t,e,i){i||(i=!1);const s=await fetch(t);if(!s.ok&&404===s.status)throw new EvalError("file not found");const o=await 
s.arrayBuffer(),n={width:0,height:0,totalTime:0,colorRes:0,pixelAspectRatio:0,frames:[],sortFlag:!1,globalColorTable:[],backgroundImage:new ImageData(1,1,{colorSpace:"srgb"}),comments:[],applicationExtensions:[]},a=new po(new Uint8ClampedArray(o));if("GIF89a"!==a.getString(6))throw new Error("not a supported GIF file");n.width=a.nextTwoBytes(),n.height=a.nextTwoBytes();const r=a.nextByte(),c=128==(128&r);n.colorRes=(112&r)>>>4,n.sortFlag=8==(8&r);const l=1<<1+(7&r),h=a.nextByte();n.pixelAspectRatio=a.nextByte(),0!==n.pixelAspectRatio&&(n.pixelAspectRatio=(n.pixelAspectRatio+15)/64),c&&(n.globalColorTable=fo(a,l));const d=(()=>{try{return new ImageData(n.width,n.height,{colorSpace:"srgb"})}catch(t){if(t instanceof DOMException&&"IndexSizeError"===t.name)return null;throw t}})();if(null==d)throw new Error("GIF frame size is to large");const{r:u,g:p,b:f}=n.globalColorTable[h];d.data.set(c?[u,p,f,255]:[0,0,0,0]);for(let t=4;t(t&&(y=!0),v),b=t=>(null!=t&&(m=t),m);try{do{y&&(n.frames.push({left:0,top:0,width:0,height:0,disposalMethod:0,image:new ImageData(1,1,{colorSpace:"srgb"}),plainTextData:null,userInputDelayFlag:!1,delayTime:0,sortFlag:!1,localColorTable:[],reserved:0,GCreserved:0}),v++,m=-1,y=!1)}while(!await vo(a,n,i,g,b,e));n.frames.length--;for(const t of n.frames){if(t.userInputDelayFlag&&0===t.delayTime){n.totalTime=1/0;break}n.totalTime+=t.delayTime}return n}catch(t){if(t instanceof EvalError)throw new Error(`error while parsing frame ${v} "${t.message}"`);throw t}}(t.source),t.gifLoopCount=function(t){for(const e of t.applicationExtensions)if(e.identifier+e.authenticationCode==="NETSCAPE2.0")return e.data[1]+(e.data[2]<<8);return NaN}(t.gifData)??0,0===t.gifLoopCount&&(t.gifLoopCount=1/0)}catch{t.error=!0}t.loading=!1}else await mo(t)}async function bo(t){if("svg"!==t.type)return void await mo(t);t.loading=!0;const e=await fetch(t.source);e.ok?t.svgData=await e.text():(W().error(`${f} Image not found`),t.error=!0),t.loading=!1}function wo(t,e,i,s){const 
o=function(t,e,i){const{svgData:s}=t;if(!s)return"";const o=Ht(e,i);if(s.includes("fill"))return s.replace(yo,(()=>o));const n=s.indexOf(">");return`${s.substring(0,n)} fill="${o}"${s.substring(n)}`}(t,i,s.opacity?.value??1),n={color:i,gif:e.gif,data:{...t,svgData:o},loaded:!1,ratio:e.width/e.height,replaceColor:e.replaceColor,source:e.src};return new Promise((e=>{const i=new Blob([o],{type:"image/svg+xml"}),s=URL||window.URL||window.webkitURL||window,a=s.createObjectURL(i),r=new Image;r.addEventListener("load",(()=>{n.loaded=!0,n.element=r,e(n),s.revokeObjectURL(a)})),r.addEventListener("error",(async()=>{s.revokeObjectURL(a);const i={...t,error:!1,loading:!0};await mo(i),n.loaded=!0,n.element=i.element,e(n)})),r.src=a}))}class xo{constructor(t){this.loadImageShape=async t=>{if(!this._engine.loadImage)throw new Error(`${f} image shape not initialized`);await this._engine.loadImage({gif:t.gif,name:t.name,replaceColor:t.replaceColor??!1,src:t.src})},this._engine=t}addImage(t){this._engine.images||(this._engine.images=[]),this._engine.images.push(t)}draw(t){const{context:e,radius:i,particle:s,opacity:o,delta:n}=t,a=s.image,r=a?.element;if(a){if(e.globalAlpha=o,a.gif&&a.gifData){const t=new OffscreenCanvas(a.gifData.width,a.gifData.height),o=t.getContext("2d");if(!o)throw new Error("could not create offscreen canvas context");o.imageSmoothingQuality="low",o.imageSmoothingEnabled=!1,o.clearRect(0,0,t.width,t.height),void 0===s.gifLoopCount&&(s.gifLoopCount=a.gifLoopCount??0);let r=s.gifFrame??0;const c={x:.5*-a.gifData.width,y:.5*-a.gifData.height},l=a.gifData.frames[r];if(void 0===s.gifTime&&(s.gifTime=0),!l.bitmap)return;switch(e.scale(i/a.gifData.width,i/a.gifData.height),l.disposalMethod){case 4:case 5:case 6:case 7:case 0:o.drawImage(l.bitmap,l.left,l.top),e.drawImage(t,c.x,c.y),o.clearRect(0,0,t.width,t.height);break;case 1:o.drawImage(l.bitmap,l.left,l.top),e.drawImage(t,c.x,c.y);break;case 
2:o.drawImage(l.bitmap,l.left,l.top),e.drawImage(t,c.x,c.y),o.clearRect(0,0,t.width,t.height),0===a.gifData.globalColorTable.length?o.putImageData(a.gifData.frames[0].image,c.x+l.left,c.y+l.top):o.putImageData(a.gifData.backgroundImage,c.x,c.y);break;case 3:{const i=o.getImageData(0,0,t.width,t.height);o.drawImage(l.bitmap,l.left,l.top),e.drawImage(t,c.x,c.y),o.clearRect(0,0,t.width,t.height),o.putImageData(i,0,0)}}if(s.gifTime+=n.value,s.gifTime>l.delayTime){if(s.gifTime-=l.delayTime,++r>=a.gifData.frames.length){if(--s.gifLoopCount<=0)return;r=0,o.clearRect(0,0,t.width,t.height)}s.gifFrame=r}e.scale(a.gifData.width/i,a.gifData.height/i)}else if(r){const t=a.ratio,s={x:-i,y:-i},o=2*i;e.drawImage(r,s.x,s.y,o,o/t)}e.globalAlpha=1}}getSidesCount(){return 12}async init(t){const e=t.actualOptions;if(e.preload&&this._engine.loadImage)for(const t of e.preload)await this._engine.loadImage(t)}loadShape(t){if("image"!==t.shape&&"images"!==t.shape)return;this._engine.images||(this._engine.images=[]);const e=t.shapeData;if(!e)return;this._engine.images.find((t=>t.name===e.name||t.source===e.src))||this.loadImageShape(e).then((()=>{this.loadShape(t)}))}particleInit(t,e){if("image"!==e.shape&&"images"!==e.shape)return;this._engine.images||(this._engine.images=[]);const i=this._engine.images,s=e.shapeData;if(!s)return;const o=e.getFillColor(),n=i.find((t=>t.name===s.name||t.source===s.src));if(!n)return;const a=s.replaceColor??n.replaceColor;n.loading?setTimeout((()=>{this.particleInit(t,e)})):(async()=>{let t;t=n.svgData&&o?await wo(n,s,o,e):{color:o,data:n,element:n.element,gif:n.gif,gifData:n.gifData,gifLoopCount:n.gifLoopCount,loaded:!0,ratio:s.width&&s.height?s.width/s.height:n.ratio??1,replaceColor:a,source:s.src},t.ratio||(t.ratio=1);const i={image:t,fill:s.fill??e.shapeFill,close:s.close??e.shapeClose};e.image=i.image,e.shapeFill=i.fill,e.shapeClose=i.close})()}}class _o{constructor(){this.src="",this.gif=!1}load(t){t&&(void 0!==t.gif&&(this.gif=t.gif),void 
0!==t.height&&(this.height=t.height),void 0!==t.name&&(this.name=t.name),void 0!==t.replaceColor&&(this.replaceColor=t.replaceColor),void 0!==t.src&&(this.src=t.src),void 0!==t.width&&(this.width=t.width))}}class ko{constructor(t){this.id="imagePreloader",this._engine=t}getPlugin(){return{}}loadOptions(t,e){if(!e||!e.preload)return;t.preload||(t.preload=[]);const i=t.preload;for(const t of e.preload){const e=i.find((e=>e.name===t.name||e.src===t.src));if(e)e.load(t);else{const e=new _o;e.load(t),i.push(e)}}}needsPlugin(){return!0}}async function zo(t,e=!0){!function(t){t.loadImage||(t.loadImage=async e=>{if(!e.name&&!e.src)throw new Error(`${f} no image source provided`);if(t.images||(t.images=[]),!t.images.find((t=>t.name===e.name||t.source===e.src)))try{const i={gif:e.gif??!1,name:e.name??e.src,source:e.src,type:e.src.substring(e.src.length-3),error:!1,loading:!0,replaceColor:e.replaceColor,ratio:e.width&&e.height?e.width/e.height:void 0};t.images.push(i);const s=e.gif?go:e.replaceColor?bo:mo;await s(i)}catch{throw new Error(`${f} ${e.name??e.src} not found`)}})}(t);const i=new ko(t);await t.addPlugin(i,e),await t.addShape(["image","images"],new xo(t),e)}class Mo extends Re{constructor(){super(),this.sync=!1}load(t){t&&(super.load(t),void 0!==t.sync&&(this.sync=t.sync))}}class Co extends Re{constructor(){super(),this.sync=!1}load(t){t&&(super.load(t),void 0!==t.sync&&(this.sync=t.sync))}}class Po{constructor(){this.count=0,this.delay=new Mo,this.duration=new Co}load(t){t&&(void 0!==t.count&&(this.count=t.count),this.delay.load(t.delay),this.duration.load(t.duration))}}class Oo{constructor(t){this.container=t}init(t){const 
e=this.container,i=t.options.life;i&&(t.life={delay:e.retina.reduceFactor?C(i.delay.value)*(i.delay.sync?1:_())/e.retina.reduceFactor*1e3:0,delayTime:0,duration:e.retina.reduceFactor?C(i.duration.value)*(i.duration.sync?1:_())/e.retina.reduceFactor*1e3:0,time:0,count:i.count},t.life.duration<=0&&(t.life.duration=-1),t.life.count<=0&&(t.life.count=-1),t.life&&(t.spawning=t.life.delay>0))}isEnabled(t){return!t.destroyed}loadOptions(t,...e){t.life||(t.life=new Po);for(const i of e)t.life.load(i?.life)}update(t,e){if(!this.isEnabled(t)||!t.life)return;const i=t.life;let s=!1;if(t.spawning){if(i.delayTime+=e.value,!(i.delayTime>=t.life.delay))return;s=!0,t.spawning=!1,i.delayTime=0,i.time=0}if(-1===i.duration)return;if(t.spawning)return;if(s?i.time=0:i.time+=e.value,i.time0&&t.life.count--,0===t.life.count)return void t.destroy();const o=this.container.canvas.size,n=S(0,o.width),a=S(0,o.width);t.position.x=M(n),t.position.y=M(a),t.spawning=!0,i.delayTime=0,i.time=0,t.reset();const r=t.options.life;r&&(i.delay=1e3*C(r.delay.value),i.duration=1e3*C(r.duration.value))}}class So{draw(t){const{context:e,particle:i,radius:s}=t,o=i.shapeData;e.moveTo(-s/2,0),e.lineTo(s/2,0),e.lineCap=o?.cap??"butt"}getSidesCount(){return 1}}class Do{init(){}isEnabled(t){return!j()&&!t.destroyed&&t.container.actualOptions.interactivity.events.onHover.parallax.enable}move(t){const e=t.container,i=e.actualOptions.interactivity.events.onHover.parallax;if(j()||!i.enable)return;const s=i.force,o=e.interactivity.mouse.position;if(!o)return;const n=e.canvas.size,a=.5*n.width,r=.5*n.height,c=i.smooth,l=t.getRadius()/s,h=(o.x-a)*l,d=(o.y-r)*l,{offset:u}=t;u.x+=(h-u.x)/c,u.y+=(d-u.y)/c}}class To extends Di{constructor(t){super(t)}clear(){}init(){}async interact(t){const e=this.container;void 0===t.attractDistance&&(t.attractDistance=C(t.options.move.attract.distance)*e.retina.pixelRatio);const i=t.attractDistance,s=t.getPosition(),o=e.particles.quadTree.queryCircle(s,i);for(const e of 
o){if(t===e||!e.options.move.attract.enable||e.destroyed||e.spawning)continue;const i=e.getPosition(),{dx:o,dy:n}=D(s,i),a=t.options.move.attract.rotate,r=o/(1e3*a.x),c=n/(1e3*a.y),l=e.size.value/t.size.value,h=1/l;t.velocity.x-=r*l,t.velocity.y-=c*l,e.velocity.x+=r*h,e.velocity.y+=c*h}}isEnabled(t){return t.options.move.attract.enable}reset(){}}function Ro(t,e,i,s,o,n){const a=k(t.options.collisions.absorb.speed*o.factor/10,0,s);t.size.value+=a/2,i.size.value-=a,s<=n&&(i.size.value=0,i.destroy())}const Eo=t=>{void 0===t.collisionMaxSpeed&&(t.collisionMaxSpeed=C(t.options.collisions.maxSpeed)),t.velocity.length>t.collisionMaxSpeed&&(t.velocity.length=t.collisionMaxSpeed)};function Io(t,e){lt(ct(t),ct(e)),Eo(t),Eo(e)}function Lo(t,e,i,s){switch(t.options.collisions.mode){case"absorb":!function(t,e,i,s){const o=t.getRadius(),n=e.getRadius();void 0===o&&void 0!==n?t.destroy():void 0!==o&&void 0===n?e.destroy():void 0!==o&&void 0!==n&&(o>=n?Ro(t,0,e,n,i,s):Ro(e,0,t,o,i,s))}(t,e,i,s);break;case"bounce":Io(t,e);break;case"destroy":!function(t,e){t.unbreakable||e.unbreakable||Io(t,e),void 0===t.getRadius()&&void 0!==e.getRadius()?t.destroy():void 0!==t.getRadius()&&void 0===e.getRadius()?e.destroy():void 0!==t.getRadius()&&void 0!==e.getRadius()&&(t.getRadius()>=e.getRadius()?e:t).destroy()}(t,e)}}class Ao extends Di{constructor(t){super(t)}clear(){}init(){}async interact(t,e){if(t.destroyed||t.spawning)return;const i=this.container,s=t.getPosition(),o=t.getRadius(),n=i.particles.quadTree.queryCircle(s,2*o);for(const a of n){if(t===a||!a.options.collisions.enable||t.options.collisions.mode!==a.options.collisions.mode||a.destroyed||a.spawning)continue;const n=a.getPosition(),r=a.getRadius();if(Math.abs(Math.round(s.z)-Math.round(n.z))>o+r)continue;T(s,n)>o+r||Lo(t,a,e,i.retina.pixelRatio)}}isEnabled(t){return t.options.collisions.enable}reset(){}}class Fo extends 
yi{constructor(t,e,i,s){super(t,e,i),this.canvasSize=s,this.canvasSize={...s}}contains(t){const{width:e,height:i}=this.canvasSize,{x:s,y:o}=t;return super.contains(t)||super.contains({x:s-e,y:o})||super.contains({x:s-e,y:o-i})||super.contains({x:s,y:o-i})}intersects(t){if(super.intersects(t))return!0;const e=t,i=t,s={x:t.position.x-this.canvasSize.width,y:t.position.y-this.canvasSize.height};if(void 0!==i.radius){const t=new yi(s.x,s.y,2*i.radius);return super.intersects(t)}if(void 0!==e.size){const t=new vi(s.x,s.y,2*e.size.width,2*e.size.height);return super.intersects(t)}return!1}}class Bo{constructor(){this.blur=5,this.color=new ce,this.color.value="#000",this.enable=!1}load(t){t&&(void 0!==t.blur&&(this.blur=t.blur),this.color=ce.create(this.color,t.color),void 0!==t.enable&&(this.enable=t.enable))}}class qo{constructor(){this.enable=!1,this.frequency=1}load(t){t&&(void 0!==t.color&&(this.color=ce.create(this.color,t.color)),void 0!==t.enable&&(this.enable=t.enable),void 0!==t.frequency&&(this.frequency=t.frequency),void 0!==t.opacity&&(this.opacity=t.opacity))}}class Ho{constructor(){this.blink=!1,this.color=new ce,this.color.value="#fff",this.consent=!1,this.distance=100,this.enable=!1,this.frequency=1,this.opacity=1,this.shadow=new Bo,this.triangles=new qo,this.width=1,this.warp=!1}load(t){t&&(void 0!==t.id&&(this.id=t.id),void 0!==t.blink&&(this.blink=t.blink),this.color=ce.create(this.color,t.color),void 0!==t.consent&&(this.consent=t.consent),void 0!==t.distance&&(this.distance=t.distance),void 0!==t.enable&&(this.enable=t.enable),void 0!==t.frequency&&(this.frequency=t.frequency),void 0!==t.opacity&&(this.opacity=t.opacity),this.shadow.load(t.shadow),this.triangles.load(t.triangles),void 0!==t.width&&(this.width=t.width),void 0!==t.warp&&(this.warp=t.warp))}}function Vo(t,e,i,s,o){const{dx:n,dy:a,distance:r}=D(t,e);if(!o||r<=i)return r;const c={x:Math.abs(n),y:Math.abs(a)},l=Math.min(c.x,s.width-c.x),h=Math.min(c.y,s.height-c.y);return 
Math.sqrt(l**2+h**2)}class Uo extends Di{constructor(t){super(t),this._setColor=t=>{if(!t.options.links)return;const e=this.linkContainer,i=t.options.links;let s=void 0===i.id?e.particles.linksColor:e.particles.linksColors.get(i.id);if(s)return;s=Wt(i.color,i.blink,i.consent),void 0===i.id?e.particles.linksColor=s:e.particles.linksColors.set(i.id,s)},this.linkContainer=t}clear(){}init(){this.linkContainer.particles.linksColor=void 0,this.linkContainer.particles.linksColors=new Map}async interact(t){if(!t.options.links)return;t.links=[];const e=t.getPosition(),i=this.container,s=i.canvas.size;if(e.x<0||e.y<0||e.x>s.width||e.y>s.height)return;const o=t.options.links,n=o.opacity,a=t.retina.linksDistance??0,r=o.warp,c=r?new Fo(e.x,e.y,a,s):new yi(e.x,e.y,a),l=i.particles.quadTree.query(c);for(const i of l){const c=i.options.links;if(t===i||!c?.enable||o.id!==c.id||i.spawning||i.destroyed||!i.links||t.links.some((t=>t.destination===i))||i.links.some((e=>e.destination===t)))continue;const l=i.getPosition();if(l.x<0||l.y<0||l.x>s.width||l.y>s.height)continue;const h=Vo(e,l,a,s,r&&c.warp);if(h>a)continue;const d=(1-h/a)*n;this._setColor(t),t.links.push({destination:i,opacity:d})}}isEnabled(t){return!!t.options.links?.enable}loadParticlesOptions(t,...e){t.links||(t.links=new Ho);for(const i of e)t.links.load(i?.links)}reset(){}}function Wo(t,e){const i=((s=t.map((t=>t.id))).sort(((t,e)=>t-e)),s.join("_"));var s;let o=e.get(i);return void 0===o&&(o=_(),e.set(i,o)),o}class $o{constructor(t){this.container=t,this._drawLinkLine=(t,e)=>{const i=t.options.links;if(!i?.enable)return;const s=this.container,o=s.actualOptions,n=e.destination,a=t.getPosition(),r=n.getPosition();let c=e.opacity;s.canvas.draw((e=>{let l;const h=t.options.twinkle?.lines;if(h?.enable){const t=h.frequency,e=St(h.color);_(){const s=t.options.links;if(!s?.enable)return;const o=s.triangles;if(!o.enable)return;const 
n=this.container,a=n.actualOptions,r=e.destination,c=i.destination,l=o.opacity??(e.opacity+i.opacity)/2;l<=0||n.canvas.draw((e=>{const i=t.getPosition(),h=r.getPosition(),d=c.getPosition(),u=t.retina.linksDistance??0;if(T(i,h)>u||T(d,h)>u||T(d,i)>u)return;let p=St(o.color);if(!p){const e=void 0!==s.id?n.particles.linksColors.get(s.id):n.particles.linksColor;p=Ut(t,r,e)}p&&function(t){const{context:e,pos1:i,pos2:s,pos3:o,backgroundMask:n,colorTriangle:a,opacityTriangle:r}=t;!function(t,e,i,s){t.beginPath(),t.moveTo(e.x,e.y),t.lineTo(i.x,i.y),t.lineTo(s.x,s.y),t.closePath()}(e,i,s,o),n.enable&&(e.globalCompositeOperation=n.composite),e.fillStyle=qt(a,r),e.fill()}({context:e,pos1:i,pos2:h,pos3:d,backgroundMask:a.backgroundMask,colorTriangle:p,opacityTriangle:l})}))},this._drawTriangles=(t,e,i,s)=>{const o=i.destination;if(!t.links?.triangles.enable||!o.options.links?.triangles.enable)return;const n=o.links?.filter((t=>{const e=this._getLinkFrequency(o,t.destination);return o.options.links&&e<=o.options.links.frequency&&s.findIndex((e=>e.destination===t.destination))>=0}));if(n?.length)for(const s of n){const n=s.destination;this._getTriangleFrequency(e,o,n)>t.links.triangles.frequency||this._drawLinkTriangle(e,i,s)}},this._getLinkFrequency=(t,e)=>Wo([t,e],this._freqs.links),this._getTriangleFrequency=(t,e,i)=>Wo([t,e,i],this._freqs.triangles),this._freqs={links:new Map,triangles:new Map}}drawParticle(t,e){const{links:i,options:s}=e;if(!i||i.length<=0)return;const o=i.filter((t=>s.links&&this._getLinkFrequency(e,t.destination)<=s.links.frequency));for(const t of o)this._drawTriangles(s,e,t,o),t.opacity>0&&(e.retina.linksWidth??0)>0&&this._drawLinkLine(e,t)}async init(){this._freqs.links=new Map,this._freqs.triangles=new Map}particleCreated(t){if(t.links=[],!t.options.links)return;const e=this.container.retina.pixelRatio,{retina:i}=t,{distance:s,width:o}=t.options.links;i.linksDistance=s*e,i.linksWidth=o*e}particleDestroyed(t){t.links=[]}}class 
jo{constructor(){this.id="links"}getPlugin(t){return new $o(t)}loadOptions(){}needsPlugin(){return!0}}async function Go(t,e=!0){await async function(t,e=!0){await t.addInteractor("particlesLinks",(t=>new Uo(t)),e)}(t,e),await async function(t,e=!0){const i=new jo;await t.addPlugin(i,e)}(t,e)}class No{draw(t){const{context:e,particle:i,radius:s}=t,o=this.getCenter(i,s),n=this.getSidesData(i,s),a=n.count.numerator*n.count.denominator,r=n.count.numerator/n.count.denominator,c=180*(r-2)/r,l=Math.PI-Math.PI*c/180;if(e){e.beginPath(),e.translate(o.x,o.y),e.moveTo(0,0);for(let t=0;t0?"counter-clockwise":"clockwise"}switch(i){case"counter-clockwise":case"counterClockwise":t.rotate.status="decreasing";break;case"clockwise":t.rotate.status="increasing"}const s=e.animation;s.enable&&(t.rotate.decay=1-C(s.decay),t.rotate.velocity=C(s.speed)/360*this.container.retina.reduceFactor,s.sync||(t.rotate.velocity*=_())),t.rotation=t.rotate.value}isEnabled(t){const e=t.options.rotate;return!!e&&(!t.destroyed&&!t.spawning&&e.animation.enable&&!e.path)}loadOptions(t,...e){t.rotate||(t.rotate=new Jo);for(const i of e)t.rotate.load(i?.rotate)}update(t,e){this.isEnabled(t)&&(!function(t,e){const i=t.rotate,s=t.options.rotate;if(!i||!s)return;const o=s.animation,n=(i.velocity??0)*e.factor,a=2*Math.PI,r=i.decay??1;o.enable&&("increasing"===i.status?(i.value+=n,i.value>a&&(i.value-=a)):(i.value-=n,i.value<0&&(i.value+=a)),i.velocity&&1!==r&&(i.velocity*=r))}(t,e),t.rotation=t.rotate?.value??0)}}const tn=Math.sqrt(2);class en{draw(t){const{context:e,radius:i}=t,s=i/tn,o=2*s;e.rect(-s,-s,o,o)}getSidesCount(){return 4}}class sn{draw(t){const{context:e,particle:i,radius:s}=t,o=i.sides,n=i.starInset??2;e.moveTo(0,0-s);for(let t=0;t0&&(e.loops??0)>(e.maxLoops??0))return;if(e.time||(e.time=0),(e.delayTime??0)>0&&e.time<(e.delayTime??0)&&(e.time+=t.value),(e.delayTime??0)>0&&e.time<(e.delayTime??0))return;const 
n=M(i.offset),a=(e.velocity??0)*t.factor+3.6*n,r=e.decay??1;o&&"increasing"!==e.status?(e.value-=a,e.value<0&&(e.loops||(e.loops=0),e.loops++,e.status="increasing",e.value+=e.value)):(e.value+=a,e.value>s&&(e.loops||(e.loops=0),e.loops++,o&&(e.status="decreasing",e.value-=e.value%s))),e.velocity&&1!==r&&(e.velocity*=r),e.value>s&&(e.value%=s)}class nn{constructor(t){this.container=t}init(t){const e=this.container,i=t.options,s=ut(i.stroke,t.id,i.reduceDuplicates);t.strokeWidth=C(s.width)*e.retina.pixelRatio,t.strokeOpacity=C(s.opacity??1),t.strokeAnimation=s.color?.animation;const o=Rt(s.color)??t.getFillColor();o&&(t.strokeColor=jt(o,t.strokeAnimation,e.retina.reduceFactor))}isEnabled(t){const e=t.strokeAnimation,{strokeColor:i}=t;return!t.destroyed&&!t.spawning&&!!e&&(void 0!==i?.h.value&&i.h.enable||void 0!==i?.s.value&&i.s.enable||void 0!==i?.l.value&&i.l.enable)}update(t,e){this.isEnabled(t)&&function(t,e){if(!t.strokeColor||!t.strokeAnimation)return;const{h:i,s,l:o}=t.strokeColor,{h:n,s:a,l:r}=t.strokeAnimation;i&&on(e,i,n,360,!1),s&&on(e,s,a,100,!0),o&&on(e,o,r,100,!0)}(t,e)}}async function an(t,e=!0){await async function(t,e=!0){await t.addMover("parallax",(()=>new Do),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalAttract",(e=>new Es(t,e)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalBounce",(t=>new As(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalBubble",(t=>new Us(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalConnect",(t=>new Ns(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalGrab",(t=>new Qs(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalPause",(t=>new Js(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalPush",(t=>new to(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalRemove",(t=>new io(t)),e)}(t,!1),await async function(t,e=!0){await 
t.addInteractor("externalRepulse",(e=>new ro(t,e)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalSlow",(t=>new lo(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("particlesAttract",(t=>new To(t)),e)}(t,!1),await async function(t,e=!0){await t.addInteractor("particlesCollisions",(t=>new Ao(t)),e)}(t,!1),await Go(t,!1),await async function(){b("ease-in-quad",(t=>t**2)),b("ease-out-quad",(t=>1-(1-t)**2)),b("ease-in-out-quad",(t=>t<.5?2*t**2:1-(-2*t+2)**2/2))}(),await async function(t,e=!0){await t.addShape(Os,new Ds,e)}(t,!1),await zo(t,!1),await async function(t,e=!0){await t.addShape("line",new So,e)}(t,!1),await Zo(t,!1),await async function(t,e=!0){await t.addShape(["edge","square"],new en,e)}(t,!1),await async function(t,e=!0){await t.addShape("star",new sn,e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("life",(t=>new Oo(t)),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("rotate",(t=>new Ko(t)),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("strokeColor",(t=>new nn(t)),e)}(t,!1),await Ps(t,e)}const rn=["text","character","char","multiline-text"];class cn{constructor(){this._drawLine=(t,e,i,s,o,n)=>{const a={x:-(e.length*i/2),y:i/2},r=2*i;n?t.fillText(e,a.x,a.y+r*o):t.strokeText(e,a.x,a.y+r*o)}}draw(t){const{context:e,particle:i,radius:s,opacity:o}=t,n=i.shapeData;if(!n)return;const a=n.value;if(void 0===a)return;void 0===i.text&&(i.text=ut(a,i.randomIndexData));const r=i.text,c=n.style??"",l=n.weight??"400",h=2*Math.round(s),d=n.font??"Verdana",u=i.shapeFill,p=r?.split("\n");if(p){e.font=`${c} ${l} ${h}px "${d}"`,e.globalAlpha=o;for(let t=0;tZ(t,e.particles.shape.type)))){const t=rn.map((t=>e.particles.shape.options[t])).find((t=>!!t)),i=[];dt(t,(t=>{i.push(Q(t.font,t.weight))})),await Promise.all(i)}}particleInit(t,e){if(!e.shape||!rn.includes(e.shape))return;const i=e.shapeData;if(void 0===i)return;const s=i.value;void 0!==s&&(e.text=ut(s,e.randomIndexData))}}class 
ln{constructor(){this.enable=!1,this.speed=0,this.decay=0,this.sync=!1}load(t){t&&(void 0!==t.enable&&(this.enable=t.enable),void 0!==t.speed&&(this.speed=S(t.speed)),void 0!==t.decay&&(this.decay=S(t.decay)),void 0!==t.sync&&(this.sync=t.sync))}}class hn extends Re{constructor(){super(),this.animation=new ln,this.direction="clockwise",this.enable=!1,this.value=0}load(t){super.load(t),t&&(this.animation.load(t.animation),void 0!==t.direction&&(this.direction=t.direction),void 0!==t.enable&&(this.enable=t.enable))}}class dn{constructor(t){this.container=t}getTransformValues(t){const e=t.tilt?.enable&&t.tilt;return{b:e?Math.cos(e.value)*e.cosDirection:void 0,c:e?Math.sin(e.value)*e.sinDirection:void 0}}init(t){const e=t.options.tilt;if(!e)return;t.tilt={enable:e.enable,value:C(e.value)*Math.PI/180,sinDirection:_()>=.5?1:-1,cosDirection:_()>=.5?1:-1};let i=e.direction;if("random"===i){i=Math.floor(2*_())>0?"counter-clockwise":"clockwise"}switch(i){case"counter-clockwise":case"counterClockwise":t.tilt.status="decreasing";break;case"clockwise":t.tilt.status="increasing"}const s=t.options.tilt?.animation;s?.enable&&(t.tilt.decay=1-C(s.decay),t.tilt.velocity=C(s.speed)/360*this.container.retina.reduceFactor,s.sync||(t.tilt.velocity*=_()))}isEnabled(t){const e=t.options.tilt?.animation;return!t.destroyed&&!t.spawning&&!!e?.enable}loadOptions(t,...e){t.tilt||(t.tilt=new hn);for(const i of e)t.tilt.load(i?.tilt)}update(t,e){this.isEnabled(t)&&function(t,e){if(!t.tilt||!t.options.tilt)return;const i=t.options.tilt.animation,s=(t.tilt.velocity??0)*e.factor,o=2*Math.PI,n=t.tilt.decay??1;i.enable&&("increasing"===t.tilt.status?(t.tilt.value+=s,t.tilt.value>o&&(t.tilt.value-=o)):(t.tilt.value-=s,t.tilt.value<0&&(t.tilt.value+=o)),t.tilt.velocity&&1!==n&&(t.tilt.velocity*=n))}(t,e)}}class un{constructor(){this.enable=!1,this.frequency=.05,this.opacity=1}load(t){t&&(void 0!==t.color&&(this.color=ce.create(this.color,t.color)),void 0!==t.enable&&(this.enable=t.enable),void 
0!==t.frequency&&(this.frequency=t.frequency),void 0!==t.opacity&&(this.opacity=S(t.opacity)))}}class pn{constructor(){this.lines=new un,this.particles=new un}load(t){t&&(this.lines.load(t.lines),this.particles.load(t.particles))}}class fn{getColorStyles(t,e,i,s){const o=t.options.twinkle;if(!o)return{};const n=o.particles,a=n.enable&&_()a&&(s.angle-=a),r.x+=n*Math.cos(s.angle),r.y+=n*Math.abs(Math.sin(s.angle))}(t,e)}}async function gn(t,e=!0){await async function(t,e=!0){await t.addParticleUpdater("destroy",(e=>new $i(t,e)),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("roll",(()=>new fs),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("tilt",(t=>new dn(t)),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("twinkle",(()=>new fn),e)}(t,!1),await async function(t,e=!0){await t.addParticleUpdater("wobble",(t=>new mn(t)),e)}(t,!1),await async function(t,e=!0){await t.addShape(rn,new cn,e)}(t,!1),await async function(t,e=!0){await t.addInteractor("externalTrail",(t=>new ds(t)),e)}(t,!1),await async function(t,e=!0){await t.addPlugin(new Fi,e)}(t,!1),await async function(t,e=!0){t.emitterShapeManager||(t.emitterShapeManager=new es(t)),t.addEmitterShapeGenerator||(t.addEmitterShapeGenerator=(e,i)=>{t.emitterShapeManager?.addShapeGenerator(e,i)});const i=new ss(t);await t.addPlugin(i,e)}(t,!1),await async function(t,e=!0){const i=t;i.addEmitterShapeGenerator&&i.addEmitterShapeGenerator("circle",new ns),await i.refresh(e)}(t,!1),await async function(t,e=!0){const i=t;i.addEmitterShapeGenerator&&i.addEmitterShapeGenerator("square",new cs),await i.refresh(e)}(t,!1),await an(t,e)}return gn(Ti),e})())); \ No newline at end of file diff --git a/docs/overrides/fancylogo.txt b/docs/overrides/fancylogo.txt new file mode 100644 index 00000000..230d5476 --- /dev/null +++ b/docs/overrides/fancylogo.txt @@ -0,0 +1,257 @@ +--- +hide: +- navigation +- toc +--- + +
+ +
+ + +
+
+
+ + +
+
Loading...
+
+
+ AI4CO Logo +
+
+ + +
+
+
\ No newline at end of file diff --git a/docs/overrides/main.html b/docs/overrides/main.html new file mode 100644 index 00000000..01fd277c --- /dev/null +++ b/docs/overrides/main.html @@ -0,0 +1,12 @@ +{% extends "base.html" %} +{% block content %} +{% if page.nb_url %} + {% set path_parts = page.url.strip('/').split('/') %} + {% set last_part = path_parts[-1] %} + {% set notebook_url = page.url ~ last_part ~ '.ipynb' %} + + {% include ".icons/material/download.svg" %} + +{% endif %} +{{ super() }} +{% endblock content %} \ No newline at end of file diff --git a/docs/stylesheets/extra.css b/docs/stylesheets/extra.css new file mode 100644 index 00000000..58d3e427 --- /dev/null +++ b/docs/stylesheets/extra.css @@ -0,0 +1,30 @@ +/* Custom colors */ +:root { + --md-primary-fg-color: #B92B0F; + --md-primary-fg-color--light: #F05F42; + --md-primary-fg-color--dark: #B92B0F; + + --md-accent-fg-color: #B92B0F; + --md-accent-fg-color--transparent: var(--md-accent-fg-color); /* Default to current color */ + --md-accent-bg-color: #ffffff; + --md-accent-bg-color--light: #B92B0F; + } + +[data-md-color-scheme="default"] { + --md-accent-fg-color--transparent: #f8d2cb; /* Transparent color for 'default' scheme */ +} + +[data-md-color-scheme="slate"] { + --md-accent-fg-color--transparent: #492821; /* Transparent color for 'slate' scheme */ +} + +/* Ensure code blocks wrap text */ +.codehilite pre { + white-space: pre-wrap; /* Allow text to wrap within the pre element */ + word-break: break-word; /* Break the word at the edge of the container if necessary */ +} + +/* Improve overall readability of code by adding some padding */ +.codehilite { + padding: 8px; /* Adjust padding to fit your design */ +} diff --git a/docs/stylesheets/mkdocstrings.css b/docs/stylesheets/mkdocstrings.css new file mode 100644 index 00000000..abea38a6 --- /dev/null +++ b/docs/stylesheets/mkdocstrings.css @@ -0,0 +1,54 @@ +/* Indentation. 
*/ +div.doc-contents:not(.first) { + padding-left: 15px; + border-left: .05rem solid var(--md-typeset-table-color); +} + + +/* Fancier color for operators such as * and |. */ +.doc-signature .o { + color: var(--md-code-hl-special-color); +} + +/* Fancier color for constants such as None, True, and False. */ +.doc-signature .kc { + color: var(--md-code-hl-constant-color); +} + +/* Fancier color for built-in types (only useful when cross-references are used). */ +.doc-signature .n > a[href^="https://docs.python.org/"][href*="/functions.html#"], +.doc-signature .n > a[href^="https://docs.python.org/"][href*="/stdtypes.html#"] { + color: var(--md-code-hl-constant-color); +} + + +/* Nice names only in TOC */ +.doc-symbol-toc.doc-symbol-method::after { + content: "m"; +} + +.doc-symbol-toc.doc-symbol-function::after { + content: "f"; +} + +.doc-symbol-toc.doc-symbol-class::after { + content: "C"; +} + +.doc-symbol-toc.doc-symbol-module::after { + content: "M"; +} + +.doc-symbol-toc.doc-symbol-attribute::after { + content: "A"; +} + +.doc-symbol-toc.doc-symbol-parameter::after { + content: "P"; +} + +/* Line under link as solid */ +.doc-signature .autorefs { + color: inherit; + border-bottom: 1px solid currentcolor; +} \ No newline at end of file diff --git a/examples/1-quickstart/1-quickstart.ipynb b/examples/1-quickstart/1-quickstart.ipynb new file mode 100644 index 00000000..a14bf040 --- /dev/null +++ b/examples/1-quickstart/1-quickstart.ipynb @@ -0,0 +1,455 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# RL4CO Quickstart Notebook\n", + "\n", + "\"Open\n", + "\n", + "[**Documentation**](https://rl4co.readthedocs.io/) | [**Getting Started**](https://github.com/ai4co/rl4co/tree/main#getting-started) | [**Usage**](https://github.com/ai4co/rl4co/tree/main#usage) | [**Contributing**](#contributing) | [**Paper**](https://arxiv.org/abs/2306.17100) | [**Citation**](#cite-us)" + ] + }, + { + "attachments": {}, + 
"cell_type": "markdown", + "metadata": {}, + "source": [ + "In this notebook we will train the AttentionModel (AM) on the TSP environment for 20 nodes. On a GPU, this should less than 2 minutes! 🚀" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "![Alt text](https://user-images.githubusercontent.com/48984123/245925317-0db4efdd-1c93-4991-8f09-f3c6c1f35d60.png)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Installation" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "## Uncomment the following line to install the package from PyPI\n", + "## You may need to restart the runtime in Colab after this\n", + "## Remember to choose a GPU runtime for faster training!\n", + "\n", + "# !pip install rl4co" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The autoreload extension is already loaded. 
To reload it, use:\n", + " %reload_ext autoreload\n" + ] + } + ], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2\n", + "\n", + "import torch\n", + "\n", + "from rl4co.envs import TSPEnv\n", + "from rl4co.models import AttentionModelPolicy, REINFORCE\n", + "from rl4co.utils.trainer import RL4COTrainer" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Environment, Policy and Model\n", + "\n", + "Full documentation of:https://rl4.co/docs/content/api/envs/base/\n", + "\n", + "- Base environment class [here](https://rl4.co/docs/content/api/envs/base/)\n", + "- Base policy class [here](https://rl4.co/docs/content/api/networks/base_policies/)\n", + "- Base model class [here](https://rl4.co/docs/content/api/rl/base/)" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "# RL4CO env based on TorchRL\n", + "env = TSPEnv(generator_params={'num_loc': 50})\n", + "\n", + "# Policy: neural network, in this case with encoder-decoder architecture\n", + "policy = AttentionModelPolicy(env_name=env.name, \n", + " embed_dim=128,\n", + " num_encoder_layers=3,\n", + " num_heads=8,\n", + " )\n", + "\n", + "# RL Model: REINFORCE and greedy rollout baseline\n", + "model = REINFORCE(env, \n", + " policy,\n", + " baseline=\"rollout\",\n", + " batch_size=512,\n", + " train_data_size=100_000,\n", + " val_data_size=10_000,\n", + " optimizer_kwargs={\"lr\": 1e-4},\n", + " ) " + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Test greedy rollout with untrained model and plot" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Problem 1 | Cost: 10.648\n", + "Problem 2 | Cost: 9.375\n", + "Problem 3 | Cost: 11.713\n" + ] + }, + { + "data": { + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAiMAAAGdCAYAAADAAnMpAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/H5lhTAAAACXBIWXMAAA9hAAAPYQGoP6dpAADKlUlEQVR4nOyddVgU2xvHv7tLpyBSipQBYiAqit1dqNfuxtZ7jXsNrl67ro157Q6wuxUVURFRDBBEEFS6a/f8/uDHyLC7sAvLBpzP88yjc2LmnWF3553zFocQQkChUCgUCoWiILiKFoBCoVAoFErFhiojFAqFQqFQFApVRigUCoVCoSgUqoxQKBQKhUJRKFQZoVAoFAqFolCoMkKhUCgUCkWhUGWEQqFQKBSKQqHKCIVCoVAoFIWipmgBJEEgEODbt2/Q19cHh8NRtDgUCoVCoVAkgBCClJQUWFpagssVv/6hEsrIt2/fYGVlpWgxKBQKhUKhlICvX7+iWrVqYvtVQhnR19cHkHcxBgYGCpaGQqFQKBSKJCQnJ8PKyop5jotDJZSRfNOMgYEBVUYoFAqFQlExinOxoA6sFAqFQqFQFApVRigUCoVCoSgUqoxQKBQKhUJRKFQZoVAoFAqFolCoMkKhUCgUCkWhUGWEQqFQKBSKQqHKCIVCoVAoFIVClREKhUKhUCgKhSojFAqFQqFQFIrUysiDBw/Qq1cvWFpagsPhwMfHp9g59+7dg4uLCzQ1NVGjRg0cOHCgBKJSKBQKhUIpj0itjKSlpaFBgwbYvn27ROPDwsLQo0cPtGvXDgEBAZg1axbGjx+P69evSy0shUKhUCiU8ofUtWm6deuGbt26STx+586dsLW1xYYNGwAAjo6OePToEf7991906dJF2tNTKBQKhUIpZ5S5z8iTJ0/QsWNHVluXLl3w5MkTsXOysrKQnJzM2igUCoVCoZRPylwZiYmJgZmZGavNzMwMycnJyMjIEDln1apVMDQ0ZDYrK6uyFpNCoVAoUsAXEDwJjcP5gCg8CY0DX0AULRJFhZHaTCMP/vzzT8yZM4fZT05OpgoJhUKhKAnXgqKx9OI7RCdlMm0Whlrw7FUHXetaKFAyiqpS5isj5ubm+P79O6vt+/fvMDAwgLa2tsg5mpqaMDAwYG0UCoVCUTzXgqLhceQlSxEBgJikTHgceYlrQdEKkoyiypS5MuLm5obbt2+z2m7evAk3N7eyPjWFQqFQZAhfQLD04juIMsjkty29+I6abChSI7UykpqaioCAAAQEBADIC90NCAhAREQEgDwTy8iRI5nxkydPxufPnzFv3jy8f/8eO3bswKlTpzB79mzZXAGFQqFQ5IJfWDyikzKRmxKL1MAbSHlzC+kffZGTkLcaQgBEJ2XCLyxesYJSVA6pfUb8/f3Rrl07Zj/ft2PUqFE4cOAAoqOjGcUEAGxtbXH58mXMnj0bmzdvRrVq1bB3714a1kuhUCgqxo+UPNNMzs8viLu6hWk3ajcO6q7uQuMoFEmRWhlp27YtCBG/BCcqu2rbtm3x6tUraU9FoVAoFCXCVF8LAEBys1jtHHVNkeMoFEmhtWkoFAqFIhGutsawMNQCyc1mtXPUNPL+RV5UjautsQKko6gyVBmhUCgUikTwuBx49qojpIwIstLB+f//PXvVAY/LEZ5MoRQBVUYoFAqFIjFd61pgUEN2IsvMr0EwN9SC13AXmmeEUiKUMukZhUKhUJQXWyMN1r5azFvcndMKWpoaYmZQKEVDV0YoDDS9M4VCkYTCpTxSkpNw9cplBUlDKQ/QlREKAJremUKhSE5SUpJQ2549e+Du7i5iNIVSPHRlhELTO1MoFKkomEsqn2vXruHLly8KkIZSHqDKSAUnP72zgJ+LzIhAVh9N70yhUETx9etXoTZCCP777z8FSEMpD1BlpIKTn9454c5efD/+FxIeHEZOYgzTT9M7UyiUwsTExIhs/++//8Dn8+UsDaU8QH1GKjg/UjKR8vo
6Ul5eAgAkPzmJ9OAHICDQtnGGlrUztKzr0/TOFAqF4efPnyLbIyMjce3aNfTo0UPOElFUHaqMVHCiPwQg/oYXq03LugEEmalIDbiG1IBrADiYf7sefHt0RYcOHdCyZUvo6OgoRmAKhaJQfv78ibS0NLH9u3fvpsoIRWo4pKhCM0pCcnIyDA0NkZSUBAMDA0WLU26IiIhAkyZN8OPHD6ZNs5oTzAYvBwjB91NLkPU1SGiehoYGmjdvjo4dO6JDhw5o3Lgx1NSoXkuhVASuXLlSpLLB4/EQEREBS0tLOUpFUVYkfX5Tn5EKSnp6Ovr27ctSRHgGVVCl75/g8NTBUdOAab9FUDexFpqbnZ2Ne/fuYdGiRXBzc0PlypXRt29fbN26FcHBwUUWUqRQKKrN8+fPi+zn8/nYv3+/nKShlBeoMlIBIYRg3LhxrErKmlpaqDPyH/B0KzFtVc1MsO/4WVSrVq3I4yUnJ+P8+fOYMWMG6tSpg2rVqmHUqFGIjqYhwRRKecPPz6/YMXv37oVAIJCDNJTyAl1br4CsWbMGJ06cYLUdOngQ/Qf8Br+wePxIyYSpfl7lTR6XA5dr19CyZUskJiZKdPxKlSphwoQJsLCgydIolPIEIUTsyoihoSGWL1+OXbt2ISgoCLdu3ULnzp3lLCFFVaE+IxWMS5cuoXfv3ixTysKFC7F8+fIi5z169AgdO3ZEVlZWkeOWLVuG+fPnQ0OD1qigUMob4eHhqFWrFnR1dYVeTrhcLrKzs8HlcvHs2TNERkZiwIABihGUojRQnxGKEMHBwRg6dChLEenVqxeWLVtW7NyWLVvi2LFj4HCKLg1+9uxZvHjxotSyUigU5SMjIwOvX7+GlpaWUJ9AIEB8fDw4HA6aNWtGFRGKVFBlpIKQkJCA3r17IyUlhWmrU6cOjhw5Ai5Xso9Bv379sG3btiLHvH79Gs2bN8eECRMQFxdXKpkpFIpy4ejoCEdHR6FCefkUdIinUKSBKiMVgNzcXAwePBghISFMm5GREc6fPy+12WvKlCn466+/ih23d+9eODg4YP/+/dSRjUIRgSpXyabKCEXWUGWkArBgwQLcuHGD2edyuTh58iRq1KhRouMtX74co0ePZvZ1dXXh4+MDKysr1rjY2FiMHTsWbdq0QVCQcL4SCqWici0oGi3X3MGQPU8x80QAhux5ipZr7qhEUUo+n4/s7GyRfVQZoZQUqoyUcw4dOoQNGzaw2jZs2IBOnTqV+JgcDge7d+9Gt27dAABmZmbo06cPgoODMW/ePKEEaI8ePULDhg0xb948pKamlvi8FEp5QNWrZGdmii8NIS5NPIVSHFQZKcf4+flh4sSJrLZRo0Zh5syZpT62uro6Tp06hcaNG8PU1BRA3grJmjVr8OrVK7Rq1Yo1Pjc3F+vWrUOdOnXg7e1NE6NRKiT5VbJFffpVpUp2UcoIXRmhlBSqjJRTvn37hr59+7JCcZs2bYqdO3cWGxEjKXp6erh8+TJatGjBaq9bty7u37+PAwcOwMTEhNX39etX9OvXD7169UJYWJhM5KBQVIX8Ktn5CAQC5CZ9R8aX1wBUo0q2OH8RgCojlJJDlZFySGZmJvr168fKgGppaQlvb2+RIXmlwdTUFGvWrBFq53A4GDVqFD58+CC0OgMAly9fhpOTE1auXCnW/kyhlDcKVr+Ou+GFqG3DEbVzHH6eXQYi4Iscp2xQZUR5UWWnaKqMlDMIIZg8eTKePXvGtGlqasLb27vMMqLyeDyxfcbGxti1axeePHmCBg0asPoyMjKwcOFCNGjQAHfv3i0T2SgUZcJU/9fLAMnJhCAj+f//z0JO3FeR45SNwspIwe8/VUYUhyo7RQNUGSl3bNq0CQcPHmS17dmzB66urgqSKI9mzZrB398f//77L/T09Fh979+/R/v27TFixAh8//5dQRJSKGWPq60xLAy1wAGgYc6OZsuK/ggOAAvDvFIMykphZURHR4f5P1VGFIOqO0UDVBk
pV9y4cQN//PEHq+3333/HiBEjFCQRGzU1NcyaNQvv37/Hb7/9JtR/5MgR1K5dGzt27ACfzxdxBApFteFxOfDsVQcAoGVRi9WXFngTAODZqw54XNn4dZUFhZURfX195v80mkb+lAenaIAqI+WGT58+YdCgQawEY126dBHpz6FoqlatilOnTuHatWuwt7dn9SUlJWHq1Klwc3OjaeUp5ZKudS3gNdwFVjUcAe4vE0dW1HvMc9VG17rKXWCysDJSMHFiYmIi9QGTMwWdouNv7ULSs3PgZ/36G6mCUzRAlZFyQXJyMvr06cMqXFWzZk0cP368SH8ORdOlSxcEBQXB09NTqLDe8+fP4erqiunTpyMpKUlBElIoZUPXuhbwXdQVtRzqFGgl2L5kRpGhs8pAYfkMDQ1Z+3R1RL7kOzvnxH5FyotLSLz3H77tHIvkFxdFjlNWqDKiYty6dYtlwhAIBBg+fDiCg4OZNgMDA1y4cAFGRkaKEFEqtLS08PfffyMoKEgoEZtAIMC2bdvg4OCA48eP09wklHIFj8tBmxbNWG1v377FwoULFSSRZBReGSn8O0P9RuRLvrNz4pMTyDfMCDJTwE9LFDlOWaHKiApBCMG8efNw/vx5pm3x4sW4ePGXBszhcHDs2DE4ODgoQsQSU7NmTVy/fh0nTpwQivqJiYnB0KFD0alTJ3z48EFBElIosqdJkyZCbRs3bsTt27cVII1kFFZGjI3ZzrZUGZEvrrbGqJT9E+nvHjBtHA1tGDTpk/d/KL9TNECVEZXCz88Pr169YtK7nzx5EitXrmSNWblyJXr06KEI8UoNh8PBoEGD8P79e8ycOVOomvDt27dRv359LF68uMhcBxSKqtC4cWOR7aNGjUJ8vHLa+At/9wonNqRmGvnC43JAHu0GCriw6rv0BE/bAPlu0MruFA1QZUSl2LFjBwDA19cXXl5eGDNmDKt/yJAhmD9/viJEkykGBgbYtGkT/P390bRpU1ZfdnY2li9fjrp16+Lq1asKkpBCkQ1169YVmRE5KioKkydPVkrTZGFlJL8cRD50ZUS+7N27F4HPn/xq4KnDoElfAIC5oRa8hrsovVM0QJURlSE2NhYnT55k9qdMmcL6UXBxccHevXtllupdGWjYsCF8fX2xc+dOVKpUidX3+fNndO/eHQMGDEBkZKRiBKRQSom6ujorGqUgp0+fxuHDh+UsUfEUVkbMzMxY+1QZkR+3b9/GpEmTWG29BwzGtrFtcHxCMzya314lFBGAKiMqw/79+1l1ZgpiamoKHx8fVvKh8gKXy8WkSZPw4cMHjBw5Uqj/7NmzcHR0xMaNG5Gbm6sACSmU0lHY56Ig06ZNU7oaToWVkcI+XlQZkQ/3799Hjx49WOkcAGD35nXo41wVbvaVld40UxCqjKgAAoEAXl5eYvtr1qyJGzdu4N27d0IfzPKCqakpDh48iHv37sHR0ZHVl5qait9//x2NGjWCr6+vgiSkUEpGYTNHQVJSUjBixAilUrQLh/aam5uz9qkyUvb4+vqiR48eQi+olpaWQitVqgJVRlSA69evF/l29PjxY4wfPx5OTk5o06YNEhIS5CidfGnTpg0CAgKwevVqaGtrs/oCAwPRokULjB8/HnFxcQqSkEKRjsIP88I8fvxYqZIXigrtLVjigSojZYufnx+6deuGtLQ0ob6uXbsqQCLZQJURFSDfcbUouFwu5s2bh5s3b6pEfpHSoKGhgfnz5yM4OBi9e/cW6t+3bx9q166N//77r9yuFCkKVa4KqqxI8ib7999/4/nz53KQpngKKyPa2tqs1R0aTVN2vHz5El26dEFycrLI/hYtWshZItmhpmgBKEUTHh6Oy5cvFzmmZs2aOHjwINzc3OQklXJgbW2N8+fP48KFC5g+fToiIiKYvri4OIwbNw7//fcfvLy8UK9ePQVKWj64FhSNpRffsYpxWRhqwbNXHZVxklNGivL1WrduHTIyMhASEoIdO3Zgz549UFN
T7M+2OGXk8+fPAOjKSFkRGBiITp06sTJtF6Zhw4byE0jG0JURJWfXrl1FhvfNmDEDAQEBFU4RKUjv3r3x7t07zJ8/X+iH+vHjx2jYsCHmzp2L1NRUBUmo+pSHqqDKipaW+MyYampqWLx4MQ4ePIj9+/crXBEBil8ZSU9PF2lCoJScd+/eoWPHjkXmnlFXV4eTk5McpZItVBlRYrKysrB3716RfTY2Nrh79y42b95cLqNopEVXVxerV69GQEAAWrduzerj8/lYv349HB0dce7cOaXM3aDMlJeqoMqKpqam2L5Tp07JRQZpzG8FlREOhwMNDQ2aa6QM+fjxIzp06FCs+cvJyUmoxpcqQZURJebMmTOIjY0Vap84cSICAwPRtm1b+Qul5Dg5OeHevXs4ePAgqlSpwuqLjIxE//790bNnT2ZJmVI8BauCAgA/OxPpIc+Q5JuX90ZVqoIqK1paWpg7d67IvidPnuDr169lev5rQdFoueYOhux5ipknAjBkz1O0XHNH7GpXwWgaLS0tcDgcqoyUEUlJSZgxYwYMDAxgZ2dXpH+Ri4uLHCWTPVQZKSO+fPmCc+fOSTWn8NvJ9kKOq1WrVsXVq1exa9cu6Ovry1LccgWHw8HIkSPx/v17TJo0SSgR3JUrV+Dk5IQVK1aIzd1C+UXBap8J9w8gausw/Dz7DxIfHkZucqzIcRTJGTduHNasWSOU2C+fM2fOlNm5S2J+K7gykh/RVljxp06sssHQ0BDXrl3Dhw8fEBoaiiFDhogdq8r+IgBVRmRKSkoKDhw4gHbt2sHGxkbkqoY4Cr+d9F9+DE8K5MwYOXIkgoKCVDp0S94YGxtj586d8PX1hbOzM6svMzMTixYtQoMGDXDnzh3FCKgiFKz2ydXQAcn9pcDFXd8GkpsjNI4iOVWqVAGHwxFbp+b06dNlct6Smt9EKSN0ZaTsiYuLw/bt21ltBdMbUGWknCFt6CKfz8eNGzcwfPhwmJmZYcyYMbh37x4qVaqEYcOGSXROUW8nKa/yImi4OpWwZPN/OHjwoNg3J0rRNGvWDM+fP8emTZuEVpQ+fPiADh06YPjw4YiJiVGQhLJHliG4rrbGsDDUAgeAtj37gZn52R/RB2ZAL+mz0lcFVXbEKSNlZaopbH4rjDjzG1VGFMPChQuRk5PD7HO5XBw+fBgcDgccDgcNGjRQoHSlR/Gu2UqENKGLb9++xaFDh3DkyBF8+/ZN6Fhjx46Frq4uAIAQgpSUFCQmJiIpKQmJiYnMFp+QgPUXXyE5KQmCrDQIMlNh0GwA0t7dg45DK1TuNBk30sywREBUKrWvsqGmpoaZM2fit99+w5w5c1h1fgDg6NGjuHTpElasWIHJkyeDx+MpSNLSI+sQXB6XA89edeBx5CU0qtiCp28CfsqvVb+cuK94t2sm5miEYMWKFawEWBTJadKkidi+M2fOYPbs2TI9X0GzWubXIGSE+CEn4RtIThaM2o+HRhVroXEAVUYUwbdv34SCGQYPHoz+/ftj4cKFOHXqlMp/7zhEBUILkpOTYWhoiKSkJLFFpUpL/upE4ZuR//j3Gu6CRmZqOH78OA4dOoQXL14UeTwbGxtwOBxGAZEm+ZZ+0wHQNLODruOvqJDjE5rBzb6yxMegFM2NGzcwdepUhISECPU1btwYXl5eYt9UlRlJPsclzQmSr+QEnVqP1IBrIsdYW1tj9+7d6Ny5c4nOUZGJiIiAtbW1yD43NzeZlzp4EhqHIXueAgCSn/sg4c6vh12VAZ7Qsc9Tjgr/9hgaGjJJt1xdXfHs2TPExMSwatQMGzYMR44ckam8FZlRo0bh0KFDzD6Xy8WXL19QrVo15ObmwsvLC9OnT1eghOKR9PlNzTQQbTtNfXMbOQnfIMjNQdqHxxg6sD8sLS0xc+bMYhURIC9ZWVhYGBISEqTOAqppZs9SRADqHChrOnfujDdv3uDvv/8WCq309/eHq6srpk2bVmSCIWWjrENwu9a1wKP57bH
EY7jYMV++fEGXLl0wevToInMiUISxsrJirTCoq6sz/y8LU01B8xtPtxKrLyvyHTjIW1ErbH4TtTJSuTL7RYk6sMqOsLAwoerNQ4cORbVq1QDkrfoqqyIiDVQZgbDtNCc5FnFXN+Pb7omI+HcAfvqsQkLwE7kVqxJkZwi1UedA2aOlpQVPT0+8efNG6E2eEILt27fDwcEBx44dU4ncJKJ8AAghyPwaBMLPlUkILo/LwdTh7kUm6gKAgwcPwtHREadPn1aJe6cMFHZiLegfAMg+qibf/AYAPF12CYkU/wvISfgGz151cN7Hm1GE+Hw+S678z4G6ujqrDAU108iO+fPns75DXC4XK1asUKBEZQP1GYHwqkOK/3mA/H81Q8Av0TF1dXVhbm6OSpUqMZuhoaHQvoGBIRZe+YzEXDVwNPXA1dIFR+OXhzQHgLmItxOK7KhZsyauXbuG06dPY9asWYiO/hXO+P37dwwbNgz79u1jlBNlpeDnWJCZitSgO0h+7g1+8k+Y9P0TurVbCI0rCTo6OmjXrh2uXr1atDw/fmDgwIHo27cvtm/fDktLy1KdtyLQpEkTXLlyRWTfqVOnZO430rWuBbyGu2D+3u/4XqCd5GaBXFuFxivccc43FrVq1cLMmTOF3sC1tbWRkJCAnTt3suqlUGVENrx7904ommrYsGGoXr26giQqO6jPCNi2UyLgI8prDPipot8eNTU1weVyhVIiF6Zhw4Z4/vy5RI6Q+XZ+AKwldlnY+SnSkZycDE9PT2zZskXIvKauro558+Zh4cKFQhWDlYGCn+OM0Of4cWYp08fTN4H5yI1Q0zOWif/Rjh07MHXqVInHGxoaYv369Rg3bpxQ3hfKLy5duoRevXox+6ampqwHe0REBKysrGR+3h8/Y2FmWkWo3c3NDXv37mXSjBsYGLCUDgsLC6SkpCA1NRW6urpMGng1NTVkZ2fTv3Up6dGjB0s55XK5+Pz5s1jfImWE+oxIQUHbKYfLg8XozTBsMQRcHUOhsVlZWcjIyICmpiZatmyJ3r17w87OTmjcq1evsH//fonOn/92Ym7IXvo2N9SiioicMTAwwL///osXL16gadOmrL6cnBysWLECTk5OYt9eFUnBz7GWrQt4Br/8D/gpsYjaOQ7Zjw/AWidH/EEkpEePHqz94jz5k5KSMGHCBHTo0EGk0zAlj8JO04XD+csqAZpJZWOWj0o+T548waJFi5iHX+FqsdHR0UzNJ1tbW6Y9NzdXpfytlJEXL14I/c4MHz5cpRQRaaArI/9H1OoEyc1G2rv7SPY/j5yf4WLndurUCSNHjoS6ujp8fX3x6NEjBAQEoHLlyvj06RMMDYWVGlHwBQR+YfH4kZIJU/080wwN51UcAoEAe/fuxYIFC5CQkCDU369fP2zatKlM3lRLSsHPceKTU0h8cEhojI6ODqZNm4a5c+fCxMSkxOeqV68egoKCAOT5O0jyU1KjRg1069YNq1evpjWVxGBlZYXIyEgAeYn7CjoCN2vWDE+ePCmT81arVg1RUVEi+5ycnPD27dsi5w8bNgxHjx5l9t+/f4/atWvLVMaKRPv27XH37l1mn8vlIjQ0FDY2NooTqgTQlREpEbU6wVHTQM1WvXD+9mPcunVL6G0wn5s3b2LEiBH4+++/UadOHTx8+BCJiYk4evQoq6x9cfC4HLjZV0Yf56pws69MFREFw+VyMXHiRLx//x6jRo0S6j937hwcHR2xYcMGIWdDRVHwc6xXvxPAFXYLS09Px9q1a2Fra4uFCxeWOOql4PeBEFJkUr7hw4cjKioKnz59wpYtW6giUgQFV0fi4+NZfkpPnz6V6jdFGszNzcX2FaeING7cGDVq1GC10YiakvPw4UOWIgLkfYdUTRGRCqICJCUlEQAkKSmpzM+VyxcQ35BY4vMqkviGxJJcvoDV/+HDBzJlyhSio6NDkLeIIrQZGxuTP//8k0RGRpa5vBT5cf/+fVKnTh2Rf/N69eqRR48
eKVpEhvzPccvOvcV+TvM3fX19smTJEpKQkCDVOR48eMA6ToMGDcSeQ0tLizx9+rRsLracsWLFCta9Gzx4MGt/w4YNZXLeHj16FPtZEbetW7eObN++ndV29uzZMpGzvCMQCIirqyvrXnK5XBIaGqpo0UqEpM9vqoyUkLi4OLJ69WpStWpVsV9QNTU1MmzYMOLv769ocSkyIjs7m6xZs0asMjp27Fjy8+dPRYvJcPfuXYkfKIaGhmTZsmUSf89ycnKIkZERM9/IyIhoaWmxPv8Fj29qakrCwsLK9oLLAdevX2fdtwkTJrD2mzVrVibnHTt2bImVkfDwcHL69GlWm5eXV5nIWd65evWq0P0dOXKkosUqMVQZkRPZ2dnk+PHjQpps4a1Vq1bk7NmzJDc3V9EiU2RAeHg46dOnj9iVsb179xI+n69oMYlAICAODg5SPViMjIzIypUrSXJycrHHHzJkCGtu7955KzEcDofcu3ePWFhYsPqdnJxIYmKiHK5cdYmLi2Pdsw4dOpD69euz2r58+SLz8/71118lUkTylaP79++z2pcuXSpzGcs7AoGA1KtXT2hVJCQkRNGilRhJn98l8hnZvn07bGxsoKWlhaZNm8LPz6/I8Zs2bULt2rWhra0NKysrzJ49G5mZ5SOjqLq6OgYPHoynT5/i8ePH+O2338DlCt/Whw8fon///qhZsyY2bdok5JVOUS2sra3h4+ODCxcuCHm3x8fHY/z48WjVqhUCAwMVJGEeHA4HkydPZrWJ+nwWJCEhAX/99Rfs7Oywbt06JlxTFD179mTt52cQ7d69O9q0aYOLFy+y/EPevn2LQYMGyS2BoCpibGzMitDz9/fHb7/9xhpTFlE1RfmMFMXAgQMB0Po0suDcuXN48+YNq23YsGGwt7dXkERyRFot58SJE0RDQ4P8999/5O3bt2TChAmkUqVK5Pv37yLHHz16lGhqapKjR4+SsLAwcv36dWJhYUFmz54t8TmVeWVEFOHh4eT3338nBgYGYt8m9PX1yaxZs8jnz58VLS6llKSmppIFCxYImSUAEB6PR+bMmSPRKkNZER8fT7S1tRmZNDQ0JHrjbdiwIdm4caPY7zYheW/xXC6XmVO3bl3StWtXcvXqVWaMt7c34XA4rGN7eHgQgUAg9rgVnUGDBrHuV2HTTVmYak6ePFmilZGvX78SQgiJjY1ltQ8cOFDmMpZncnNzSc2aNVn3kMPhkI8fPypatFJRZmYaV1dXMnXqVGafz+cTS0tLsmrVKpHjp06dStq3b89qmzNnDmnRooXE51Q1ZSSf5ORksnnzZmJnZyf2i8zlckm/fv3Iw4cP6Y+zivP27VvSpk0bkX/nqlWrkjNnzijsbzxmzBghZVjcZ9LU1JS8fv1a4mO3bNmSNf/atWtCJqr169cLnWfTpk2yvsxyw7p161j36tixY0IOwrI21RQ2s0iymZiYMKZnPp9PeDwe09e2bVuZylfeOXjwoND9HT58uKLFKjVlooxkZWURHo9HvL29We0jR44kvXv3Fjnn6NGjxNDQkDx79owQQkhoaChxcHAgK1asEHuezMxMkpSUxGxfv35VSWUkn9zcXOLj4yP2QZW/NW7cmBw5coRkZWUpWmRKCREIBOTQoUOkSpUqIv/G3bp1U4hXvJ+fH0sOKyurIj+L/fv3l/hzuGrVKtbc7du3C40RCARCjpgcDodcuHBB1pdaLrh37x7rXs2ZM4csX76c1SbrqJoPHz5IrYxs2bKFdQxzc3Omr06dOjKVrzyTlZUl9J3kcrnkw4cPihat1JSJMhIVFUUAEF9fX1b73Llziaurq9h5mzdvJurq6swy9uTJk4s8j6enp8gPvqoqIwV58eIFGTFiBFFXVxf7Bbe0tCQrV64ksbGxihaXUkLi4+PJ5MmThcwTQF6Y67Jly0hmZqbc5BEIBMTFxYUlR61atYp80HTr1o2kp6cXe+w3b96w5nXv3p3VHx0dTQjJc/bu0KEDa6y
uri559epVWVyySpOcnMz67LRq1UpIWWjatKlMz5mYmCjyc9CiRQuR7RwOh0RFRbGOUdDR1sTERKbylWcKh0UDIMOGDVO0WDJBaZSRu3fvEjMzM7Jnzx4SGBhIzp07R6ysrMiyZcvEnqe8rYyI4tu3b2TRokWkcuXKYh8G2traZNKkSSQ4OFjR4lJKyNOnT0nDhg1F/n1r1apFbt26JTdZ9uzZwzp/ly5dmP8bGhoKrVwAeUvtxfm7CAQCUr16dZaylZaWRgghZO/evWTixInM2ISEBKHonqpVqwo91CiEODo6spS23NxcIVNNeHi4zM4nEAhYodkASN++fUlmZqbIFAYNXZsL5WHq2LEjS1nJycmRmXzllbS0NGJmZiak6JWX332lMdO0bNmS/PHHH6y2w4cPE21tbYlDH1XVZ0QS0tPTye7du8Um0yr4lnrjxg3qV6KC5OTkkM2bN4v10xgyZAizelCWpKamspyqNTU1Sc+ePQmQl1hLIBCQ33//XUi+pk2bkvj4+CKP7eHhwZpz8eJFxu9h/PjxrLGhoaHExMSENd7FxYWkpqaW5eWrHCNGjGDdo6CgICFTzfr162V6ThsbG+bY6urqjCJa2IcFADHuPIU0W3mLXH3zjZlfONQ7JiZGpvKVR9auXSvyN6G8UCahvRoaGmjUqBFu377NtAkEAty+fRtubm4i56SnpwuFEuZXsiXKXxanzNHW1saECRMQFBSE69evo2vXriLHXb16FZ07d0a9evWwd+/eYqsGU5QHNTU1zJgxAx8+fMDgwYOF+o8fP47atWtj27Zt4PP5ZSaHrq4uRo4cyexnZWWhfv360NDQQJ8+fcDhcLBu3Tp4enqy5j179gzt2rVjhWoKBAJ8+PCBCdEtHOI7ZcoUzJ07F4BwKLGdnR3Onz8PTU1Npu3ly5cYNmxYmV6/qtGkSRPWvqgQ38Ll5UuLmZkZ8381NTXo6+sDAGxb9gZHg53CX8OiJmKSMuFx5CWuBUUDEA7vpSnhiyYpKQkrV65ktXE4HCxevFhBEikQabWcEydOEE1NTXLgwAHy7t07MnHiRFKpUiVGAx4xYgRZsGABM97T05Po6+uT48ePk8+fP5MbN24Qe3t7qcK+yvPKiCjevn1LJk2axArHLLyZmJiQxYsXy+WNmiJbbty4IRTCl781atSI+Pn5ldm5g4KCWOerWbMmWbhwoVAqeFFvwg4ODqwSBxMmTCBaWlqkUaNGQinLC26TJk0SKcuxY8eExhZeRa3I+Pr6su5NfhRjWZpqCifyS0lJIbl8AWm28hYxcO3H6tNv3IdYz79EbOZfIs1W3iK5fIFQKvvbt2/LTLbyiCj/yEGDBilaLJlSphlYt27dSqpXr040NDSIq6srq+ZEmzZtyKhRo5j9nJwc8vfffxN7e3uipaVFrKysyJQpU6Sqg1HRlJF8YmNjyYoVK4SyWBbc1NXVyciRI6kToIqRkZFBli5dSjQ1NYX+phwOR+rviDS0atWKdb7r16+LHLdjxw4h2WxtbZncOImJiUWWQ8jfinJYX7p0qdD4Xbt2lcl1qxppaWmsUNl8h9XCD3xZmmomTZrEOvanT5+Ib0gssZ5/iVSdcoCAmxeEwNXSJ8adJhPr+ZeYzTckVsgv6fjx4zKTrbzx8+dPoqurK/TdDwoKUrRoMoWmgy9HZGVlkcOHDwtFQxTe2rZtS86fP09TzqsQnz59YjmSFtxMTU3J4cOHZe4ndPToUdZ5+vfvL3bswYMHWUnNgDyH03znuosXLxarjHh4eIg9vkAgIMOHD2eN5/F45ObNmzK9ZlWl4CqIpqYmycrKIh8/fmTdL1lG1SxZsoR17IcPHxKfV5GMwmHYchip3H02sfr9HEsRsZ5/ifi8iiTnz59nzd+8ebPMZCtv/PHHH0Lfld9++03RYsmcMk0HT5EvGhoaGD58OPz9/fHgwQO4u7uDw+EIjbt37x769OmD2rVrY+vWrUhNTVWAtBRpqFGjBq5
evYrTp0/D0tKS1ffjxw+MGDECHTp0wPv372V2zv79+8PExITZ9/Hxwbdv30SOHTlyJE6ePAl1dXWmLSoqCq1bt0ZgYCB69uyJoUOHFnm+otLPczgc7N27Fy1btmTa+Hw+BgwYgHfv3kl6SeWWxo0bM//PysrC27dvUbNmTTg7OzPtz549w5cvX2RyvsIp4b9//w5TfS1mv1KLIdCr1wFcNQ2huab6WjQlvIRERUVh69atQu0V0lfk/1BlRIXgcDho1aoVzp07h5CQEMycORN6enpC40JDQzFjxgxUq1YNc+fORUREhAKkpUgKh8PBgAED8P79e8yePZtx8M7n7t27qF+/PhYuXIj09PRSn09TUxNjx45l9vl8Pvbt2yd2/IABA+Dj4wMtrV8PpZ8/f6Jt27bw8/PD5s2bUaVKFbHzRSnOheXx9vZm1WNJSkpCz549K/zDrLAT6/PnzwGgzGrVFFZGYmJi4GprDAtDLYj7K3IAWBhqwdXWWOhzQB1YRbN8+XJkZWWx2vr374969eopSCLFQ5URFcXOzg6bNm1CZGQkNm7cCBsbG6ExSUlJWL9+Pezs7DBw4EA8efJE/oJSJEZfXx8bN27Eixcv0KxZM1ZfTk4OVq5cCScnJ1y6dKnU55o0aRJrf/fu3azidT4+Pqz+7t2748qVK9DV1WXaEhIS0KFDB7x9+1bkW14+xSkjAGBiYoLLly+jUqVKTFtYWBj69u1bbopqloSCKyNAXkQNIKyMnDp1SibnKxhNA+QpIzwuB5696gCAkEKSv+/Zqw54XA5dGSkCvoDgSWgcdl3yxe49e4T6lyxZogCplAg5mY1KRUX3GZGEnJwccubMGbHZElHAvnzixAmajEjJ4fP5ZPfu3cTIyEjk37Fv376lrk1S2Ffl/PnzhJC8PECmpqYi5zx58oQYGhqy5mlpaZErV64IRWLkbzNmzJBYptu3bwsVHMzPgVIRycrKYhU2dHZ2ZvqcnZ1Z90kWUTWhoaGsY06YMIHpu/rmG2m28hbLT6RwnpHCidOaN29eapnKAwXvna5TO6HviLu7u6JFLDOoA2sFxs/PjwwdOlRkFdn8zcrKiqxZs6bYZFYUxfLjxw8yevRokX9DXV1dsnbtWpKdnV2iY/v4+LCO161bN3Lnzh2mVIG44758+VIoaZm6ujrZu3cvqVSpkpCcs2bNkkquvXv3Ch1jyZIlJbrG8kCTJk2Y+6Cmpsak6C+LqJrU1FTWMXv16sXqz+ULiG9ILPF5FUl8Q2KFMrASQljZeGvUqFFqmVSdq2++EZv/K28WY4XTvgMo19GQVBmhkMjISPLnn38SY2NjsUqJrq4umTp1qsqXqS7vPHjwgDg5OYn8G9atW5c8fPhQ6mPm5OSQatWqMcfhcDisDK0Fc4oU5t27d8TS0lIoCkZUSvnZs2dLLdv8+fOFjnP48GGpj1MemDJlCus+5KdSKBxVU1R9MGnQ09NjjtmkSROp5zdu3JiZb2BgIBOZVJX8HC35K0k6tZoLfa6NHIXT6pcnaDQNBVWrVsXKlSvx9etXeHl5oXbt2kJj0tLSsH37dtSuXRu9e/fGnTt3aGZcJaRVq1Z49eoV1q5dCx0ddibMoKAgtGrVCmPHji3WYTAoKAienp7YsmULTp06xfJJIIQgOTmZ2Y+OjhZ7HEdHRzx8+JDlq8Tn87F3717UqVOHNVYSn5HCrFy5Ev369WO1jRs3Dg8fPpT6WKpOYb+RfCfWwlE1fn5+CA8PL/X5Cjqxfv/+Xer5BZ1Yk5OThRw1KxJ+YfGITsrzeeJnpiIzKlhojKbrQPiFxctbNKWDKiMVAB0dHUyePBnv3r3DlStX0KlTJ6ExhBBcvHgRHTp0QMOGDXHgwIEK/SOijKirq2Pu3LkIDg5G3759hfr3798PBwcH7NmzBwKBQOQxnJyc8O7dO8ycORPDhg0TclQtSFHKCJDnRP3gwQPUqlWLaSOE4N27d9DQ+BX6WRJlhMvl4vDhw6w
HcXZ2Ntzd3RESEiL18VQZUWnh8xk4cCCrTxZRNQWdWGNiYqR+OaEp4X/xI+WX8zVPSw/6DXuw+rVruELTvAZrXEWFKiMVCC6Xi27duuHGjRt48+YNxo0bx6oPks/r168xZswYVK9eHUuXLqUe8UpG9erV4e3tjYsXLwpFUcXHx2PixIlo2bIlXr9+LTSXw+Fg//79EoUQxsTEFDvGysoKDx48QP369Vnt2dnZv46TnIXzAVF4EhoHvkDyB5uOjg4uXLgAKysrpi0uLg49evRAQkKCxMdRdRwcHFirYfkrI4BwVI0satUUXBnJzs5GYmKiVPNpRM0vCuZoEWRnIvnZWVa/YYuhQuMqKlQZqaDUrVsXe/fuRUREBJYtWyYU0gfk/Yj8/fffqF69OsaNG4c3b94oQFKKOHr27Im3b9/ir7/+YiUlA4AnT56gUaNGmDNnDlJSUlh9enp68PHxgbGxcZHHL25lJB8zMzPcvXtX6A0+nwuvv2HmiQAM2fMULdfcYYqqSYKFhQUuXbrEyqfz8eNH9O/fn6XwlGfU1NTg4uLC7AcHBzMJDWvUqIGGDRsyfbIw1YhKfCYNVBn5RcEcLYkPDoHk/Cpwqm3fBFrmNZgcLRUdqoxUcExNTbF48WJ8+fIFBw4cQIMGDYTGZGVl4b///kP9+vXRsWNHXL58WawZgCJfdHR0sGLFCrx+/Rpt27Zl9fH5fPz7779wdHTEmTNnWMvtdnZ2OHnyZJHZUSVVRgDA2NgYt27dQuvWrYX6MsNfg5C8z0vhKq+SUL9+fSFZ7969Cw8Pjwrj31TYt+fly5fMvqwToInKNSINVBn5RX6OlpyUOKS8ZOcHqtRiCIBfOVoqOlQZoQDIy4I5atQovHr1Cnfv3kXv3r1F2vpv376Nnj17ok6dOvDy8kJaWpoCpKUUxtHREXfu3MHhw4eFHgZRUVH47bff0L17d4SGhjLtHTt2xLp168QeU9qHkIGBAa5evYrOnbuw2nN+hCLx4REAeeEDALD04jupTDbdu3fH5s2bWW3//fcf1q5dK5WMqkpRfiOyNtXQlRHZ0sXJHGo3VgLk1wucll0jWDvUh9dwF3Sta6FA6ZQHqoxQWHA4HLRt2xbnz5/Hhw8fMG3aNFbWzXw+fPiAKVOmwMrKCgsWLEBkZKQCpKUUhMPhYPjw4Xj//j08PDyElMlr167ByckJy5YtY5yTZ8+ejeHDh4s8njQrI/no6Ojgr3//g3bNXxlkudoG0HfuyuwTANFJmVJHEEybNg3Tp09ntS1YsEBmqdCVGXERNYDsTTWiUsJLA00Jz2b16tX4EvKB1bZ17Uo8mt+eKiIFoMoIRSw1a9bE1q1bERkZiXXr1qF69epCYxISErBmzRrY2tpi6NChrB9JimIwMjLCjh078PTpU5avAZBncvP09ES9evVw69YtcDgc7N69G40aNRI6TkmUEQBIzCao0mcBdOq0AU/XCGbD10HNwFRoXEkiCDZu3Iju3buz2kaMGAE/P78Syaoq1KhRAwYGBsx+wZURQLamGmqmkR2PHz/GwoULWW2dO3fG+P6dqWmmEFQZoRRLpUqV8McffyA0NBQnT54UqpsCALm5uTh+/DhcXV3RokULnDlzhlXrhCJ/XF1d4efnh61bt7IeZADw6dMndOrUCUOGDEFiYiK8vb2FHiIlCesE8iIDODw1mPSYA/ORG6FhXFXsOGlRU1PDiRMnWNFAmZmZ6N27d7kuCMnlclmrIyEhIayIIlnWqimtmabwykhFVUZ+/vyJgQMHCn2H/v77b8UIpORQZYQiMWpqakzBvSdPnmDQoEFCFWYBwNfXF7/99htq1KiBjRs3IikpSQHSUgCAx+Nh2rRpeP/+PYYMGSLUf+LECTg4OMDHxwcnT56Empoa05ednV2iENr8CAIulwc1A+FqvgWrvJYEfX19XLp0SSg5V8+ePVlJ28obhU01L168YP5f2FTz/PnzEptqSrsyoqWlxVJ+K6Iywuf
zMWzYMHz79o3VrqWlBTc3NwVJpdxQZYRSIpo1a4YTJ07g8+fPmDt3LgwNDYXGfPnyBb///juqVauGmTNnspwnKfLFwsICx44dw82bN1lJyoC8LJkzZszAnDlzMGfOHFZfSUw10lR5LSnVq1fHhQsXoK2tzbS9efMGgwcPLrcrcoWdWAubRAsnQCupI6umpiarerK0ygjANtVURGVk+fLluHnzplB7wZw5FDZUGaGUiurVq2Pt2rWIjIzEtm3bUKNGDaExqamp2LJlC2rWrAl3d3fcv3+/woRkKhsdO3ZEYGAgli1bJpTw7tWrV1i3bh0cHR2ZtjsvP5YoYVnXuhbwGu4Cc0O2KcbcUEtmEQRNmjTBkSNHWG1Xr17F7NmzS31sZaTwykhxfiOliaqRZUr4nz9/Vqjv+61bt7B06VKRfVQZKYIyrI8jM2ihPNWBz+eTCxcukHbthMtkF9waNmxIDh06RLKyshQtcoUlJCSEdO3aVeTfh/f/is/GPeaILRcvCZJUeS0tq1evFpJ/y5YtMj+PohEIBKxqyVZWVkJjXFxcWPchLCysROdq27YtqwAin8+Xan6fPn1YcqSkpJRIDlUjMjKSVKlSRezvXv/+/RUtotyhhfIoCoHL5aJXr164c+cOAgICMHr0aFadknxevXqFkSNHwsbGBitWrEBsbKwCpK3Y2Nvb48qVKzhz5gyqVmU7mfL/b+pIfnwMOXFfAZQsYRmPy4GbfWX0ca4KN/vKZRJBMG/ePIwdO5bVNmvWLFy5ckXm51IkHA6HtTry9etXoVULWa2OFPQb4fP5iIuLk2p+RYyoycnJweDBg4sMZS4u63FFhiojlDKjQYMG2L9/P758+YIlS5YIedkDeT4JixYtgpWVFSZOnIh3794pQNKKC4fDQf/+/REcHIw5c+YIOSTnJsYgNzHvgVfShGVlDYfDgZeXF9q1a8e0CQQCDBo0CIGBgQqUTPYU9hsp6MQKyE4ZoYnPpGfhwoV49OhRkWOMjIzkJI3qQZURSpljbm6OpUuXIiIiAvv27UPdunWFxmRmZmLPnj1wcnJC165dcf369QplZ1Y0+vr62LBhA/afvwNNSwemXcuuMbTtC6QiR8kSlpU1GhoaOHv2LGrXrs20paamomfPniXOl6KMFJX8DMhb7SqYW+b58+cICwuT+jw014h0XLhwochsxvlQZUQ8VBmhyA0tLS2MHTsWgYGBuHnzplDyqnyuX7+Orl27wsnJCbt370ZGRobIcRTZY1DVHmbD18K463TwDExRucs0keOUseS5kZERLl26hMqVKzNtX79+Re/evZGenq5AyWRHcU6sgGwSoJU2C2tFUkbi4+Ph5eUFd3d3eHh4sCosF4aaacRDlRGK3OFwOEzBvfzU5QVDNPMJDg7GpEmTYGVlhUWLFpWrN1xlxVRfCxwOF/oNuqDqpD1QMzARO04ZqVGjBry9vVl+Sv7+/hg+fAQef/pZosggZcLS0hKWlpbM/vPnz4VWEGWRAE3Wic/Kc0p4Y2NjXL16FefOnYOzs7OQ4qul9eu7QldGxEOVEYpCqV27Nnbs2IHIyEisWrVKyJESAOLi4rBixQpYW1tjxIgRrIqlFNlSsOQ5hyuc0K60CcvkQatWrbBv3z5Wm7f3OXQfMQUzTwRgyJ6naLnmjlSOuMpEQb+R79+/IyoqitVf2FTj7+8vtamGmmmkJzs7GytWrGC1aWlp4fnz54wCSZUR8VBlhKIUGBsbY8GCBQgLC8OxY8eEHPWAPG/1I0eOoFGjRmjTpg18fHzA5/MVIG35RR4Jy+TB8OHDsWTJElZb8rMzSHl9A0DJIoOUheL8RgDhBGjSmmqomUZ6Dh06JFSSYNCgQahbty5u3LgBY2NjaqYpAqqMUJQKdXV1DBkyBM+ePcOjR48wYMAAcLnCH9MHDx7A3d0dtWrVwubNm5GSkqIAacsn8khYJg8WL/FE5frtWG3xN7YjIzxAaSODJKEkfiPSmmqqVKn
CqvosrZmmcuXKrPnlXRnJyckRWhUBgDFjxgAAnJyccOXKFSElj/ILqoxQlBIOh4MWLVrg9OnTCA0NxZw5c4SKvQHA58+fMWvWLFSrVg2///57qUqnU37Rta4FHs1vj+MTmmHzYGccn9BM5UqePw9PgG6n6azoIJ6uEXg6eZ8jZY0MKg5JVkbs7OxYlZilNdWoq6uzHIGlXRlRU1NjzS/vysjhw4eFfntsbGzQqlUrZr9p06Ysfx8KG6qMUJQeGxsbbNiwAZGRkdi8eTPs7OyExiQnJ2Pjxo2wt7fHgAED8PjxYxoaXErkkbCsLPmRkgmOmgaq9F8MNUMzaJjXQKV246BuYi00TpUwMTGBjY0Ns+/v7y/ys17anCMF3+JLUp+mcEr48oq4VZHRo0eLXNWliIbeKYrKoK+vjxkzZuDjx4/w9vZG69athcYIBAKcPXsWLVu2RNOmTXH8+HHk5OQoQFqKosmP+OHpGMJ08AqYDVkNkpmC2AtrQXKzhcapEgV9qhISEvD582ehMbJURmJjY6UuQFjQb+Tnz58QCARSzVcVjh49KvL+jxw5UgHSqC5UGaGoHDweD3379sX9+/fx4sULjBgxAurq6kLjnj9/jqFDh8LW1harV69GfLxqLcdTSkfByCD1SubgamhBy7oB0j88xveTiyHITFX6yCBxSOI3IspUI+qhKY6CETWEEKlXNwoqI7m5uUhMTJRqviqQm5uL5cuXC7W3bdsWtra2CpBIdaHKCEWlcXFxwaFDhxAeHo6FCxey7NT5REVF4c8//4SVlRWmTJmCDx8+KEBSirwRFRmkZmQJnn4VZEW+RcyReZjSxFDlzE+AcFp4UX4jQOkSoNGU8MVz7NgxhIaGCrWPHj1a/sKoOFQZoZQLLC0tsXz5ckRERGDXrl1wdHQUGpOeng4vLy84ODigR48euHXrFvUrKecUjgzicDjQsmkAAMiJi8Cfo/vizZs3ihSxRBTMIwKIXhkBSmeqoeG9RSNuVURPTw8DBgxQgESqDVVGKOUKHR0dTJw4EW/fvsW1a9fQpUsXkeOuXLmCTp06oUGDBvjvv/+QmalaTowUySkcGTR3zK8HRVRUFFq1aoV79+4pTsASYGhoyKrD8+LFC5E+GaUx1dDEZ0Vz4sQJfPr0Saj9t99+g66urgIkUm2oMkIpl3A4HHTp0gXXrl3D27dvMXHiRFZa5nzevHmDcePGoXr16vD09JR6KZqiGhSMDJo8tC+rLykpCV26dClR2nRFUtBvJDU1Vaz5saQJ0GhKePHw+XyRqyIANdGUFKqMUMo9derUwa5du/D161csX74cFhbCuTJ+/vyJZcuWoXr16hgzZgxev36tAEkp8sDMzAz16tVjtWVnZ2Pw4MHYvHmzgqSSnsJ+I5KaaiRVuqiZRjwnT54UqfzZ2dmhZcuWCpBI9aHKCKXCYGJigoULFyI8PByHDx8WsrsDeQ+lAwcOwNnZGe3bt8fFixfLbUhiRaZjx45CbYQQzJo1C3PnzlWJv7kkyc8AwNbWlmWqefHihUSmGmqmEQ2fz8c///wjsm/UqFE0t0gJoXeNUuHQ0NDA8OHD4e/vj/v376Nv376s1NX53L17F71790bt2rWxbds2pKamKkBaSlkgShnJZ/369RgxYgSys7PFjlEGGjZsyHrwiVsZAYRNNZI4slauXBk83q9iiTSaJo/Tp0/j/fv3IvtobpGSQ5URSoWFw+GgdevW8Pb2xqdPnzBz5kzo6ekJjQsJCcH06dNhZWWFefPm4evXrwqQliJLWrduDTU1NbH9x44dQ/fu3ZGcnCxHqaRDR0cHTk5OzP6rV6/EJvgrSVQNj8djKRTSroxUqlSJdY/LgzIiEAjEroq0a9eOlRmXIh1UGaFQkFd2fdOmTYiMjMSGDRtgbW0tNCYxMRHr1q2Dra0tBg8ejKdPnypAUoos0NPTg5ubW5Fjbt++jdatW+Pbt29ykkp6CvqNZGZm4t27dyLH2drassw
6JTHVSKuMcDiccpcS/syZM2LvMXVcLR1UGaFQCmBoaIg5c+YgJCQEZ86cQYsWLYTG8Pl8nDx5Em5ubnBzc8OpU6ekTpVNUTxFmWryef36NZo3by52WV7RSOo3ApRsdaSgE2tCQgKysrKkkq/gyoqqr4wIBAIsW7ZMZJ+enh769+8vZ4nKF1QZoVBEoKamhv79++PRo0fw8/PDkCFDRC7rP336FIMGDYK9vT3Wr19fLlNel1eKUkZsbW2xY8cOnDlzBkeOHBFpvlMGJEkLn09JlJHCTqzSKhQFlZG4uDiVVtrPnTuHt2/fiuyjuUVKD1VGKJRiaNKkCY4dO4awsDAsWLAARkZGQmMiIiIwd+5cVKtWDdOnT0dISIgCJKVIQ5MmTaCvry+yLywsDM7Ozujfvz9atmyJatWqyVk6yahfvz6rLlNRKyMlMdXIOrw3NjZWqvnKQlGrIgA10cgCqoxQKBJSrVo1rFq1Cl+/fsWOHTtQq1YtoTFpaWnYtm0batWqhT59+uDevXs05bySoq6ujrZt2zL7zs7OrH4PDw+lf5PX1NRE/fr1mf03b94UmU1Y2qgaWp8mDx8fH7FlA2huEdlAlREKRUp0dXXh4eGB4OBgXL58WWzOigsXLqBdu3ZwcXHBwYMHpba3U8qeDh06AABatWqFBw8esFZAXr9+ja1btypKNIkp6MSak5ODwMBAsWML10wpLgFaaXONFM7CqorKSHGrIjS3iGygd5AiMXwBwZPQOJwPiMKT0DjwBRX7jZ/L5aJ79+64efMmAgMDMXbsWGhqagqNCwgIwOjRo2FtbY1ly5aVi6iC8kLHjh2hrq6OnTt3Ql9fH1u2bGH1L1myBJGRkQqSTjKk8RspbKp5+fJlkaYaWZtpVPGzf+HCBVZG5oJmMSBPGaGUHqqMUCTiWlA0Wq65gyF7nmLmiQAM2fMULdfcwbWgaEWLphTUq1cP+/btQ0REBJYuXSr0IwzkLXF7enrCysoK48ePR1BQkAIkpRSkTp06+Pfff1GnTh0AQN++fdGjRw+mPzU1FbNnz1aUeBJROC18UX4jgHSmmopupiGECK2KFMzl0r59e5FpACjSQ5URSrFcC4qGx5GXiE7KhCA7g2mPScqEx5GXVCEpgKmpKZYsWYKIiAjs37+fZc/PJysrC/v27UO9evXQuXNnXLlypdj04xkZGSqRolzV4HA4mDp1Kmt/69at0NbWZtrOnDmDq1evKkI8iahTpw5L3qJWRgDpTDUVPSX8xYsX8erVK2bf0NCQ1U8dV2UHVUYoYklPT8ejx77w+HMFfl7agG97PfD134HITYkDAOQbaZZefFfhTTaF0dTUxOjRoxEQEIA7d+6gV69eIlPO37x5Ez169ICTkxN27tyJ9PR0kccLCwvD0KFDi3ROpMgGW1tbLF68mNU2bdo0ZGRkiJmhWNTU1NCwYUNm/927d0hLSxM73tbWlrWa8vLlS4SGhooca2RkxDJLVKSVEUIIli5dymor+P3T09NDv3795C1WuYUqIxQAeW/r/v7+2LlzJ8aNG4cGDRrAwMAArVq2QPil7Uh7exc5cV8BEGSEPkdWVDBy4qPAz0zFt8QM+IXFK/oSlBIOh4N27drhwoUL+PDhA6ZOnQodHR2hce/fv4eHhwesrKzw119/ISoqitWvp6eHkydPon379ir1g66q/P7773B0dGT2P3/+jJUrVypQoqIp6AciEAhYb/OikDTnCIfDYZlqKtLKyOXLl/Hy5Utm39zcnOWEPnDgQJpbRIZwiArEHSYnJ8PQ0BBJSUkwMDBQtDgKhRCCixcvomvXrtDQ0CjRMXJycvDu3Tv4+/vj+fPn8Pf3R2BgoNi6FoUxaPYbBJmpSA34/9I1l4dKRsaoZmEGExMTmJiYoEqVKkX+X0tLq0SylwcSEhKwd+9ebN26VWydGzU1NQwcOBCzZ89G48aNkZCQAGNjYwB5b7aXLl1i/BwoZcO9e/fQrl07Zl9dXR2BgYF
wcHBQoFSiOXLkCEaMGMHs//vvv5g1a5bY8eHh4bC1tWX2XVxc8OLFC5FjmzRpwph+9PX1pa7Xo6Ojw6wqubm5wdfXV6r5ioAQAldXV5bJy9HREcHBwcz+gwcP0KpVK0WIp1JI/PwmKkBSUhIBQJKSkhQtikJ58OABad68OWnQoIHEc3Jzc8nbt2/JgQMHyLRp00izZs2IlpYWQZ6VRaqNo65FNKs5EeMu04j1/EukcvfZhKOmUaJj6enpETs7O3Lv3r2yu2FKTnZ2Njlx4gRp2rRpkfeqZcuW5Pjx46w2Q0NDcvPmTUVfQrlnxIgRrPverl07IhAIFC2WEMHBwSw5hw4dWuycJk2asOaEhISIHNezZ0/WuLS0NKlks7a2Zuba29tLNVdRXL58mXXNNjY2rH07Ozul/BwoI5I+v6kyogK8efOG9YPwxx9/iBzH5/PJx48fydGjR8ns2bNJq1atiK6ubomUBS0tLdKsWTMydepUYj9gHrEct4NUn3ueWM+/xNosRm8hmkbmUh9fQ0ODnD59Ws53Unl58uQJGThwIOHxeBLfQx6PR3bv3q1o0cs1379/J5UqVWLd9yNHjihaLCH4fD7R19dnZKxVq1axc9atW8e6rlWrVokcN378eNa4z58/SyVbQaVHX19fqrmKQCAQEFdXV9Y1u7u7s/aXLVumaDFVBqqMlAPCw8PJqFGjCIfDYX0Rrl+/TgQCAQkLCyOnTp0i8+bNI+3btyeGhoYlUjzU1dVJo0aNyKRJk8iePXtIQEAAyc7OZuS4+uYbsZl/idgUUkTy2049ekd69Ogh8fkMDAzInTt3FHhnlZcvX76QP/74Q6q/5dy5cwmfz1e06OWWnTt3su63qakpiY+PV7RYQrRt25YlZ0JCQpHjw8LCWONdXFxEjlu4cCFrnK+vr1RyFf5tSE9Pl2q+vLl69SpLXnt7e2Jra8tqCw8PV7SYKgNVRlSY2NhYMmfOHKKhIdoE0qZNG1K5cuUSKR48Ho/Ur1+fjB07luzYsYM8f/6cZGZmFivT1TffSLOVt1jKSLOVt8jVN98IIXlvZv/884+Q4iRq09TUJMOGDSN37tyhD1ExpKSkkK1bt5IaNWpI9Hd1d3eXevmcIhl8Pl/IlObh4aFosYSYO3cuS8bbt28XO0cSU83WrVtZY7y9vaWSa8yYMaz5X758kWq+PBEIBKRZs2YseRcsWMDab9++vaLFVCmoMqKE5PIFxDcklvi8iiS+IbEkl8+2OaamppLly5cTAwODEikahTcOh0McHR3JiBEjyObNm4mvr2+pHljFyU8IIdeuXSPGxsYSy2hvb09WrFhBoqKiSixXeSYxMZE4ODhIdC8bN25Mvn37xpovyd+MUjyvXr0iXC6X9d169uyZosVicfLkSdbnYfXq1cXOkcRUc/r0adYYLy8vqeSaN28ea76/v79U8+XJ9evXWbLa2tqS0aNHs9oOHTqkaDFVijJVRrZt20asra2JpqYmcXV1LfZLmZCQQKZMmULMzc2JhoYGqVmzJrl8+bLE5ysPykhRKwvZ2dnEy8uLmJtL73tRcKtRowYZPHgwWb9+Pbl//z5JTk5WyLWGhYWRRo0aSSU7l8slvXr1Ij4+PiwTUUUmLCyM1KtXT6r7aGVlRV6/fk0IKX41iyIds2bNYt1rFxcXkpubq2ixGEJDQ1nyDRgwoNg5hU01DRs2FBrz4MED1hhPT0+p5Fq/fj1r/pUrV6SaLy8EAgFp3rw5S9bt27cTPT09Zl9PT4+kpqYqWlSVQtLnt9R5Rk6ePIk5c+bA09MTL1++RIMGDdClSxex8ePZ2dno1KkTwsPDcebMGXz48AF79uxB1apVpT21ylIwg2lBohMzMHLRFtjWdICHh4dUMfzW1tbo378/Vq1ahVu3biE+Ph6fPn3C8ePH8fvvv6N169Ziy6OXNTY2Nnj06BHGjx8v1Ne2bVtUqlRJqF0gEODixYvo27cvqlevjgULFuDTp09ykFY
58fX1haurq9hKoeL4+vUrWrRogWU7joj8zNGsuSVn2bJlsLS0ZPZfvnyJHTt2KFAiNra2tkz4N1B8Wngg77vq6urK7L969QohISGsMRUlJfzt27dZYcc2NjbQ1tZGamoq00Zzi5Qh0mo5rq6uZOrUqcw+n88nlpaWYj2xvby8iJ2dXanedlV5ZSSXLxB6O7Wef4mYDl5BNMxrlmgFRFNTk7x8+VLRlyYRe/bsIZqamozsBw8eJOnp6eTIkSOkXbt2xV5r69atyaFDhyqcP0Rubi75+vUrefjwITly5AhZvnw5GT9+POnYsSOpWbOmWH8iZuNwiXGnycznrerUQyzH42Yrb1GTTQk4deoU6z7r6+srlYmxc+fOLPl+/PhR7JzCppqVK1ey+vN/f/O3vn37SiXTtWvXWPPXrl0r1Xx5IBAISMuWLVly7t69m7Rv357V9vDhQ0WLqnKUiZkmKyuL8Hg8IQemkSNHkt69e4uc061bNzJs2DAyYcIEYmpqSpycnMiKFSuKXN7MzMwkSUlJzPb161eVVUZ8Q2KZh4COYxti0MSd6DfqTTStGxBNSweiVsmccNSlz/thY2ND4uLiFH15EuHv78/kGlizZg2rLyQkhPz111/EwsKiyOs1MDAgHh4e5MWLFwq6CuWCz+eTqKgo8vjxY3Ls2DGycuVKMnHiRNK5c2dS3a4GAU8972HZqBepNuM44WobEC1bF2IxZgvzefQNiVX0ZagcAoGAdO3alfXZHDRokKLFYigc+SKJSSQ8PLxIU41AICDa2tpMf7NmzaSS6eXLl6zji0tNoEhu377NkrF69erk48ePrDZ7e3uaW6QESKqMqBW/dvKL2NhY8Pl8oeJJZmZmeP/+vcg5nz9/xp07dzBs2DBcuXIFISEhmDJlCnJycuDp6SlyzqpVq4RqAqgqP1Lylsn5GSlID77PtGvZNITZiPXM/po+tdDEjIeYmBh8//5d5Jbfl5qaivDwcAwbNgyXLl0Cj8eT+3VJQ6NGjfDixQsMGzZMyBRlb2+PFStWYOnSpbh27Rr27t2LS5cugc/ns8YlJyfDy8sLXl5ecHZ2xrhx4zBs2DAYGRnJ81KUBi6XC0tLS1haWqJ58+asvvMBUZhx/CUEaUnITfqOpMfHIMhIRmbYS0SHvYJu3Xao1Go489mkSA6Hw8G2bdtQt25dpk7JyZMnMW7cOHTq1EnB0rHTwgN5RfO6detW5Bxra2u4urrCz88PwC9TTY0aNQD8SgkfFhYGoHyaaQo/b/766y+cOHGC1TZ69GiR9aUoMkIaDScqKooAwnHmc+fOJa6uriLn1KxZk1hZWbFWQjZs2EDMzc3Fnqc8royYDVnJftNv2p9ltpHmLTUtLY18/vyZPHnypNhcAspEbm4uefz4cbHjoqOjyerVq0nNmkWbsWiIsGgKrsZVnXqIcNQ1he8fT50MHT9VKfNlqALLli1j3c8aNWqQjIwMRYtFIiMjWXKJW7EuTHGmmoLhrtra2lKtEGRmZrKO3a1bN6muqay5e/cuSz4rKyuSkZFB7OzsmDYOh6PUIcnKTJk4sJqYmIDH4wlpxt+/fxdycsrHwsICtWrVYr29Ozo6IiYmBtnZ2SLnaGpqwsDAgLWpKq62xrAw1EL29zBWu4ZpXl0IDgALQy242hqLmC0aHR0d2NraolmzZiKdQZUVHo8n9BYvCnNzc8yfPx8fPnzA/fv3MXLkSFaJ9HyysrJw9OhRtG/fHrVq1cLKlSvx7du3shBdpcj/zHEA8LT1Uan1KHC1C32H+Dk4tnc77O3tsX79eloNWErmzZuHWrVqMfshISFYvXq1AiXKw9LSkvVbLIkTK1B84byCx8zIyEBKSorEMmlqasLQ0JDZV7aVkcKrIn/++Sf8/Pzw+fNnpq19+/aoXr26vEWrUEiljGhoaKBRo0a4ffs20yYQCHD79m24ubmJnNOiRQuEhIRAIBAwbR8/foSFhUWJC72pEjwuB5696iDnB1s
ZUa9ii/wFP89edcDj0uW/wnA4HLRu3RoHDx5EdHQ0vLy80KhRI5FjQ0NDsXDhQlhZWaFXr144f/68xIX/yhv5nzkA4PLUYdC4N6pO2gMDt4HgqGmyxiYkJGDu3LmoXbs2Dh06JGQeo4hGU1NTKJJm1apVCo8A43A4aNKkCbMfHR0tkYKeb6rJp3BUjSwjapRJGXnw4AHu3bvH7FerVg1jx47FgQMHWONGjx4tV7kqIlKH9s6ZMwd79uzBwYMHERwcDA8PD6SlpWHMmDEAgJEjR+LPP/9kxnt4eCA+Ph4zZ87Ex48fcfnyZaxcuRJTp06V3VUoOV3rWsCMX8BXgqcO9crVYG6oBa/hLuha10JxwqkIhoaGmDx5Mvz9/fHq1StMmzZNbIjwpUuX0LdvX1hZWWHBggX4+PGj/AVWMF3rWsBruAvMDfOqI3M1dWHUeiQa/n4QXfsPBZfL/upHRERg1KhRaNSoEa5fvw6i/MW8FU6HDh0wdOhQZj87OxtTp05V+L0r7Dci6erIwIEDWfsFV0cK+wlKk4YAEFZGFH2P8im8KrJgwQLk5OTg1KlTTJu+vj7c3d3lLVrFoyQ2oK1bt5Lq1asTDQ0N4urqSp4+fcr0tWnThowaNYo13tfXlzRt2pRoamoSOzu7YqNpCqPKob2E5FVnLRiKae9Yn2bDlAHp6enk6NGjEocIHzx4sOKFCIvJwPr27VvSq1cvsferQ4cONHJJAqKjo4XqCJ04cUKhMl25coUlz6JFiySaVziqxtnZmenz8vJi9Z06dUoqmQoXmlOG3/KHDx+yZLK0tCQZGRnk4MGDrPZx48YpWlSVhqaDVyICAwPph7uMyQ8RtrS0lChE2N/fn4bpkbzsmoXrrhTchg4dKnWV1orGtm3bWPfM3NycJCYmKkyeHz9+sOTp0qWLxHMLfxY+ffpECCHE29ub1b5161apZJo4cSJrvqgaOPKmY8eOLJm2bNlCCCFCLzc0t0jpKLMMrBTpCQgIYO03aNBAMYKUY/JDhL98+cJkchUV8pwfIty4cWO4uLhg27ZtSEhIUIDEykGrVq3w5MkTnD59GjVr1hTqP3bsGBwcHDB79mzExcUpQELlZ/LkySzTSExMDBYvXqwweapUqQJra2tm39/fX2KziDhHVlmaaQDF+434+vri1q1bzL6FhQUmTJiA8PBw3L17l2m3t7dHixYtFCFihYMqI3Lg9evXrH2qjJQdampq6NmzJ7y9vREZGYk1a9aIfMgCeUri9OnTYWFhgWHDhuHu3bssR+uKAofDwYABA/D27Vts375d6MGRnZ2NTZs2wc7ODqtXr0ZGRoaCJFVOeDwedu7cyfLD2b59O168eKEwmQoqR3FxcQgPD5do3oABA1j7+b4T5S0lfGFfkfnz50NLSwuHDh1itdPcInJEPgs1pUPVzTSFlwMVuYRbEREIBOT+/ftk5MiRrEySorZ8n6bIyEhFi60wkpOTyZIlS4iurq7Ie1S1alWyb98+pSoSpwxMmzaNdZ8aN26ssHu0evXqEvt4FDbVfPz4kaSlpbHaevbsKZU8J06cYM3fvXu3tJckM548eSJkVktPTyd8Pp/Y2trS3CIyhppplARCCMtMY2Njw4q5p5Q90oQIf/78GQsXLkT16tXRq1cv+Pj4VLgQYX19fSxduhQhISGYPHmykLkrKioK48aNg7OzMy5fvqw0kRGKZvny5awVBH9/f+zatUshspQ0ogYQbarR0dFhFd5UZTNN4VWRefPmQVtbG48ePWKyzAI0t4jckYtqVEpUeWUkP2tt/tanTx9Fi0T5P69evSLTpk0jlSpVKnK1xMzMjMybN498+PBB0SIrhPfv3wtFQxTc2rRpQ549e6ZoMZWC48ePs+6NoaEhiY6OlrscCQkJLDnatWsn8VxxUTUFMyJbWVlJJU9QUBDrmDNmzJBqfkl58eIFywH72bNnQt/t/Ai7MWPGsPoOHz4sFxnLOzSaRkkoHGbn6empaJE
ohcgPES5coVPU1qpVqwoZIkwIIY8fPyYtWrQQe28GDhyoFFESikQgEAiZZYcNG6YQWQoqDwYGBlKVTBBlqmnVqhWzr66uLlU02vfv31nHGzJkSEkuSWq2bt1KmjRpQrKysgghhHTv3p0lx/r16wkhhKSkpLDMkvr6+hXyO14WUDONkkAjaZQfbW1tDB06FLdv30ZISAgWLlwIS0tLkWMfPnyIUaNGwcLCAh4eHlJFKqg6zZs3x8OHD+Ht7Y3atWsL9Z86dQoODg6YPn26wh0UFQWHw8H27dtZ2aWPHj3KylotLwqaapKTk6XKDisqAVrBiJqcnBxWFFpxmXsrV67McgSV1+fj7du3eP78OebOnQt/f39cuXKF6atSpQomT54MADh37hzS0tKYvkGDBkFHR0cuMlL+j3x0o9KhyisjgwYNYmniNGeDapCTk0MuXbpE+vbtS9TU1IpcLWnQoAHZunVrhSo6l5OTQ3bt2kXMzc1F3hN9fX3yzz//kNTUVEWLqhA8PT1Z96NWrVokMzNTrjJs3LixxGaHL1++CJlqCjvovnv3jhBCyOXLl4mHh0exx6xSpQozt169eiW+Lmlo2bIlc84aNWqw5F+7di0zrm3btqy+R48eyUW+igA10ygJtWvXZi2V0kRbqkd0dDRZs2aNRFWEhw4dSm7fvl1hqginpqaSZcuWET09PZH3xMLCguzatYvk5OQoWlS5kpGRIfTw++eff+Qqw4MHD1jnnzlzplTzGzduzJo/a9Ys1v6RI0fIgAEDCACycOHCYo/n5OTE8tUoawQCgVh/MBMTE0ZR/vz5M6uvRo0a9HdahlBlRAlIS0sjXC6X+ZC3bNlS0SJRSoFAICAPHjyQOER4+fLlFSZE+Pv372TatGliV5EcHByIj49PhfqRv379OuseaGlpydWnJiUlhfX706JFC6nmb9iwgSW/qamp2M+7t7d3sccrmNmUx+OVucIeGRkpVl4dHR1iZ2dHbG1thRSW5cuXl6lcFQ2qjCgBhT23p02bpmiRKDIiMTGReHl5Cb09Ft64XC7p0aMH8fb2JtnZ2YoWu8z5+PEj+e2338TejxYtWhBfX19Fiyk3Bg4cyLr+rl27ylUhK7gaoa2tLdUKVWFTTVFbREREsccrfC9iY2NLc2nFUlgZFLcVrC1Ec4vIHurAqgRQ59XyS34V4efPnzOZXI2MjITGCQQCXL58Ge7u7rCyssL8+fPLdRXhmjVr4tSpU3j69Clat24t1P/48WM0b94c/fv3x4cPHxQgoXz5999/Wfk5rl27hrNnz8rt/E2aNGH+n5GRgeDgYInnVq9eHc2aNSt2nKmpKapVqybRuIKUtRNrUFBQsWP69OmDpKQkZr9Dhw40t4iCoMpIGULTwFcMGjRogC1btuDbt284duwY2rdvL3Lc9+/fsXbtWtSuXRutW7fGoUOHkJ6eLmdp5UPTpk1x7949XLx4EU5OTkL9586dg5OTEzw8PKROoKVKWFpaYvny5ay2WbNmISUlRS7nL03yM0A4AZq4c0iSMl3ZlJGhQ4eiUqVKrLbRo0eXnUCUopHTSk2pUFUzTcGcDFwul6SnpytaJIqcCA0NJQsXLpSoivCkSZPI8+fPy60/RW5uLtm3b5/Ye6Grq0s8PT1JcnKyokUtE3JyckjDhg1Z1zx79my5nLuwqViSqJeCSGKqWbx4sUTH2rlzJ2ueNCnqS0KTJk3EytyzZ08SHx9Pc4vIAeozomD4fD4rwsDR0VHRIlEUQH6IsLu7u0Qhwlu2bCFxcXGKFrtMSEtLIytXriQGBgYir9/U1JTs2LGjXPrWPHv2jHA4HNbLyatXr8r8vBkZGazPXePGjaU+RrNmzYr83J4/f16i45w7d441b9u2bVLLIil8Pl9sbaU2bdqQ9PR0cuDAAVb7+PHjy0yeigxVRhRMSEgI64Mur4yDFOUlJiaGrF27ltSqVavIH3dNTU0yZMiQchsi/PPnTzJz5kyirq4u8vp
r1apFzpw5U+5Wijw8PFjX2axZM7n8fV1cXJhzqqurS53vpHC+ksJbVFSURMd59OgRa96SJUtKcjkSUThct6Aylv8coblF5ANVRhTMmTNnWB/01atXK1okipIgEAjIw4cPyahRo4oNEba1tS23IcKhoaFkyJAhYq+9WbNm5MGDB4oWU2YkJCQIhcfu2rWrzM87ceJE1jmfP38u1fyIiAixfyNzc3OJj/PhwwfWXGlNRtJw4cIFIVnr1KlDfv78SQihuUXkCY2mUTDUeZUiDg6Hg5YtW+LAgQOIjo7Gzp07hRwN8wkLC8OiRYtQvXp19OzZs1xVEbazs8OxY8fg7+8v0uk3PyKnT58+UkWBKCuVKlXChg0bWG3z588vc0fOwp8tf39/qeZbWVnBzc1NomMXhawdWAkhYlPcv337lrVvY2ODGzduwMTEBABw6NAhVv/o0aMlcsKllB1UGSkjCisjzs7OihGEotQYGhpi0qRJUocIz5s3r9yExjZq1Ai3bt3C1atXUb9+faH+CxcuoG7dupgwYQK+ffumAAllx7Bhw9CuXTtmPzExEXPnzi3TcxYM7wWkj6gBxEfVSKOMGBoaQl1dndkPiYgCX0CkkiM5ORnnzp3D+PHjUbVqVRw4cIDVzxcQPAmNw7WHfkybubk5bt26hapVqwLI+y4dPHiQ6edwOBg5cqRUclDKAPks1JQOVTTTVK9eneWYR6FISkZGBjl27Bjp0KFDkSYcIK+K8IEDB8pNDZjc3Fxy4MABYmVlJfJ6tbW1ycKFC1Xqt6AwwcHBQv4y9+7dK7PzZWdnEy0tLeZc9evXl/oY4kw1ly5dkvgYV998IxoGJsxcNeNqpNnKW+Tqm29i5wgEAvL27Vuybt060q5dO5YzroGBAcvZ++qbb6TZylvEev4lom5qSwAQnrY+2XH2NuuY9+7dY11Dp06dpL4fFMmhPiMKJD4+nn7YKTIhNDSULFq0iFStWrVIpaS8hQinp6eTtWvXFllbZPPmzUxpeFEkJCTIT2ApWbhwIet6HB0di7yW0lIwIobH45UohNXNzU3o7xAdHS3R3KtvvhGb+ZeIhpk9M5erpUds5l8iNvMvsRSStLQ0cunSJTJlyhRiY2Mj9jP/999/Cx3fev4lUn3ueQKeGuGoaxHz4euFjj9q1CjWcY4ePSr1vaBIDvUZUSCBgYGsfWqioZQUOzs7/PPPP/jy5QtjplFTUxMal5ycjF27dqFJkyZwdnbG1q1bER8frwCJZYO2tjbmzp2L0NBQ/P7779DQ0GD1x8bGYubMmXB0dMTJkydBiPByv6enJy5evCgvkaVi4cKFsLW1ZfaDg4OF/ElkSUFzCp/PF8oOLQmFTTXaunoIS1Mv1tTCFxAsvfgOBABX24BpF2SmQsDPBQD8eeAWNm/Zgm7dusHY2Bg9e/bEjh07EB4eLva47969w6RJkzB58mSMnuCBuFu7EH97D1ICrgIAqvRbBM2qDgCApRffgS8gSE1NxZkzZ5hjGBgYoG/fvlLcBUqZIR/dqHSo2srIpk2bWJr3kSNHFC0SpRwhbYjwrVu3VD5EODw8nIwYMYKVq6Pg1rhxY3Lnzh3WnFGjRhENDQ2pTAny5PLly0ImqM+fP5fJuQ4ePMg61+bNm6U+RmFTDUdDh1jPv1SsqcU3JJZY/3/VQtfpV7E8cLhEt0EXomZc9KqftJt2zWakivtfzDnzN9+QWLJ//37W2AkTJpTmtlIkgK6MKBDqvEopS8zMzDB37ly8f/8eDx8+xKhRo6CtrS00LisrC8ePH0fHjh1Ro0YNLF++HJGRkQqQuPRYW1vj0KFDePnyJTp37izUnx+R06NHD7x58wZAXi2W7Oxs9OvXD1evXpW3yMXSvXt39O/fn9nPyMjAjBkzRK7ylJbSpoUHgLdJatC0dGD2SXY6cuIiEZOUCY8jL3EtKFrkvB8pmcz/DVsOg+X4nTAfvRmGrUYg9+cX5MbL1ilZzdAMOrWai5SjsMM
rTf+uPFBlpAwouASqqamJ2rVrK04YSrlFVIhw4ciJfMLCwrB48WJYW1ujZ8+e8Pb2VskQYWdnZ1y/fh03btxAw4YNhfqvXLmCBg0aYMyYMfj69SsAIDs7G+7u7rh27Zq8xS2WTZs2QU9Pj9m/dOkSzp8/L/Pz1K5dm3UeacN7800tOg6tWO1pHx4hX3XKN4UUxlRfi/m/eiVzqFeuBk0ze1Ry+w3mI9aj2tRDMO4yDW5tOwqZ40oCR01dZHtOQgzu37/P7NesWVNsyDJF/lBlRMbk5OSwYtydnJxE2vgpFFmSHyLs5+eH169fY8aMGUWGCPfr1w/VqlVT2RDhTp06wd/fH0eOHIG1tTWrjxCCAwcO4MmTJ0xbVlYW+vbtixs3bshb1CKpVq0ali5dymqbPn06UlNTZXoeHo8HFxcXZv/Dhw9ITk6WeL5fWDyikzKhU7vF/1s40LB0gLpxXrVeAiA6KRN+YcJ+Sq62xrAw1IK4LB5qekao1aYvHt6+gdjYWJw+fRrDhw8XKmJXGG9vb4SHh+PjpxA4/34QVcfvhOU4Lxg07sMaxwFgYaiFwHsXWO00t4hyQZURGfPhwwdkZ2cz+9REQ5E39evXx+bNm/Ht2zccP34cHTp0EDnux48fWLduHRwcHNCqVSscPHgQaWlpcpa25HC5XAwbNgwfPnzAhg0bYGxsXOT4rKws9OnTB7du3ZKThJIxY8YMVlLEyMhIIQVFFhRcNSOE4OXLlxLPzTe1qBmYwKT3fFSdehAWI9ZD16GlyHEF4XE58OxVBwCEFJL8fc9edcDjcqCvr48BAwbg8OHD+PHjB27duoXp06fDyspK6LgHDx6EtbU1atawx6rRnaBeuRo0TKzA0zUSOv7iHg44XCDRGYfDwYgRIyS+fkrZQ5URGVPYS51mXqUoCi0tLQwePBi3bt1CaGgoFi1axCR+KsyjR48wevRoWFhYYPLkyXj+/HmZ+C6UBZqampgzZw5CQ0Mxf/58aGlpiR2bmZmJXr164fbt23KUsGjU1NTg5eXFavv3338Z3xdZURq/kYKmFl3HVlDTE634FRxXkK51LeA13AXmhux+c0MteA13Qde6FkJz1NXV0aFDB2zZsgVfvnzBy5cvsWTJEuY31cfHh4lcLO74OvGfWJE5HTt2FKngUBQHh6jAL05ycjIMDQ2RlJQEAwOD4icokLlz52L9+vXM/r1799CmTRsFSkSh/ILP5+P69evYu3cvLl68iNzcXLFj69evj3HjxmH48OHFrjooC0+ePMHQoUOLDAkF8kKHL1++zMqGqmgmTpyIPXv2MPstWrTAgwcPwOXK5p0xNDQUNWrUYPYHDhyIkydPSjSXLyBoueYOYpIyIeqBwUHeg//R/PbgccWbPvgCAr+wePxIyYSpvhZcbY2LHC+OsLAwXLhwATweD9OmTSv2+KNHj2ZlXT169CiGDh0q9Xkp0iPp85sqIzKmc+fOuHnzJrOfkJBQrO2TQlEE379/x6FDh7Bv374i/UY0NTXh7u6O8ePHo127djJ7OMqSnJwcLFu2DCtXroRAIJBojra2Nq5cuYK2bdsCkN2DsqTEx8ejdu3aiI2NZdr27t2LcePGyeT4hBBUrlwZCQkJAABbW1t8/vxZ4vnXgqLhcSTPtFPwoZF/h8StcCia1NRUmJubMyZIAwMDREdHQ0dHR8GSVQwkfX4r36+KCkMIYZlprK2tqSJCUVryQ4SDg4Px8OFDjB49WuQPdFZWFk6cOKHUIcJnzpzB/fv3izTRFCYjIwM9evTAgwcPcC0oGi3X3MGQPU8x80QAhux5ipZr7ogNVy0LjI2NWauqADBv3jyWclIaOBwOy1QTFhaGuLg4ieeXxNSiDJw5c4blCzVo0CCqiCghdGVEhkRHR8PS0pLZ79OnD3x8fBQnEIUiJcnJyThx4gT27t1bpE8Bl8tF165dMW7cOPTq1YtVAE2R5ObmIjg4GH5+fvDz88Pz588RGBgIPp8vdo6
Wtg4q9fOEZjUnpi3j8wvo2DUCIN83fkII2rZtiwcPHjBtY8eOxb59+2Ry/L/++gurVq1i9q9du4YuXbpIdQxFryBJS9u2bVkhvb6+vjSkV45QM40CuHr1Krp3787sL1mypEy84ikUeRAYGIh9+/bhyJEjRaaWNzU1xahRozBu3DilzKmTkZGBV69e4fnz54ySEhISwhrD0dCG6W9LoVUtL+oj+tBsqOlXgXEnD1SrasHyhSjrh/Hbt2/h7OzM8ud5+PAhWrZsWcQsyTh37hwr0dry5cuxcOHCUh9XWfn8+TPs7e2Z/Vq1auH9+/c0pFeOUDONAiiceZVG0lBUmfwQ4aioKCaTqygKhwgfOHBAqUKEtbW10bx5c8ycORNHjx7Fp0+fEBcXh+vXr2PC7D+hXcMVHHVN/DjticzIYKS9uw8OTx3pH33xbe9kfHp4Ac8+55kz5GHOcXJywh9//MFq8/DwkEmSusJJ8UqSiVWVKOi0CtDcIsoMXRmRIUOGDMGJEyeY/dDQUNjZ2SlQIgpFtoSFhWH//v3477//EBUVJXacvr4+hgwZgvHjx6Nx48ZK+wA4HxCFmScCQAgBPyUW2bFfEXflXwjSEljj6ru2xKy/12HZ/TihaJKycOBMT09HnTp18OXLF6Zt7dq1mDt3bqmOSwiBubk5fvz4AQCoWrWq0vn/yAqBQAA7OzvmHnI4HERERKBatWoKlqxiQVdGFEBB51V9fX3Y2NgoTBYKpSywtbXFsmXLmCrC/fr1E5lhOCUlBbt374arqysaNGiALVu2KGUV4fy8GBwOB2oGVaBlWQsaJtWFxgX6PcL4Pm2R5HcORMD2PymYDj0nV7xvijTo6Ohg69atrLa///4bERERpTouh8NhrY5ERUUhOlp+Trry5P79+yxlrlOnTlQRUWKoMiIj0tPT8fHjR2a/QYMGShkCSaHIAh6Ph+7du+Ps2bOIjIzEunXrxPqLvHnzBjNnzoSlpSWGDBmCW7duSRx+W9YIpSrn8iDIFs4iCgCCnCwk3P0PMYf/QPaPMABgFBMCIPjKfpx/GCAz2Xr16oU+fX6lNk9PT8eMGTNKfdzCyc+krVOjKtCieKoFNdPICD8/PzRt2pTZnzp1KrZt26ZAiSgU+UIIga+vL/bu3YtTp04hPT1d7FgbGxuMGzcOo0ePVvjbasH8Gemh/siMfAtwuOBwuOBwOOjdsBr44ODym+8AhwsQgtzk7yDZmcj47A+zoauR/u4+kp6cxHbv+5jSt7XMZIuIiICjoyPrXl64cAG9evUq8TEvX76Mnj17Mvvl0dE+JSUF5ubmzH0zMDBATEyMyOrWlLKFmmnkDHVepVR0OBwOWrRogf379yM6Ohq7du2Cq6uryLHh4eFMFeEePXrg3LlzrJpO8qRg/gxt+8YwajMKRq1HwLHnOBzfuR4Ht66Bx4zfYdC0Pwyb9oN+o55IC7qDtLd3IMhIxk/vlUh6kpfJ1EBDtr4x1atXx99//81qmz59eqkchEuTFl5VOHPmDEuBGzx4MFVElB2iAiQlJREAJCkpSdGiiGXq1KkEeau1BADx8/NTtEgUilIQGBhIZs6cSYyNjVnfkcKbqakp+eOPP0hwcLBC5MzlC4hvSCzxeRVJfENiSS5fwPTFxScQHQt7omlZm+jW7UB4BlVEXoPfc3+Zy5WdnU3q1q3LOs+CBQtKdUwrKyvmWFWqVCECgaD4SSpE69atWffL19dX0SJVWCR9flNlREa0aNGC+eBzuVySnp6uaJEoFKUiIyODHD9+nHTs2LFIpQQAadGiBdm/fz9JTU1VtNgMq/edLlbuJ0+elMm5Hz58yDqPmpoaCQoKKvHx3N3dWccLDw+XobSKJSQkhHVttWrVKnfKlioh6fObmmlkgEAgYKpHAnmJdeiSIIXCJr+K8M2bN/H582csXrxYbBXhx48fY8yYMbCwsMCkSZPg5+en8CrC88cOgPuIiUWOkUUuEFG0bNkSY8eOZfZzc3M
xZcqUEt+TwvlGypMT66FDh1j7NLeIakCVERkQHh6OlJQUZt/Z2VlxwlAoKkDBEOErV64UGyLctGlTJkRYmnoqsubork1wdHQU219WyggArFmzhlU9+cGDB0IPXkkpr34jAoGAleiMw+FgxIgRCpSIIilUGZEBBfOLANR5lUKRFB6Ph27duuHs2bOIiopiMrmKQhlChLW1tXH48GGRihOAMnXCNTExwdq1a1ltf/zxR4nyt5TX8F6aW0R1ocqIDCgcSUNXRigU6TE1NcUff/yBd+/e4dGjRxgzZozI6qrZ2dk4ceIEOnXqBHt7e/zzzz8is4jyBQRPQuNwPiAKT0LjwBfIxszTqFEjLFmyRGRfWa6MAMCYMWPQvHlzZj82NhYLFiyQ+jhGRkasmi3+/v5Kk/ulNBTOLTJmzBjFCEKRGppnRAb06dMHFy5cYPa/ffsGCwvlLKdNoagS+VWE9+3bBz8/P7HjuFwuunTpgvHjx6Nnz5648zEOSy++Q3TSrwRmFoZa8OxVRyYp23Nzc9GyZUs8e/aM1X7mzBlWIbqy4M2bN2jYsCGrEnFJKtEWLl/x8eNH1KxZU2ZyypvCuUUMDQ0RHR1N/fcUDM0zIkcKroxUqVIF5ubmCpSGQik/GBgYYOLEiXj27BkCAwMxc+ZMlt9EPgKBAFevXkX//v1hamGJQeOmIeLzJ9aYmKRMeBx5KXFRO0IIvn79ips3b2Lr1q3Yvn0706empoZDhw4JPejKemUEAOrVq4fZs2ez2iZPnsyq8isJ5c1v5PTp0zS3iApDlZFSkpiYyLJROjs7U89tCqUMqFevHjZt2oSoqCicOHFCbBXhpPg4JPudw7e9Hog5Mg9ZMSEA2DVkCppsMjMz8ebNG5w+fRr//PMPhg0bhkaNGkFfXx/Vq1dH586dMXv2bFaGZSAvam7dunWsNnkoIwDg6ekJKysrZj8wMBBbtmyR6hjlzW+Epn9XbUR7YVEkhmZepVDki5aWFgYNGoRBgwYxVYT3798v0m8kKyoYPG19EEIgyEhGTtxXfAyIxPCQs0iO+YL3798jLCys2BDZRYsWCT28AWDKlCk4f/48bt68CQB4FvIdNULj4GprDB637F5K9PT0sGXLFri7uzNtnp6eGDhwoMQOmy4uLuBwOMy1q/LKSEhICB4+fMjs165dW0h5pCg5ZZzvRCYoc9KzzZs3sxLsHD58WNEiUSgVjtzcXHLlyhXi1qE7AZfHfB+1rJ2JUfsJhKtjWGzCMnFbtWrVSHh4uNjEWYdvvSA8LT0CgBh3nkKs518izVbeIlfffCvTaxYIBKRnz54sWfv37y/VMRwdHZm5Ojo6JDc3t4ykLVsWL17Mug+rVq1StEiU/yPp85s6sJaScePG4b///mP237x5g7p16ypQIgql4vIkNA4DN11D2ts7SHl9A5VaDoOuYyvkJEQj+bkP0t7cAsnNKtGxtbW1YWdnB3t7e9SoUQP29vZI4BnB62UqMqPeI+7yRhh1mAiDxr2ZKsBew11k4jArjvDwcNSpUwcZGRlM2+XLl9G9e3eJ5o8aNYqVqyQoKAhOTk4yl7MsEQgEsLW1RUREBIA8Z+aIiAixCfUo8kXS5zc105SSgjlGNDQ0xJZRp1AoZY+rrTGqWZojRrcf9Ju4I99TRN3IApU7e8Co5VCQdzeQ+foyYmNjpTp2RkYG3r59i7dv3wp3crjgqGshI+QZDBr3BgHAQZ5/Sqc65mVmsrGxscHixYvx119/MW3Tpk1DUFCQyLDowjRu3JiljDx//lzllJF79+4xigiQl1uEKiKqB3VgLQU5OTmsH6a6detCXV1dgRJRKBUbHpcDz151AABcDgcczq+fOA4Ano4h9mxahYiICHh5eaFGjRqyOTERgORk/v8s/28CEJ2UCb8w6ZOSScPvv//OygobFhaGlStXSjS3PKSFp46r5QOqjJSCDx8+ICvr15IvdV6lUBRP17oW8BruAnNDLVa7uaEWYzbR1tb
G5MmT8f79e5w9exbNmjUTe7wRI0Zg0KBBaNy4MYyMjIo8t5Z9I6G2HymZIkbKDg0NDXh5ebHa1q5di/fv3xc7t0GDBqxssqrmxJqcnIwzZ84w+4aGhujTp48CJaKUFGqmKQU0koZCUU661rVApzrm8AuLx4+UTJjqa4mMcOHxeOjXrx/69euHx48fY926dbhw4QIruqZOnTqsLKcJCQkIDQ3Flcev8O/Zh8hJjEZuYgxyE6KhbiwcyWKqryXUJmvatGmDkSNHMiaXnJwcTJkyBbdv3y4y1YC2tjbq1q3LmJtfv36N7OxsaGholLnMsuDMmTMsfxmaW0R1oSsjpYCmgadQlBcelwM3+8ro41wVbvaVi/XbaNGiBXx8fBAcHIyJEydCU1MTAHDy5EnWOCMjIzRu3BgLp4+HQ7dRqNJ9FsyHrka1qQehY//L7MFBXtZXV1vhJG1lwbp161grN3fv3sXRo0eLnVcwZDkrKwtBQUFlIl9ZQE005YcSKSPbt2+HjY0NtLS00LRp0yLTNBfkxIkT4HA46Nu3b0lOq3QULpBXv359xQhCoVBkRu3atbFr1y58+fIFixYtQkREBD5+/Cg0rqB/SmE1J3/fs1edMs03UhBTU1OsXr2a1fb7778jISGhyHmq6jdCc4uUL6RWRk6ePIk5c+bA09MTL1++RIMGDdClSxf8+PGjyHnh4eH4448/0KpVqxILq2wUXBmpXr16sfZkCoWiOpiZmeGff/5BRESE2MgUSfxT5Mn48eNZ/i8/fvzAwoULi5yjqmnhC0YBAXlF8Wj2a9VF6jwjTZs2RZMmTbBt2zYAeTHeVlZWmD59utjqkXw+H61bt8bYsWPx8OFDJCYmwsfHR+JzKmOekZiYGFYxvN69e+P8+fMKlIhCoSgKvoAU658iLwICAtCoUSOmCi+Hw8HTp0/h6uoqcnx2djYMDAwYZ3xnZ2e8evVKbvKWBJpbRHUok0J52dnZePHiBasmBJfLRceOHfHkyROx85YtWwZTU1OMGzdOovNkZWUhOTmZtSkbhU001HmVQqm4SOufUpY4OztjxowZzD4hpMhCehoaGqzfrzdv3rCcQpWRu3fvsnKLdO7cmSoiKo5UykhsbCz4fD7MzMxY7WZmZoiJiRE559GjR9i3bx/27Nkj8XlWrVoFQ0NDZitYEEpZoM6rFApFWVm2bBnr4fzq1Svs2LFD7PiCfiN8Pl/o903ZoI6r5Y8yjaZJSUnBiBEjsGfPHpiYmEg8788//0RSUhKzff36tQylLBl0ZYRCoSgr+vr62LRpE6tt0aJF+Pbtm8jxquQ3kpycjLNnzzL7NLdI+UCqPCMmJibg8Xj4/v07q/379+8wNzcXGh8aGorw8HD06tWLacu3Y6qpqeHDhw+wt7cXmqepqcmE1SkrBd8c9PT0YGtrq0BpKBQKhU3//v3RtWtXXLt2DUDey+Hs2bOFQpUBYWVEmSNqTp8+zTIjDRkyBFpaZZ/LhVK2SLUyoqGhgUaNGuH27dtMm0AgwO3bt+Hm5iY03sHBAW/evEFAQACz9e7dG+3atUNAQIBSml8kISMjAx8+fGD2GzRoAC6XpmyhUCjKA4fDwbZt21gP6lOnTuHGjRtCYx0dHVkRQ8q8MkJNNOUTqZ+gc+bMwZ49e3Dw4EEEBwfDw8MDaWlpGDNmDABg5MiR+PPPPwEAWlpaqFu3LmurVKkS9PX1UbduXZXJ8gcA586dY7IyBgUFMSs8ADXRUCgU5cTe3l4otHfq1KnIzGSnqOfxeHBxcWH2379/j5SUFLnIKA0hISF49OgRs+/g4CA2SoiiWkitjAwaNAjr16/HkiVL4OzsjICAAFy7do1xao2IiEB0dLTMBVU0y5Ytw6hRo5CWlkbTwFMoFJVh7ty5rGriISEhQsnRALYTKyFEKcN7Dx48yNofPXo0zS1STpA6z4giUIY8Iz179sTly5fh6OgIW1tbXLlyhel79uwZnJ2d8ejRI7x+/RqzZs2
iXxAKhaI03LlzBx06dGD2NTQ08ObNG9SqVYtpO3bsGIYNG8bsr1+/Hr///rtc5SwKgUAAGxsbJqCB5hZRDcokz0hFJv8DHxwczFJEAMDT0xOVK1dGhw4doKGhQRURCoWiVLRv356laGRnZ2Pq1KmsgoDKnhb+7t27rMhKmlukfEGVEQmpVk24Gmc+165dQ2pqKqpXr47x48fLUSoKhUKRjA0bNsDQ0JDZv3XrFiuyxt7entVf0Ik1ISEBFy5ckI+gYqCOq+UbqoxISFHKSD6LFy9W+pBkCoVSMTEzM8PKlStZbbNnz0ZSUhKAPLNHwRDf0NBQJCQkIDAwEI0bN0ZgYKBc5S1I4dwilSpVorlFyhlUGZGQ4pQRe3t7jBo1Sk7SUCgUivRMmjSJpXDExMRgyJAhTGXfwvlG/vrrLzRr1gyfP38WyrwtT2hukfIPVUYkpDhlxNPTE+rq6nKShkKhUKSHx+Nh586drLxIV69eReXKleHq6ooXL16wxu/cuZNRAhSpjFATTfmHKiMSUpQy4uDggKFDh8pRGgqFQikZjRo1wtSpU1lthBA8f/4ct27dEjtPUcrIp0+fWLlFHB0dhZxtKaoPVUYkRF9fX2xY0tKlS8Hj8eQsEYVCoZSMf/75R2QJj6JQlDJCc4tUDKgyIgWiVkfq16+PAQMGKEAaCoVCKRmGhob4999/pZqjCGWEz+ezlBEul4vhw4fLXQ5K2UOVESkQpYwsW7aM1qWhUCgqx6BBg9CpUyeJxurr60NbW7uMJWLDFxBsP3oekZGRTFuXLl1gaWkpVzko8oE+RaWgsDLSuHFj9O7dW0HSUCgUSsnhcDjYvn27ROkI5L0qci0oGi3X3MFfa7ay2p3b03De8gpVRqSgsDLyzz//UNslhUJRWWrWrIkFCxYUO06eysi1oGh4HHmJqB9xSP/4hGnnauriaIwprgWVv9pnFKqMSEVBZaR58+bo0qWLAqWhUCiU0rNgwQLUqFGjyDHyUkb4AoKlF9+BAEh7/wgkN4vp06nTBlw1DSy9+A58gdKXVKNICVVGJIQvIEjm6jP7S5fRVREKhaL6aGlpYceOHUWOMTU1lYssfmHxiE7KBJC3EqJexYbp06vbAQRAdFIm/MLi5SIPRX6oKVoAVeBaUDSWXnyHL59iAQCa1etjsR9Brlk0uta1ULB0lIoCX0DgFxaPHymZMNXXgqutMXhcqhBTSk+nTp0waNAgVq2agshrZeRHSibzf12HltB1aIn4u/+Bw1OHhkUtkePKAy9evEBERATc3d2LHFeefwOoMlIM+fZLAoCnbwIA0HVqj8ivkZi0Pwm7xrhRhYRS5uQrxPlvjQBgYagFz1516OePIhM2btyIK1euICUlRahPXsqIqb5winc1XSOkBt6ArmNraFSxFjtO1cjJyYG3tzc2b94MX19fXL9+vcjx5f03gEMK1pBWUpKTk2FoaIikpCSxicfKAr6AoOWaO8wfnxCCyC1DIcj89WXlqmvC0qwKTExMULlyZWYrvF+wzcDAgJp4KBJTUCEuSP4nyGu4S7n4MaIonq1bt2LGjBlC7WfPnkW/fv3K/Pz5v7kxSZnM5z03JQ5RO0aDo66Byp2moEbLHng0v73KrgjExsZiz5492LFjBxO2bG5ujq9fv0JNTfT6QP5vgICfC35qHHj6JuBweSrxGyDp85uujBRBQfslkBcKx9XSYykjgpwsREZGsmLhi0NNTQ3GxsbFKjAF942NjWmW1wrIz9g4zPU6h9SvX5CbGAN+WgKMO00GABDkKSRLL75DpzrmKvvjTFEepkyZggMHDuDly5es9o/JXDwJjStzswCPy4FnrzrwOPISHOR9xtX0K0PLuj4yv7xG7JV/4aIZjaxMN+jo6JSZHJIijdkkMDAQW7ZswdGjR5GZyTYzDR06FDweD/Hx8YiIiGBtX75E4MrTN8iI/w5+ajwAAstJe6Feybxc/QZQZaQIRNklBdnppT5ubm4ufvz4gR8
/fkg1z8jISGLlJX+jlS1LR25uLs6cOYPWrVuXSbIlgUCAyMhIhIaGCm2fP39GYmKi0JxKrUeCq5n3Q1zQoc/NvrLM5aNULPIL6TVt2hQFF803XnyBne/V5WIW6FrXAl7DXVgmCd06bZD55TUA4Ib3CTRr9hanT59G7dq1ZXbeFy9ewMXFReJVa0nMJnw+HxcvXsTmzZtx7949scc6evQodu3ahbS0NInOnZvwDeqV8tL5l5ffAGqmKYInoXEYsucpqy3p2TkI0hPBT0+GIDMZgowUmGnmIC0pAQkJCRAIBHKTTxJ0dXUlVl7y9/X09Cq8GSk1NRX79u1jUmaHhYWV+J5kZmYiLCxMpMIRFhaG7OxsqY5n3GU60oJug/BzAC4XHC4PNcwMYF5JF2pqauDxeFBTUxP6v6i+CRMmwMnJqUTXRSm/9Bw8GpdP/krDrmFeE+YjN4DLyQvAlIdZoOCqgw6y0auZI7KyfoX66unpYffu3RgyZEiJz0EIwc2bN7FixQoYGhriwoULEs0rznS6tpcdIp5ewbZt2xAeHl5i+cRRucds6NXtwGrbPNgZfZyryvxcpYWaaWSAq60xLAy1WPZLw6a/7KYcAOaGWoz9UiAQIDExEXFxcYiNjUVcXByzFbUv7cNIGtLS0pCWloaIiAiJ56irqxfr91J4v1KlSuXCjBQdHY2tW7fCy8uLWZWYN29esYpIfHy82NWNqKgoyFLn52rponL3mYi7sglZUcEAgLeRwFspjzNnzhzUqVNHZnJRygd8AcH3Wu7g6pyHID0RAJD9PRTZ3z5As6qj3MwCPC6H9abfs2dPnD17ltlPTU3F0KFD8eDBA/z7779SrQILBAJcvHgRK1aswPPnzwEA//33X7HzkpKS8PZdMKZt9Eb818/IiY+EeiULGLUfBwDIjv2KlJcXMXjjHQhyZB/xw9U1gratC9QMhEOtVd2pl66MFEO+BgyApQXLynGIEIK0tDSplJe4uDikpqaW/KLKAA6HAyMjI6n8YCpXrgwNDY0yk0kae+67d++wfv16HD16VEg5fPHiBZydnREVFSVS4QgNDRVpTikNOjo6sLe3h52dPfzi1JGlUwVqlcyhVskCagZVwOGpgQj4SHnug8SHR/JWSaRg6tSp2Lp1a4VfAaMIk78inPr2LuIubYC6mT1Mus+Ehqkda9zxCc3kahbw9vYW60TbsGFDnD59Gvb29kUeg8/n49SpU1i5ciWCgoKYdi6Xi+/fv8PExASEEHz79g3v379HcHAw829wcDCio4Wzv6pXsYFRm1FI9r+AzPBXJbo2dXV1VKlSBVlZWYiPjxf58qJt1whV+i0Gh8deQyj8UqxsSPr8psqIBChjSFVWVpZUyktsbCwSExNl+oYuC/T19aVSXkxMTKCjo1PsQ1SSvxkhBPfv38e6detw5coVscdycHBAWFgYa4lYFlSpUgX29vYiNzMzM+Yai1OI5zfVwZ7lfwg5HYrD2NgY+/fvR+fOnalPEUWI8wFRmHkiAIQQZIQ8g3YNV3A4wvkx5W0WyMrKgpmZGZKSkkT26+jpY+HqLZjvMUrooZydnY3Dhw9j9erVCAkJEZpbuXJl9OjRg1E+RIU3i4WnjqqT9iEnLgI5P78g+2c4cn6GA4lfkZ0pm9WRmk4NkNV5Ebga2mXyUlyWUGVExpSHZDN8Ph8JCQlSm5Fyc3MVLToLTU3NIp12v2Wq4fCreHC19MHV1gdXxxBcTR3G3r1tcH2kfvDF+vXr4e/vX2ZycrlcVK9eXaSyYWdnJ9VnuTjlKicnBytWrMDy5cvB5/MlOqauri66desGd3d39OjRA4aGhlJfI6X8IcpXThTyXhkBgPHjx2Pfvn1FjjF3c8fu7f+iV0NrZGRkYN++fVi7di2+fv1aJjJxtQ1gMWYr1PTZ9+LI2CYw4yQhMDAQb968gZ+fHx49eiSdogPA3t4evr6+ePmDr3QvxZJAlRGKTCCEICUlRWozUnp66aOOZAs
H0NQBh8sDsjOkNmuIQ1NTEzVr1hSpcFhbW0NdXV0m5wEkU4hfvHiBkSNH4t27d1IdW11dHe3bt4e7uzv69OkDc3NzmclNUS1E5fooiCLNAnfv3kX79u1FCMWFXv3OUK9iDQ0Ta6gbV0NnzQ+4fGwvvn//LpNz29jYwMHBAbUdHHDhCwcZ2mZQq2wFng5biS/q/ty9excTJ04UuTojiipVquDJkyeM+UkVX4qpMkJRKBkZGUUqK6LaZO13ISs4HA50dHRgYGCAypUrw8LCApaWljh27BhycnLg6uqKCRMmoHPnzowZSZFkZmZiyZIlWL9+fYnMchwOB82aNYO7uzvc3d2LLaJGKX+Uta9cSREIBKhevTqioqKE+ow6TICuU3ukvLiIlBcXIMiU3q9OQ0MDtWrVgqOjIxwcHODo6AhHR0fUqlWL9b0uzf3JysrCP//8gxUrVhQpi66uLu7du4fGjRtLfR3KBFVGKCpHbm4u4uPjpfKDiY+Pl9gsIS+0tLRY5iNJ/GDKIivv48ePMWrUKISGhjJtgwYNwogRI+Dt7Y0LFy7g58+fxR6nbt26jGLi7OxMnV4rCMroKwcAc+fOxfr16wEAPF0j8NMSwNOrDM3qdZER4geSnVGi4w4aNAhHjx6VOCqwpPfn3r17mDJlCoKDg8WOUVNTw8WLF9G1a1fJL0BJocoIpUIgEAiQnJzMKCePgsKwyvs5BBkp4GckI+PTU+TEflG0mMWSn5VXmpBqIyMjsemj80lLS8O8efOYqqyurq549uwZgDwfosePH8Pb2xve3t748qX4+2RjY4O+ffvC3d0dLVq0KBfh3BTxKKNZ4NWrV3BxcYGGmT1M+sxH0uPjqNR+AjggyE2IRm5SDHISopGbGANr9VQkfv+Kb9++SXTsy5cvo3v37hLLIs39+fHjB/744w8cPny42OMeOHAAo0aNklgOZYYqI5QKSWF7d07cV2TFhCA34RtyEr4hN/4b+InfwM+ULNOhslOpUiWJVl8+ffqEpUuXIjU1FUlJSUKrG4QQvH79mlFM3rx5U+y5TUxM0Lt3b7i7u6Njx440MociFwghsKvpgPSGQ6FtX7QJI9/JNj09HeHh4Uzun4J5gApGypmamiIwMFCmhQEFAgF2796NP//8UyJT9IoVK/DXX3/J7PyKhiojlApLcfbcHcMaorG5Oj59+sTaPn78iE+fPkmckllV0dLSgqmpaZHKS3Z2NgICAvD48WO8fPmyWN8TPT09JjKne/fuNDKHUqZcu34Df7/g4ntyVqmdbAUCAb59+8YoKFZWVujUqZNM5Hz16hUmT54MPz8/oT47Ozts3boVvXv3ZkzNU6ZMwbZt28qVKZQqI5QKTUntuYQQxMTEiFRUQkJChApcSYOGhga0bZzBsXACh8sFPyMZ/PRk8JO+gxA+BOnJQFYqOFkpZZqVtyTweDzweDzk5OQUq5ioq6ujVatWGDBgANzd3WlkDqVMUFYnWyDvmbV48WJs27ZNqESIhoYG5s+fjz///BPa2tqwsLBATEwM+vXrh1OnTklt+lRGU1pBqDJCqfDI+ksqEAgQFRWFT58+4cOHD5g7d27JVlE4XOjUbgGDpv2REfocSb4nYdR+HPRdeoLD4eDY+Kaob66l8ll588lfibG3t0f16tWLdewty6y8lPKFsjnZEkJw6tQpzJ49W2S21g4dOmD79u2sAn8NGjSAgYEBbty4AW1tbanOp2zXLwpam4ZS4Slc26K0cLlcWFlZwcrKCgEBAVIpIubm5qhsaY0vuYZQM64KdeOqyPkRjqTHxwEiQMKtXciKeIPK3WbgZ2oW9PRMoKenBxsbG4nPoaxZeTMzM5ly6JKgp6cnVWHHypUrQ1dXt1wtbVMko2tdC3SqY64UKwOfPn3C1KlTcfPmTaE+c3NzbNy4EYMHDxb6nLZr1w6enp4lUkQ8jrwEPyfP34WrrgkAiEnKhMeRl0qdlVUUdGWEQpGSoKAgNGrUSMiUYmB
ggFq1agltNWvWhIGBASuzJSEEMYdmIzuGnfxIrZI5dh84gjF92BU5ywppsvIWbFO2rLwaGhpS10WqVKkSuFzhNOcUijRkZmZi9erVWL16tVDJCC6XiylTpmD58uVi/aj4fL5UppmsrCw89n2Ckcv/Q+ynV8j69h6Vu82EnlM7Zowy1auhZhoKpQzg8/kYNWoU0tLShJQOU1PTIt/OC0f68NOTEHtpAzLD2DVlNDQ0sGHDBkydOlUp3/bzs/KKU2BiY2MRGhqKT58+ITo6ulR+NmUJl8tlwqklUV7yN1lm1aWoNjdu3MDUqVNFZlRt3Lgxdu7ciUaNGpXqHNnZ2fDz88Pdu3dx7949+Pr6Cn2ndBxaoUqf+UJzFZGyvzBUGaFQlJDCTneECJD89AwSHx4BCNvRrX///ti3b5/KR6aEhITAx8cHZ8+exbNnz4o1C3G5XGhra4MQooRlBcBk4pXGlKTorLyimDlzJpydnfHbb79BT09P0eKoFFFRUZgzZw5OnTol1GdoaIiVK1di0qRJJcrDk5OTA39/f0b5ePz4cbHfA56+CapNOSDULu9ihqKgygiFoqSIcjrTjf+I7+fXIu5HDGusnZ0dTp06Veq3K2UhJiYG58+fh7e3N+7cuYOcnKJrBOVH5rRu3RoNGzaEQCBQ2ay80vrBGBoalunK2J49ezBx4kTo6elh0KBBGDt2LNzc3JRyNU5ZyM3NxbZt27BkyRKRBe+GDx+OdevWSRVBlpubi5cvX+LevXu4e/cuHj16JJUzOlfXCDq13GDcYQI4PPaqHV0ZkTFUGaGUN0RF+sTF/sSIESNw48YN1lgNDQ1s3LgRU6ZMKVcPiqSkJFy+fBk+Pj64cuVKsQ7BHA4HzZs3Z1LT29nZiRxXOCuvpE69ymZO4vF4EmXiLbhvbGxcbFbefFJTU2Fpacl6qDo4OGDs2LEYMWJEsQ9UZQ8plTVPnz6Fh4cHAgIChPocHBywY8cOtGvXTnhiIfh8Pl6/fo27d+/i7t27ePjwIZKTk0skk2Y1R5gNXSv0u0B9RsoIqoxQKgoCgQCrVq3CkiVLhPIT/Pbbb9izZ4/Km21EkZmZiVu3bjE1c2JjY4udU69ePUYxadCgQakVtfT0dKnDqUv6EClL8rPySqLArF69GidOnBA6Bo/HQ48ePTB27Fh0795dyE9GFUJKZUV8fDz+/PNP7NmzR8jEqKWlhcWLF+OPP/4QG5IuEAjw5s0bRvl48OCBVEVBjY2NkZmZKWSq0dLWQeWRW6BeyVzp8qwUhCojFIoKc//+fQwZMkQoV4G9vT1OnToFFxcXBUlW9uTm5jI1c3x8fCSqmWNra8vUzGnevLncauZkZ2dLXdwxISFBSNFUZszMzDBy5EiMHTsWDg4OjN9T4QeHsj0ESwshBIcOHcLcuXNFFpRs164d9u3bB1tbW1a7QCDAu3fvGOXj/v37iI+Pl/i81tbWqFevHhISEuDn5yfWlLlt2zbYt+mn9EohVUYoFBXnx48fGD58uFDeAg0NDfz777/w8PAoV2YbURBCEBAQwNTMCQoKKnZOlSpVWDVzNDU15SCp5AgEAiQmJkptRlKGrLzN3Nzww6I5cqo3RW7yDwCARhUbpl+ZzAOl4e3bt5gyZQoePHggst/Q0BDx8fHgcrkghOD9+/eM8nHv3j2JVvbyqVatGtq1a4dWrVohPT0dJ06cwNOnT4uc06ZNG9y5cwdcLlfpzWVUGaFQygECgQArV66Ep6en0Nv0wIEDsWfPngr1nQgJCWEUkydPnhQ7Xk9PD927d2dq5qjqvSKEIC0tTXmy8nJ5gEAANSNLWIzbDi6P7aeiDI6TJSEtLQ3//PMPNmzYUGQunaZNm2LMmDGM8vH9+3eJz2FhYYF27doxm46ODnbv3o2dO3ciJiam2Pk6OjoIDAyEvb29xOdUJFQZoVDKEffu3cOQIUOEfqxq1KiBU6dOoWHDhgqSTHFER0fjwoULEkfmaGhooEOHDnB
3d0fv3r1lWplVWSkuK+/BgwcRFxcn8fE4HA4IVw3g/7rXldqOgWHT/qxxyhBSKi0XLlzA9OnTJc4ULClmZmZo27Yto3zUrFmTWdHMzs7GkiVLsGPHDpHROaLYvHkzZsyYIVMZyxKqjFAo5Yzv379j+PDhuHXrFqtdU1MTmzZtwqRJk4TMNj9+/ICpqak8xVQIiYmJuHLlCry9vXH16lWZReaUZ3x9fdGiRYtix7Vp0wZt2rTB69evcf78eaF+nkEVVJ2wGxy1X06uyrwyUtisYcZNwexZM3HhwgWZHN/ExISlfDg4OBRrTk1OTsaBAwewcePGIn2kWrVqhXv37qlU5mCqjFAo5RA+n4+VK1fi77//FjLbDBo0CLt372Z9R5YsWYLatWtj2LBh8hZVYWRkZODWrVvw8fGRODKnfv36jGJSv379cu+Lw+fz0bhxY1aYqpqaGho2bAg9PT3cvXuXaZ81axbOnDmDyMhIoePoOrWDUfvx4OnkRXgpu89IwSggws9B8nMfJPuegCAnq/jJYjA2NkabNm0Y5aNOnTolUhaePn2Kvn37ijX5aGlpITAwEDVr1iyxrIqAKiMUSjnm7t27GDJkiNAPV82aNXHq1Ck4OzsDAPr27Yvbt2/j5cuXKvcjJgsKRuZ4e3tLtARva2sLd3d39O3bV66ROfJk+/btWLlyJdzc3ODm5oZmzZrBxcUFjx49Qrdu3YpNGsczMIVJl6nQsvuVjE/Zo2kKRgFlRrxB/A0v5MSV3CRTq1YtnDp1CvXq1Sv1SsXRo0cxbtw4odo2Bdm4cSNmz55dqvMoAqqMUCjlnJiYGAwfPhy3b99mtWtqamLz5s2YOHEi7OzsEB4eDhcXF/j6+ipdZIk8IYTg1atXjGLy9u3bYueYmpoykTkdOnQoN/cvISEBRkZGrLa3b9+iefPmReZO4XA4mDlzJloPmYq1t78odUhpQfLrQuWtiOTi255JyE2S3OlUHGvXrsXcuXNLPF8gEGDRokVYtWoVq11LS4uVhM/NzQ0PHz5UScVY4uc3UQGSkpIIAJKUlKRoUSgUpSI3N5csXbqUcDgcgv+Xu8nf+vfvz9qfOXOmosVVKj5+/EjWrl1L3NzchO6dqE1fX58MGjSInDhxotz9FsXExBBra+sir9/JyYk8ffqUmZPLFxDfkFji8yqS+IbEkly+QIFXUDS+IbHEev4lZqvSbzH7+ngahKOhTdTU1SX6LBTcTp8+XSKZUlJSSN++fYWOZ2lpSfz9/YmdnR0BQDQ1Ncn79+9lfEfkh6TPb7oyQqGUA+7cuYOhQ4cWG2J4/vx59O7dW05SqQ7R0dGsmjlFhXUCeZE5HTt2RN++fVU+Mic9PR3t2rWDn59fkePMzc2xbt06DBs2TOV8as4HRGHmiQBW249zy5HzIwzGnTygbd8YQF4UULc6VZCWliZyS01NFWrj8/n466+/oK2tLbE8ERER6N27N16/fs1qb9KkCXx8fGBpaYnRo0fj4MGDpV59UTTUTEOhVDBiYmIwbNgw3LlzR+wYY2NjBAQEwMrKSo6SqRYlicxp0aIF4wBbOCOnMiMQCPDbb7/h3LlzEs9p2bIltm7dyvglqQJPQuMwZA87kRg/PQkcdS1w1X+Z3uQRBfTkyRP07dsXP378YLUPHjwY//33H6PU7N27F3v37sXjx49V0jyTD1VGKJQKCJ/PR69evXD16lWxY1q2bIm7d+9KXFCtIpMfmZNfM0eSnBwNGjRgFJN69eopxSqCuCyd8+bNw7p16yQ6BpfLhZubG7p3744ePXqgQYMGZSy17Mj3GYlJyhRKYw/ILwro8OHDGD9+vFA23WXLlmHRokWsz0pISAiys7NRp06dMpNHHlBlhEKpQBBCcPPmTfz9998SZSZdtGgR/vnnHzlIVn7Izc3Fo0ePmJo5kkTm2NnZMTVz3NzcFPKGK66oXZPMl9i6bF6Rc83MzNC1a1d0794dnTp1EnJ6VSXyo2kAyL2wnEA
gwF9//YU1a9aw2rW1tXH48GH0799fzEzVhyojFEoFgRCCtWvXYtGiRcX6OuTD4XBw69YttG/fvoylK5+QEkbm9OnTB+7u7mjfvr1cInPEFbXLDHuJ76f/Bgg7Vw2Xy0WzZs3QrVs3dOvWDQ0bNlSpBFvFoYhqw6mpqRg+fLhQwriqVaviwoUL5broJUCVEQqlwvHz508cP34chw4dwosXL4odb25ujtevX1eIDK1lzadPnxjFpLgiZwCgr6/Pqpmjr68vc5kKhrMWJPtnOGKOzAPJzitJX6VKFUb56Ny5M4yNjWUuizIhz8JyX758Qe/evfG/9u48LKqy/QP4d2ZgBpBFFlkFCfcVF3DBNUMpzS1T01xSU3PtzV+ZZWblRmZmuWSSu+b6KmluqagF4iubpqCYCyDCgOzDPsvz+4OYPMywDM4K9+e65oI55zln7nnEOfc851n++usvzvaePXsiNDQUbm7GNwxa2ygZIaQRi4+Px759+7Bv3z6kpaVVWy4oKAhnzpwBA8+oV/40JWlpaZw1c+o6MqdyzRxtJYdqO20W5kK8/0PwrGxh2cIXVm364thnb6Nv62ZaeU3yr2vXrmHMmDEqHVUnTpyIHTt2aDT6xpRRMkIIgVwuR1hYGPbu3Yvjx4+juLhYpczMxZ8h3mmQyUxgZUry8vJw+vRp5cgcdfX/PD6frxyZM3r06BcamVN1OGvJw2gUxP4Gq1Y9UXT3DzgEzobQ2cckF7Uzdnv37sWsWbNUOqquWrUKn376qVF0atYXSkYIIRwSiQTHjx/Hnj17OGuPgC+A66SvIfJop9xk7FN7m6KSkhJcuHABJ06cwKlTp3Q+MqeyZaT47/+hPOMByp7eQ2lSHCr+dRncZmyGsJm3US9qZ2oq5xxZt24dZ7uVlRX27t3boDuqVqeu1+969UzasmULvL29YWFhgV69etU4WU5ISAj69+8Pe3t72NvbIzAwsNbJdQgh2mdjY4Np06YhLCwMSUlJWLlqFSycmgMKOZ6d+gaK0kIwxiDNears8PjlqQTIFUb/fcUkWFpaYuTIkdi1axfEYjEuX76MRYsW1Tjny61bt/DFF1/A19cXrVq1wocffoiIiIha144BgJ4vOcDNzgKWXp1R+NfFfxIRoHIsCY8ngJtdxS058uIkEgnGjBmjkog0b94c4eHhjTIR0YTGycjhw4exePFirFixArGxsfD19UVQUJDKfbFKV65cwcSJE3H58mVERkbC09MTQ4cOxdOnT184eEJI/bRo0QKvvPUenGf8CNcp38LSxw+5V3aj8E4Y0n6ei9wruyCXliI9vxQ3HucYOtwGx8zMDIMGDcL333+P5ORkREdHY9myZTXOKfHo0SN8++236NevHzw8PDB79mycPXu22sXVBHweVozoAL7ICo5B81X283gV+6lv0ItLSkpC3759cerUKc72Xr16ISoqCt26dTNQZCZE03nme/bsyebPn698LpfLmbu7O1u7dm2djpfJZMzGxobt2bOnzq9Ja9MQon2hcamc9To85u5mfEsb5RoZZk1dmfP4lSw0LtXQoTYqiYmJ7Ouvv2a9e/eu09ootra27K233mKHDx9mBQUFKuc7ezuN9V5zkTXpMIhz3I7TEQZ4dw3Pn3/+yZo1a6by7/L222+zkpISQ4dncHW9fmvUMlJeXo6YmBgEBgYqt/H5fAQGBtZpoiWgYh0EqVRa4/CxsrIyFBQUcB6EEO1ytrHgPM+/fhSKEonyuSxPjMwjy7Hty8XIysrSd3iNVps2bbBkyRJERkbi6dOn2Lp1K4YMGVLtjLkFBQU4dOgQJkyYgGbNmuH111/Hjh07lK3Vr3ZyQ/jHg3Fk1zbYNP130jIZ4yHyYTbdhnsBu3fvxuDBg/Hs2TPO9tWrV2Pfvn2wsLCo5khSlUbJSFZWFuRyucqiUC4uLhCLxXU6x8cffwx3d3dOQlPV2rVrYWdnp3zQOhqEaF9ln4LKRvqm/SfDustQlXLnQo+
gXbt22LdvH5jx93dvUNzd3TF37lz8/vvvyMzMxL59+/DGG2/AyspKbfmysjKcPn0a7777Ltzc3DBgwAB89913eJKSjGE92+K9j/+ddfer0/cwMeQ6+n0dhnN30vX1lhoEuVyOJUuWYPr06ZBKpcrtVlZWOH78eKMbMaMNep1aLzg4GIcOHcKJEydqzBg/+eQT5OfnKx9PnjzRY5SENA6VfQqAivEVAksbOL62CC4T18DMgTvUMzs7G1OnTkVQUBAePXpkgGiJvb09Jk+ejP/+97/IysrCr7/+infeeafaVmaFQoE///wTixcvxksvvYSW7Tth+2/XIGz+T78UXsXHvzi/FHP3x1JCUkcSiQSjR49WWdPH09MTERERGDNmjIEiM20aJSNOTk4QCAQqy5RnZGTA1dW1xmPXr1+P4OBg/P777+jSpUuNZUUiEWxtbTkPQoj2vdrJDT9O7g5Xu3+/HFh4dUH390Mwcc5/YG5uzil/4cIFdOrUCevWreN8IyT69fzInIyMDISFhWHhwoU1tiI/uheP/IhfUJ6aAICHkgcVoxpp5FTdJSUlISAgAL/99htne+/evXHjxg2TWsnY2Gg8z0ivXr3Qs2dPbNq0CUBF9u3l5YUFCxZg6dKlao9Zt24dVq9ejfPnz6N3794aB0nzjBCiW9VNkR0fH49Zs2ap7RPm6+uLkJAQ+Pv7GyBiog5jDLGxscqp6RMSEqot6zjsP7DuzL1dTnOOVC88PBxjxoxR6T81efJkhISEUP+QauhsnpHFixcjJCQEe/bswd27dzF37lwUFRVh+vTpAICpU6fik08+UZb/+uuvsXz5cuzcuRPe3t4Qi8UQi8UoLCysx9sihOiCgM9Dn5aOGNXVA31aOiqHe3bs2BHh4eHYunWryvopt27dQu/evfHBBx/Q/2cjwePx0KNHD6xatQrx8fFITExEcHAw2nTmDi3lmQlh2bqPyvGZklKVbY2RXMEQ+TAbv958isiH2dixYycGDx7MSUR4PB7Wrl2LvXv3UiKiBfWagXXz5s345ptvIBaL0bVrV/zwww/o1asXAGDQoEHw9vbG7t27AQDe3t5ITk5WOceKFSvwxRdf1On1qGWEEMN7+vQpFi5ciBMnTqjs8/Lywo8//ohhw4YZIDJSm8iH2Ri34TeUPLiB4vuR4IuaoNlo1ZZsahnhruzLFHLkXdmNgiju33yTJk1w4MABjBo1ykBRmg6aDp4QohMnTpzAggUL1C7AN2HCBGzcuLHWPmREvypX8BXnl1ZMgsEYZ7QHD4CrnQXCPx7cqCdBO3cnHXP3x4IBUJQVI+vUNyh5GMUp4+XlhZMnT8LX19cwQZoYnU4HTwhpvMaMGYOEhATMmzdPZfji4cOH0b59e+zYsYOGARuRqiOnqiYiABr9bKxyBcOXpxL+SUSKIN7/oUoiYu3VAZHX/0eJiA5QMkII0ZidnR22bNmC8PBwdOzYkbMvLy8P7777Ll5++WXcv3/fQBGSqtSNnAIqWkRoQUTgxuMc5crVPKEVRB7tOfubdHwZDuNWIbnYXN3h5AWpn9KPEELqICAgALGxsVi3bh1WrlzJWTL96tWr6NKlCz777DMsWbIEQqHQgJESoCIhGdLBVe3Iqcbu+c67srx0CN3aQpTzFGVP4tF04DTY9hoLHo9HnXx1hPqMEFJFdcNcSc0SExMxZ84cXL16VWVfx44dERISgj59VEdwEGIMIh9m483go8iPPIKie3/CbeoGCGycUJ52H5Yt/ZTlqJOvZqgDKyH18HxP+kpudhZYMaJDo2/GrgvGGHbu3IkPP/wQeXl5nH08Hg9z587FmjVrYGdnZ5gACVHjzp07WLlyFY4cPQIwButuw+E4dC6nDHXyrR/qwEqIhip70j+fiAA0XbYmeDweZs6cibt372LChAmcfYwxbN26FR06dEBoaKhhAiTkOXFxcRg7diw6d+6MI0cOA4yBb2kL+/6TOeWok6/uUcsIIfh36GPVRKR
STd+KZDIZsrKykJGRgczMTGRkZHB+Lyoqwk8//VTjStUN1enTpzFv3jykpKSo7BszZgw2bdoEDw8PNUcSojs3btzAypUrVaZ1B4CFy79GlGUPah3VErpNQ4gGIh9mY2LIdQCAorwUUMggzc+EojgPTC6DojgP8qI8DPWxhKCsQJlwZGRkIDs7u8ZhrEeOHMG4ceP09VaMTmFhIT7//HN8//33UCgUnH02NjYIDg7Ge++9Bz6fGmqJbkVERGDlypU4f/682v3du3fHjRs3AB6f+o1pCSUjhGjg15tP8f6hmwCAp9tnQ5b7z4ReAiEgL6/+wFp89NFHWLdunRYiNH1RUVGYNWsWbt26pbIvICAA27dvVxkmTIg2XL16FV999RXCwsJqLBcREYGAgAA9RdU4UJ8RQjTgbPPv3As8vkD5u8DKFs7jvoS580san9PS0hJt27ZFfHw85HK5VuI0Zf7+/oiKisK6detgaWnJ2Xft2jV069YNy5cvR2kpDZ0kL44xhgsXLmDAgAEYNGhQrYnIlClTKBExIGoZIQTc6bKf7lwA6bMkAIDA2gHN5+8FmALmSZGQ3TiIpKQkjc9vbW2N7t27w8/PD/7+/vD394ePj4/KDKaNxcOHDzF37lxcuHBBZV+bNm2wfft2DBw40ACRkYYgLS0NEyZMQHh4eJ3K29jYIDExEW5u1CdE26hlhBANcKbLfq5lhCnk/0yfzcem5Qtx7949bNy4EY6Oms0zUFhYiD/++AMbNmzAxIkT0apVKzg6OmLo0KFYtmwZTpw4gdTU1EYzhXrLli1x/vx57Nu3D05OTpx99+/fx6BBgzBr1izk5uYaKEJiytzd3XHkyBF888036NChQ63lP//8c0pEDIxaRgh5zrk76XjztZdRlJoIAOBbWKPn56EqPenz8/Oxfv16bNiwAcXFxVp7fVdXV07riZ+fH5o1a6a18xujrKws/N///R/27t2rss/FxQXff/89xo8f32hbkciLefLkCXr37q12YUcAaNu2Lf766y+aIVhHqAMrIfXUJyAA1yMjAQBWTaxRUFBQbU/69PR0fPXVVwgJCVHpF3Lw4EFkZmYiOjoaUVFRSExMrFfLR4sWLZSJib+/P3r06NEgJw27ePEi5syZg0ePHqnsGz58OLZu3QovLy8DREZMVWJiIoYMGYInT55UW+bcuXMICgrSY1SNCyUjhNTTgAED8OeffwKo6IRal5aP+/fvY9myZTh27Jhy288//4yZM2cqnxcUFCA2NhZRUVGIiopCdHQ0Hj9+XK8Y27Rpw2k96datG6ysrOp1LmNSXFyMr776CuvXr1dJ7po0aYLVq1djwYIFEAgE1ZyBkAqxsbEICgpCVlZWtWVGjRpFE/DpGCUjhNTT4MGDcfnyZQCAubk5Z/G32vzvf//Dxx9/jKtXr+Ktt97CwYMHayyflZWF6OhoZetJVFQU0tM1n+lVIBCgY8eOnFs8nTt3Ntmm51u3bmHWrFmIiopS2efn54eQkBB07dpV/4ERk3DlyhWMHDkSEolEuU0oFOLgwYNYuHAh0tLSIBKJkJCQAB8fHwNG2vDV+frNTEB+fj4DwPLz8w0dCmkEhgwZwgAwAIzH42l8vEKhYGfOnGGvvPIKk8vlGh//9OlTFhoayj777DMWFBTEHBwclPFo8hAKhczf35/NmzeP7dy5k92+fZvJZDKN4zEUmUzGNm7cyJo0aaLy3gQCAVuyZAkrKioydJjEyPz6669MJBJx/l6sra3ZxYsXGWOMvfvuuwwAW758uYEjbRzqev2mlhFCqhg2bBjOnj2rfC6Xy+s1O2jlbYYXvaXAGENSUhLn9k5MTAznW19dWVlZoXv37pxbPK1atTLqzqEpKSmYN28eTp8+rbLPx8cH27Ztw5AhQwwQGTE2e/fuxYwZMzi3+BwdHXH27Fn4+/sDAEJDQ/H+++/j7t27DeLWprGj2zSE1NPIkSNx6tQp5fOysjKju92hUCiQmJjIub1
z8+bNek0Y1rRpU/j5+XFu8TRv3tyoEhTGGI4ePYpFixYhIyNDZf+UKVOwYcMGlWHCpPHYuHEjPvjgA842Dw8PXLhwAe3bt1duKywsxKVLlzBq1Ch9h9goUTJCSD298cYbOHHihPJ5UVGRSXyDkkqliI+PV7aeREVF4fbt25DJZBqfy9nZmdN64u/vD2dnZx1ErZnc3FwsWbIEP//8s8o+R0dHfPfdd5g8ebLaRIoxZlQJFtEOxhg+//xzrFq1irO9TZs2+P3339GiRQsDRWbc5Aqml/V3KBkhpJ7Gjx+Po0ePKp+b8t9daWkpbt26xbnFc/fu3XoNMfby8uK0nvTo0QNNmzbVftB1cPXqVcyePRv3799X2TdkyBBs27ZNpWPi7du3cf36dcyaNUtfYRIdeP4i6tREiP0bPse2bds4Zbp164Zz584ZRQJtjM7dSceXpxL0sjIxJSOE1NOkSZM4o2Cys7Ph4OBgwIi0SyKRIDY2Vtl6Eh0djYcPH9brXK1bt+a0nnTr1g1NmjTRcsTqlZaWYs2aNQgODoZUKuXss7S0xBdffIEPPvgA5ubmAIDz589j+PDhOH36NM0rYaKev4gyuRRZp79D8d0/OGUGDBiAkydPNsi5eLTh3J10vLcvGrKiPEAuhZmdCwCgsk3kx8ndtZqQUDJCSD1NnToV+/btUz7PyMho8N+wcnJyVIYYP336VOPz8Pl8dOjQgXOLp0uXLhCJRDqIukJ8fDxmz56Na9euqezz9fVFSEgI/P39sWvXLsyYMQM2NjYIDw9Hly5ddBYT0b5zd9Ixd38sGACFtBTPTqxF6eMYTpkRI0bg8OHDKgsxNjZyuRzp6elISkpCcnIykpKS/nkkIzwuAaV5mYBcCksfPziP+0J5HA+Aq50Fwj8erLVbNpSMEFJPM2bMwK5du5TPnz59Cnd3dwNGZBjp6emc1pOoqKgaJ5Cqjrm5Obp06aJMUPz9/dG+fXuYmZlpLVaFQoGffvoJS5cuRUFBAWcfn8/HokWLYGFhgeDgYABA8+bNcf36dXh4eGgtBqI7lQtZpueXQlFaiMxjX6Ls6V1OGadugXgSeRoWIuPqbK4LMpkMqampnGTj+Z8pKSl16itm5tAcHrO2qWw/OKs3+rTUbP2t6tT1+q29TwNCGoiqF8n6dABtCNzc3DBixAiMGDECQEVHweTkZE7rSUxMjMrFvyqpVIqYmBjExMQo7+1bWVmhW7dunD4orVq1qtcQaqAi4Zg7dy5GjhyJRYsW4fjx48p9CoUCGzdu5JRPTU3F66+/jj/++AM2Njb1ek2iPzce5/zbv0FgBlTpiGzTYySsXnkXcakSrV1EDamsrAxPnjypNtlITU2FQqF44deR5YvVduzOlGg+Ku9FUTJCSBWUjKjH4/Hg7e0Nb29vvPnmmwAqLvR///03p/UkLi4OJSUlNZ6ruLgYERERiIiIUG6zs7NDjx49OH1QvLy8NBoB4+Hhgf/+978IDQ3FggULarzVdPPmTUyYMAEnT57UaisN0b7nL458cwvYvzwT2ec3Q5r5GHb93oZdwFvg8XgGuYjWR0lJCZKTk1USjcrf09PTdbaCN9/SFkxaBiYvh43va4BCXpHgPcfZxkInr10T+h9ISBWUjNQdn89H27Zt0bZtW0yePBlARX0lJCRwRvD89ddfKp1Mq8rPz0dYWBjCwsKU25o1a6ayirGrq2utcY0ePRqDBw/Gp59+iq1bt1b7wX727FksXLgQW7dupWG/Ruz5iyOTS5EbtgMu479CyaNYWHd+RW05dZKTk/HLL79g6dKlOv33lkgkapONyp+ZmZk6eV0+nw8PDw+0aNEC3t7enJ/u7u448MsvCA7+GkwhR5NOgXAYModzfGWfkZ4v6b/DPiUjhFRByciLMTMzQ5cuXdClSxflQoGlpaW4ffs2J0FJSEiotan52bNnOHv2LGdG3ObNm3NaT/z8/GBvb69yrK2tLSZNmoTffvsNycnJ1b5G5TD
gjz76qJ7vmOhaz5cc4GZnAXF+KfIiDqE8KxmCJvbKRKSmiyhjDJGRkdi4cSOOHz+OmTNnvnAikpeXV+0tlKSkJOTk5LzQ+asjEAjg5eWlNtnw9vZG8+bNlaPHnnfz5k28/fbbuHXrlnKbbY/XOWUqa2TFiA46mW+kNpSMEFIFJSPaZ2FhoWzdqFRYWIi4uDhOH5QHDx7Ueq7U1FSkpqZyJqZr2bIlp/XE09MTK1eu5HRErsmSJUvg7e2NcePGaf7miM4J+DysGNEBM9YfQf71o+AL/x0tU91FVCqV4tixY9i4cSNu3Lih3P7222/X+FqMMWRnZ6vcOnn+Z239pOpLKBTCy8tLbaJR2bqhyS3F8vJyrF69GmvWrOF8jnXo6gfbtp0484y46miekbqiZISQKigZ0Q9ra2v0798f/fv3V27Lzc1FTEwMpw/KkydPaj3Xw4cP8fDhQxw6dAhARf8WCwvN7ntPmTIFHh4eCAgI0OyNEJ2TKxgs+Qzyy5sBpgB4/3Z0rnoRzcnJwfbt27F582aVPkOenp7o27cvxGJxta0aycnJKCoq0sn7sLS0rLZVo0WLFnB1da13J+6q4uLi8M477+Cvv/5S2ffZksUYP2GwXmZgrStKRgipgpIRw7G3t0dgYCACAwOV2zIyMjitJ1FRUXj27FmN52GM1dqJtqqysjKMHDkS169fR6tWrfQ2XTapWeVEZwmntqMgpaLljM/nY2ZfbwR2cFX+u9y7dw8//PAD9uzZg+LiYrXnevbsGaytreu1hlNdWFtbcxKMqslGs2bNdN43qby8HKtWrcKaNWs4CwZWcnV1xdixYyHg84xq5BElI4RUQcmIcXFxccHw4cMxfPhwABWJxpMnTzitJ9HR0cjPz3/h18rOzsarr76K1btCsTE8Qy/TZZPqVU50Vpp+HwXXjym3K8DDzogk+HnbI+zSRXz33XecfkXVedEkpGnTptW2anh7e8Pe3t6gHaFjYmIwffp03L59u9oyc+bMMbqFPwFKRghRQcmIcePxePDy8oKXlxfGjh0LoGKI8cOHDzkdZGNjY6v9hlyThw8fYmJgL1h3GQqL5h1g1bbito04vxRz98dqfbpsop5cwfDlqQQoZOXIPr0R4AsA+T8dnnmA5NZ5jN21ACWZSVp7TScnp2qTjRYtWhjtFPNlZWVYuXIlgoOD1baGVDIzM8OcOXOq3W9IlIwQUgUlI6aHz+ejdevWaN26NSZNmgSg4t/t3r17nATl1q1bKC8vr/V8rLwYkuhQlCbFKpMRhorOkl+eSsCQDq50y0bHKic6Y3IZXCauQdG9P5F78ScIrB0gL8xF9rlN9Tqvr68v2rVrpzbZ0Ne6StoUHR2N6dOn486dO7WWHTduHNzcjDORpmSEkCooGWkYzMzM0KlTJ3Tq1AnTp08HUPEN8vbt25w+KPHx8dUOMTaz5y4DwACk55fixuMco7rf3hBVTmDGF1kBIivY9hgBixa+kBVkojjhD/BFlih/lgyh5Ckkebl1Pu/LL7+M7777Tldh6115eTl6DH4dqVIr5CfFg5VV3/l2wYIFeoxMM5SMEFJFTcmIQqEAj8ejCbJMlEgkgp+fH/z8/PDee+8BqJgNNi4uDlFRUQi98Acirt+ALKdiFIald1e15zGVmT5NmboJzIROXhA6ecHKx0+57Zd3e6GljRx37tzBnTt3EB8fr/xdIpGonOP777/H2LFj0a9fP53Gry8Fti/hqmU/2I3uB/6t88ippsWoe/fu6NOnj56jqztKRkijV1ZWhsWLF+P9999HmzZt1CYjjDH8+uuv2L9/P44dO1bNmYgpsrKyQt++fdG3b1/0GjEFE0OuQ1FaiLKMhzC3V7+QniGmy25snp/oTN38uZUTnfXycYSAz4OLiwteeeXf2VgZY0hNTVVJUBISEjBjxgzcvHkTVlZWens/ulDZr4YBYLJy5F87VG3ZBQsWGPWXKEpG1KAhfY2LSCRCamoq2rdvj3Hjxql
MNx4WFoZVq1YhKioKixYtMlCURB+UF0AAli18VfYbcrrsxqZyorO5+2PBAzgJSV1mC+XxePD09ISnpydee+015Xa5XI6kpCQUFxcbJBkpKipCcXExmjVr9kLnkSsYdkc8Vo744pkJ0Wzs58g+vQHSzMcQNe+AstQEAICdvQPeeuutF45dl3hMV6vxaFFdlyDWhsox7doY0ieXy3H//n3ExMRgxIgRRtsTmwC7d+9W9iuoyZkzZzgfbKThqRxOCqi/ANJoGv3S5meyMZDL5fDz84NEIkGfPn2Uj86dO9d5dtWqdaIoLURB1K+QZqfA4bX/oCDyMOwCJuDZiTUoTYrD2OnzcWznZl2+rWrV9fpNychzKj+EqlZIXT6EZDIZEhMTlUulx8TE4ObNmygqKsJbb72FgwcP6ixu8uKys7Ph4uJS47A4CwsL5OTkwNLSstoypGFoaBdAU9fQWqsjIiJU+qw0adIE/v7+yuSkd+/ealtPnr9OKcqKIYk5hYIbx6EoL4Hb9B8gbOatLFvyKAaZx77Ef6/E4I0BXXX7pqpByYiG5AqGfl+HcT58CmJOQZabBp7AHDyBGWysLDD3lXYwNzNDbm4u0tLSkJqaiuTkZKSkpKgdMmhtbY0zZ87Aw8MDQqEQQqEQIpFI+btAINDJ+yGaGzx4MC5fvlzt/qCgIJw7d06PERFDamgXQGJcpk6din379tVYpmXLlpzWkw4dO2HQt38gPb8U5c+SkXnsC8gLKmYjtu76KhyDqoyWYQyyGweRfGm/wf5263r9pj4j/6gc0/684vuRKEv5d17/fADLLml23sLCQgwYMKDa/Xw+X22SUtM2bW2va1lzc3Oj7vikLWPGjKkxGaHbM42LsU2XTUyHQqFAXl4esrOzkZ2djZycHM7P7OxspKen13qeyjWX9u/fDwCwtGoChZMPRO7tIPJoB6u2/SCJOgGe0BJN+3EXAOQBAI+H7d+vM4kkmpKRf6gbqqcoLdT56yoUCpSWlupsrQRtMTc3N9pkSVutTKNHj66xg+qrr776QucnhJgWxhgkEgkniVCXWFT9PTc3F7q46VBSXASk3AYrK4bA2gE2fiNh7uAORWkRBE3sOWUNvQqvpigZ+Ye6oXo8Pt1CqSSVSiGVSg0dRo0EAsELJzrOzs7IzMxUObeDgwPCwsIQERHxQgmXmZlZo2hlIvpTXl5ulGuNGJuSkpI6JRRVtxnLpIeOjo4Y/PpYhPM6Qejio9xu1nlIxUrGz1k+vD3e6fuSSbSIVKI+I/+o7DPy/Jh2WUEWmLQETC4D5DLYCcow1CYdJ0/+iqSkJJ3EQRo+XbQKabvFSVvLmBPd+/DDD/HgwQO8+eabjWLUXnl5OXJycjRKKLKzs42+9VkdPp+PV199FdOnT8eIESNgZi5UuU49r3LoefjHg40mEaEOrPVQ1yF9jDFERkZi27ZtOHLkCMrKytSez9bWFm3btoVYLIZYLNZ7y4JAIEDTpk3RtGlT2NrawtbWFtbW1rCysoKVlRUsLS0hEolgbm4OuVyO8vJyzqOsrKxO257fXlZWppPmSaJfz7cyGWOyJBQKqZXpH48fP0br1q0hl8thbm6OIUOG4M0338TIkSPh6Fi3Pi/lMgX2RSYhOacYLRysMKWPN4Rmuk1I5XK5sl9FXROKnJwctbOqGoMmTZrA0dERjo6OcHBw4PxUt00mk8HX11ftCL7WrVtjxowZmDJlCjw8uBPvmdrQc0pG6knTIX1ZWVnYs2cPtm3bhgcPHnD2iUQipKenw97eHgqFArm5uUhPT0d6ejrEYrHan+np6SgoKNDpe1TH0dERrq6ucHNzg5ubm/L3qj9tbW1rvQA8n9jUJ6F5ke11LWvst5xI3RhzsqTPVqbJkyfjwIEDnG0CgQCDBw/G2LFjMWbMGDg7O6s9du2ZBIT8+RiK564EfB4wq/9L+GRYh1pfmzGGgoICjRKK7Oxs5OXlGeUXF5FIVOeEovJ3BwcHiEQijV5
nzZo1WLZsmfK5tbU1xo8fjxkzZiAgIKDGz1lTGnpOycgLqM+QPoVCgbCwMGzbtg2hoaHKbHfLli2YN2+eRq9fXFysbE2pLmERi8XIyMiodoEvXbG0tISrq2utiYuzs3OdJ/AxBMYYpFKp2uRl3bp1+Pnnn5Vlu3XrhlWrVuk1WaJWpobDzMxMZ4lO5fYHDx5g/fr11cbA5/MxYMAAjB07Fm+88Qbc3SsWAFx7JgE//fEYQMX/CSYrg6JEAkWJBPJSCV7xtsRAb6tak4ya5ucxFIFAoJI81CWxsLKy0nmLm1wuh4+PD1JSUjBgwABMnz4db775Jqytret+DhMZek7JiAGlpaVhx44d2L59O5ydnRETE6OT15HL5cjKyqoxYan8vbi4WCcxVIfH46FZs2a1trS4ubkZ3bLd0dHR8Pf3Vz7/5ptv8OGHHxokFplMppNER5vnMJYOfqTuAgICMHrMWGx6ZA++bUWLSd6f+2tc28SQ7O3tNUooHB0d69SKayjR0dEIDQ3FO++8g1atWhk6HJ2iZMQIyGQynD17FgMHDjR43BKJpNaWlvT0dDx79kzvsVlbW9easLi6usLJyUkvTd6MMbRo0QJPnjwBANy+fRudOnXS+euaKoVCAalUqpdk6UX6MhH1hG6tYdW2L1h5GfKv6XamaGtra40SCgcHB9jb29PkkCaMJj0zAmZmZhgxYoShwwAA2NjYwMbGBq1bt66xnFQqRWZmZo0JS+VPbX3AFxYW4u+//8bff/9dYzmBQAAXF5caE5bKnxYW9V9VlcfjYdSoUdi8eTMcXdxQYOEKuYIZZROoMeDz+RCJRBrfM9cnxlitfZmMocVJn61MAjNzmHu0h4V3d1h6d0NZxuM6H1vZr0KTDpsODg40BJlUi5IRwmFubg4PDw+VHtxVMcaQn59fa8IiFouRk5OjldjkcjnS0tKQlpZWa9mmTZvWmrC4ubnB3t5epSn33J10XCrxBgCUuXTGpJ//Z7Sdw0jd8Hg8mJmZwczMzKiXja9sZdI00bl48SJ+/PHHWs/foUMHDB06FEOHDsVjgSfWhSX/+9rScli26gW+hQ0Eljbg//MY37c9xvVtz0ksjLkOiWmi2zRE58rKypCRkVHrSCKxWKz3/gdCoZDTIVcqssO1pzLwmzRF7pXdcBr2H1i1DTDaYXOEKBQK+Pn5IS4uTmWfo6MjhgwZgqFDh2LIkCFo3ry5cl+5TIF2y89yRtFUxecB91a+pvNhvqThots0xGiIRCJ4eXnBy8urxnIKhQI5OTm1JizaHP5cXl6OlJQUpKSkqOzjiZrAwtsXQMV4fh6AL08lYEgHV7plQ4zG0aNHlYmImZkZ+vbtq2z96N69e7X9rIRmfMzq/5JyNI06s/q/RIkI0QtKRojR4PP5cHJygpOTEzp37lxj2crhz7XN2ZKZmVnv4c9CJy/wRf+O9GEA0vNLceNxDi2gRoyCVCrFgQMHsHDhQgwdOhQDBw6EjY1NnY+vnEfkReYZIUQbKBkhJsnKygo+Pj7w8fGpsZxcLsezZ8/qNJKo6vBngZ36SaLULapIiCGYmZnh5MmTL3SOT4Z1wP8Nbaf3GVgJeV69kpEtW7bgm2++gVgshq+vLzZt2oSePXtWW/7o0aNYvnw5kpKS0Lp1a3z99dcYNmxYvYMmpK4EAoGyT0jXrl2rLccYw6W/kjFty++QF+VCXpgDgbWD2rLqFlUkxBC0NY+G0IyPmf1rTuwJ0SWNU9/Dhw9j8eLFWLFiBWJjY+Hr64ugoCC1K50CwLVr1zBx4kTMnDkTcXFxGD16NEaPHo07d+68cPCEaAuPx8PLnVvA66WWsPTshCbtB8DCkzu3CA8VUy73fEl9kkIIIaR+NB5N06tXL/j7+2Pz5s0AKjodenp6YuHChVi6dKlK+QkTJqCoqAi//fabclvv3r3RtWtXbNu2rU6vSaNpiL6Y2iJUhBBizOp6/daoZaS8vBwxMTEIDAz89wR8PgIDAxE
ZGan2mMjISE55AAgKCqq2PFAxFLSgoIDzIEQfXu3khh8nd4erHfdWjKudBSUihBCiIxr1GcnKyoJcLoeLiwtnu4uLC+7du6f2GLFYrLa8WCyu9nXWrl2LL7/8UpPQCNGaVzu5YUgHV5NYhIoQQhoCoxxN88knn2Dx4sXK5wUFBfD09DRgRKSxEfB5NHyXEEL0RKNkxMnJCQKBABkZGZztGRkZcHV1VXuMq6urRuUBGP06F4QQQgjRHo36jAiFQvTo0QOXLl1SblMoFLh06RL69Omj9pg+ffpwygPAhQsXqi1PCCGEkMZF49s0ixcvxrRp0+Dn54eePXti48aNKCoqwvTp0wEAU6dOhYeHB9auXQsAeP/99zFw4EB8++23GD58OA4dOoTo6Ghs375du++EEEIIISZJ42RkwoQJePbsGT7//HOIxWJ07doV586dU3ZSTUlJ4ayFEBAQgF9++QWfffYZPv30U7Ru3RqhoaHo1KlTdS9BCCGEkEaEVu0lhBBCiE7oZJ4RQgghhBBto2SEEEIIIQZFyQghhBBCDIqSEUIIIYQYFCUjhBBCCDEoSkYIIYQQYlCUjBBCCCHEoCgZIYQQQohBUTJCCCGEEIPSeDp4Q6icJLagoMDAkRBCCCGkriqv27VN9m4SyYhEIgEAeHp6GjgSQgghhGhKIpHAzs6u2v0msTaNQqFAWloabGxswOPxtHbegoICeHp64smTJ7TmjQ5RPesP1bV+UD3rB9WzfuiynhljkEgkcHd35yyiW5VJtIzw+Xw0b95cZ+e3tbWlP3Q9oHrWH6pr/aB61g+qZ/3QVT3X1CJSiTqwEkIIIcSgKBkhhBBCiEE16mREJBJhxYoVEIlEhg6lQaN61h+qa/2getYPqmf9MIZ6NokOrIQQQghpuBp1ywghhBBCDI+SEUIIIYQYFCUjhBBCCDEoSkYIIYQQYlANPhnZsmULvL29YWFhgV69euHGjRs1lj969CjatWsHCwsLdO7cGWfOnNFTpKZNk3oOCQlB//79YW9vD3t7ewQGBtb670L+penfdKVDhw6Bx+Nh9OjRug2wgdC0nvPy8jB//ny4ublBJBKhTZs29PlRB5rW88aNG9G2bVtYWlrC09MTH3zwAUpLS/UUrWn6448/MGLECLi7u4PH4yE0NLTWY65cuYLu3btDJBKhVatW2L17t26DZA3YoUOHmFAoZDt37mTx8fFs1qxZrGnTpiwjI0Nt+YiICCYQCNi6detYQkIC++yzz5i5uTm7ffu2niM3LZrW86RJk9iWLVtYXFwcu3v3LnvnnXeYnZ0dS01N1XPkpkfTuq70+PFj5uHhwfr3789GjRqln2BNmKb1XFZWxvz8/NiwYcNYeHg4e/z4Mbty5Qq7efOmniM3LZrW84EDB5hIJGIHDhxgjx8/ZufPn2dubm7sgw8+0HPkpuXMmTNs2bJl7Pjx4wwAO3HiRI3lHz16xKysrNjixYtZQkIC27RpExMIBOzcuXM6i7FBJyM9e/Zk8+fPVz6Xy+XM3d2drV27Vm358ePHs+HDh3O29erVi82ZM0encZo6Teu5KplMxmxsbNiePXt0FWKDUZ+6lslkLCAggP38889s2rRplIzUgab1/OOPPzIfHx9WXl6urxAbBE3ref78+Wzw4MGcbYsXL2Z9+/bVaZwNSV2SkSVLlrCOHTtytk2YMIEFBQXpLK4Ge5umvLwcMTExCAwMVG7j8/kIDAxEZGSk2mMiIyM55QEgKCio2vKkfvVcVXFxMaRSKRwcHHQVZoNQ37r+6quv4OzsjJkzZ+ojTJNXn3o+efIk+vTpg/nz58PFxQWdOnXCmjVrIJfL9RW2yalPPQcEBCAmJkZ5K+fRo0c4c+YMhg0bppeYGwtDXAtNYqG8+sjKyoJcLoeLiwtnu4uLC+7du6f2GLFYrLa8WCzWWZymrj71XNXHH38Md3d3lT9+wlWfug4PD8eOHTtw8+ZNPUTYMNSnnh89eoSwsDC8/fb
bOHPmDB48eIB58+ZBKpVixYoV+gjb5NSnnidNmoSsrCz069cPjDHIZDK89957+PTTT/URcqNR3bWwoKAAJSUlsLS01PprNtiWEWIagoODcejQIZw4cQIWFhaGDqdBkUgkmDJlCkJCQuDk5GTocBo0hUIBZ2dnbN++HT169MCECROwbNkybNu2zdChNShXrlzBmjVrsHXrVsTGxuL48eM4ffo0Vq5caejQyAtqsC0jTk5OEAgEyMjI4GzPyMiAq6ur2mNcXV01Kk/qV8+V1q9fj+DgYFy8eBFdunTRZZgNgqZ1/fDhQyQlJWHEiBHKbQqFAgBgZmaGxMREtGzZUrdBm6D6/E27ubnB3NwcAoFAua19+/YQi8UoLy+HUCjUacymqD71vHz5ckyZMgXvvvsuAKBz584oKirC7NmzsWzZMvD59P1aG6q7Ftra2uqkVQRowC0jQqEQPXr0wKVLl5TbFAoFLl26hD59+qg9pk+fPpzyAHDhwoVqy5P61TMArFu3DitXrsS5c+fg5+enj1BNnqZ13a5dO9y+fRs3b95UPkaOHImXX34ZN2/ehKenpz7DNxn1+Zvu27cvHjx4oEz2AOD+/ftwc3OjRKQa9ann4uJilYSjMgFktMya1hjkWqizrrFG4NChQ0wkErHdu3ezhIQENnv2bNa0aVMmFosZY4xNmTKFLV26VFk+IiKCmZmZsfXr17O7d++yFStW0NDeOtC0noODg5lQKGTHjh1j6enpyodEIjHUWzAZmtZ1VTSapm40reeUlBRmY2PDFixYwBITE9lvv/3GnJ2d2apVqwz1FkyCpvW8YsUKZmNjww4ePMgePXrEfv/9d9ayZUs2fvx4Q70FkyCRSFhcXByLi4tjANiGDRtYXFwcS05OZowxtnTpUjZlyhRl+cqhvR999BG7e/cu27JlCw3tfVGbNm1iXl5eTCgUsp49e7Lr168r9w0cOJBNmzaNU/7IkSOsTZs2TCgUso4dO7LTp0/rOWLTpEk9t2jRggFQeaxYsUL/gZsgTf+mn0fJSN1pWs/Xrl1jvXr1YiKRiPn4+LDVq1czmUym56hNjyb1LJVK2RdffMFatmzJLCwsmKenJ5s3bx7Lzc3Vf+Am5PLly2o/cyvrdtq0aWzgwIEqx3Tt2pUJhULm4+PDdu3apdMYeYxR2xYhhBBCDKfB9hkhhBBCiGmgZIQQQgghBkXJCCGEEEIMipIRQgghhBgUJSOEEEIIMShKRgghhBBiUJSMEEIIIcSgKBkhhBBCiEFRMkIIIYQQg6JkhBBCCCEGRckIIYQQQgyKkhFCCCGEGNT/A8jDIM/BgHgmAAAAAElFTkSuQmCC", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over untrained policy\n", + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "td_init = env.reset(batch_size=[3]).to(device)\n", + "policy = policy.to(device)\n", + "out = policy(td_init.clone(), phase=\"test\", decode_type=\"greedy\", return_actions=True)\n", + "actions_untrained = out['actions'].cpu().detach()\n", + "rewards_untrained = out['reward'].cpu().detach()\n", + "\n", + "for i in range(3):\n", + " print(f\"Problem {i+1} | Cost: {-rewards_untrained[i]:.3f}\")\n", + " env.render(td_init[i], actions_untrained[i])" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Trainer\n", + "\n", + "The RL4CO trainer is a wrapper around PyTorch Lightning's `Trainer` class which adds some functionality and more efficient defaults" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. 
Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n" + ] + } + ], + "source": [ + "trainer = RL4COTrainer(\n", + " max_epochs=3,\n", + " accelerator=\"gpu\",\n", + " devices=1,\n", + " logger=None,\n", + ")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Fit the model" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "val_file not set. Generating dataset instead\n", + "test_file not set. Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | TSPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 710 K \n", + "2 | baseline | WarmupBaseline | 710 K \n", + "--------------------------------------------------\n", + "1.4 M Trainable params\n", + "0 Non-trainable params\n", + "1.4 M Total params\n", + "5.681 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "c15144babb9f45dba930de73d048e1f6", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over trained model (same states as previous plot)\n", + "policy = model.policy.to(device)\n", + "out = policy(td_init.clone(), phase=\"test\", decode_type=\"greedy\", return_actions=True)\n", + "actions_trained = out['actions'].cpu().detach()\n", + "\n", + "# Plotting\n", + "import matplotlib.pyplot as plt\n", + "for i, td in enumerate(td_init):\n", + " fig, axs = plt.subplots(1,2, figsize=(11,5))\n", + " env.render(td, actions_untrained[i], ax=axs[0]) \n", + " env.render(td, actions_trained[i], ax=axs[1])\n", + " axs[0].set_title(f\"Untrained | Cost = {-rewards_untrained[i].item():.3f}\")\n", + " axs[1].set_title(r\"Trained $\\pi_\\theta$\" + f\"| Cost = {-out['reward'][i].item():.3f}\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can see that even after just 3 epochs, our trained AM is able to find much better solutions than the random policy! 🎉" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "# Optionally, save the checkpoint for later use (e.g. 
in tutorials/4-search-methods.ipynb)\n", + "trainer.save_checkpoint(\"tsp-quickstart.ckpt\")" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "rl4co", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.8" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/1-quickstart/index.html b/examples/1-quickstart/index.html new file mode 100644 index 00000000..44d77127 --- /dev/null +++ b/examples/1-quickstart/index.html @@ -0,0 +1,3735 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + RL4CO Quickstart Notebook - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/2-full-training/2-full-training.ipynb b/examples/2-full-training/2-full-training.ipynb new file mode 100644 index 00000000..737ce881 --- /dev/null +++ b/examples/2-full-training/2-full-training.ipynb @@ -0,0 +1,937 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Training: Checkpoints, Logging, and Callbacks" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "\n", + "In this notebook we will cover a quickstart training of the Split Delivery Vehicle Routing Problem (SDVRP), with some additional comments along the way. The SDVRP is a variant of the VRP where a vehicle can deliver a part of the demand of a customer and return later to deliver the rest of the demand.\n", + "\n", + "\n", + "\n", + "\n", + "\"Open\n", + "\n" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Installation\n", + "\n", + "Uncomment the following line to install the package from PyPI. 
Remember to choose a GPU runtime for faster training!\n", + "\n", + "> Note: You may need to restart the runtime in Colab after this\n" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "# !pip install rl4co\n", + "\n", + "## NOTE: to install latest version from Github (may be unstable) install from source instead:\n", + "# !pip install git+https://github.com/ai4co/rl4co.git" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "import torch\n", + "from lightning.pytorch.callbacks import ModelCheckpoint, RichModelSummary\n", + "\n", + "from rl4co.envs import SDVRPEnv\n", + "from rl4co.models.zoo import AttentionModel\n", + "from rl4co.utils.trainer import RL4COTrainer" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Main Setup" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Environment, Model and LitModule" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n" + ] + } + ], + "source": [ + "# RL4CO env based on TorchRL\n", + "env = SDVRPEnv(generator_params=dict(num_loc=20))\n", + "\n", + "# Model: default is AM with REINFORCE and greedy rollout baseline\n", + "model = AttentionModel(env,\n", + " baseline='rollout',\n", + " train_data_size=100_000, # really small size for demo\n", + " val_data_size=10_000)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Test greedy rollout with untrained model and plot" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Tour lengths: ['29.45', '14.26', '21.15']\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over untrained policy\n", + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "td_init = env.reset(batch_size=[3]).to(device)\n", + "policy = model.policy.to(device)\n", + "out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n", + "\n", + "# Plotting\n", + "print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\n", + "for td, actions in zip(td_init, out['actions'].cpu()):\n", + " env.render(td, actions)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Training" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Callbacks \n", + "\n", + "Here we set up a checkpoint callback to save the best model and another callback for demonstration (nice progress bar). You may check other callbacks [here](https://lightning.ai/docs/pytorch/stable/extensions/callbacks.html)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "# Checkpointing callback: save models when validation reward improves\n", + "checkpoint_callback = ModelCheckpoint( dirpath=\"checkpoints\", # save to checkpoints/\n", + " filename=\"epoch_{epoch:03d}\", # save as epoch_XXX.ckpt\n", + " save_top_k=1, # save only the best model\n", + " save_last=True, # save the last model\n", + " monitor=\"val/reward\", # monitor validation reward\n", + " mode=\"max\") # maximize validation reward\n", + "\n", + "# Print model summary\n", + "rich_model_summary = RichModelSummary(max_depth=3)\n", + "\n", + "# Callbacks list\n", + "callbacks = [checkpoint_callback, rich_model_summary]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Logging\n", + "\n", + "Here we will use Wandb. You may comment below lines if you don't want to use it. 
You may check other loggers [here](https://lightning.ai/docs/pytorch/stable/extensions/logging.html)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We make sure we're logged into W&B so that our experiments can be associated with our account. You may comment the below line if you don't want to use it." + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "# import wandb\n", + "# wandb.login()" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "## Comment following two lines if you don't want logging\n", + "from lightning.pytorch.loggers import WandbLogger\n", + "\n", + "logger = WandbLogger(project=\"rl4co\", name=\"sdvrp-am\")\n", + "\n", + "\n", + "## Keep below if you don't want logging\n", + "# logger = None" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Trainer\n", + "\n", + "The RL4CO trainer is a wrapper around PyTorch Lightning's `Trainer` class which adds some functionality and more efficient defaults" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The Trainer handles the logging, checkpointing and more for you. " + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Using 16bit Automatic Mixed Precision (AMP)\n", + "Trainer already configured with model summary callbacks: []. Skipping setting a default `ModelSummary` callback.\n", + "GPU available: True (cuda), used: True\n", + "Trainer already configured with model summary callbacks: []. 
Skipping setting a default `ModelSummary` callback.\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n" + ] + } + ], + "source": [ + "from rl4co.utils.trainer import RL4COTrainer\n", + "\n", + "trainer = RL4COTrainer(\n", + " max_epochs=2,\n", + " accelerator=\"gpu\",\n", + " devices=1,\n", + " logger=logger,\n", + " callbacks=callbacks,\n", + ")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Fit the model" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\u001b[34m\u001b[1mwandb\u001b[0m: Currently logged in as: \u001b[33msilab-kaist\u001b[0m. Use \u001b[1m`wandb login --relogin`\u001b[0m to force relogin\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/wandb/sdk/lib/ipython.py:77: DeprecationWarning: Importing display from IPython.core.display is deprecated since IPython 7.14, please import from IPython display\n", + " from IPython.core.display import HTML, display # type: ignore\n" + ] + }, + { + "data": { + "text/html": [ + "wandb version 0.16.6 is available! 
To upgrade, please run:\n", + " $ pip install wandb --upgrade" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Tracking run with wandb version 0.16.5" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Run data is saved locally in ./wandb/run-20240428_182146-xcgdzio4" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Syncing run sdvrp-am to Weights & Biases (docs)
" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + " View project at https://wandb.ai/silab-kaist/rl4co" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + " View run at https://wandb.ai/silab-kaist/rl4co/runs/xcgdzio4/workspace" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "val_file not set. Generating dataset instead\n", + "test_file not set. Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n" + ] + }, + { + "data": { + "text/html": [ + "
┏━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━┓\n",
+       "┃     Name                                    Type                   Params ┃\n",
+       "┡━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━┩\n",
+       "│ 0  │ env                                    │ SDVRPEnv              │      0 │\n",
+       "│ 1  │ policy                                 │ AttentionModelPolicy  │  694 K │\n",
+       "│ 2  │ policy.encoder                         │ AttentionModelEncoder │  595 K │\n",
+       "│ 3  │ policy.encoder.init_embedding          │ VRPInitEmbedding      │    896 │\n",
+       "│ 4  │ policy.encoder.net                     │ GraphAttentionNetwork │  594 K │\n",
+       "│ 5  │ policy.decoder                         │ AttentionModelDecoder │ 98.8 K │\n",
+       "│ 6  │ policy.decoder.context_embedding       │ VRPContext            │ 16.5 K │\n",
+       "│ 7  │ policy.decoder.dynamic_embedding       │ SDVRPDynamicEmbedding │    384 │\n",
+       "│ 8  │ policy.decoder.pointer                 │ PointerAttention      │ 16.4 K │\n",
+       "│ 9  │ policy.decoder.project_node_embeddings │ Linear                │ 49.2 K │\n",
+       "│ 10 │ policy.decoder.project_fixed_context   │ Linear                │ 16.4 K │\n",
+       "│ 11 │ baseline                               │ WarmupBaseline        │  694 K │\n",
+       "│ 12 │ baseline.baseline                      │ RolloutBaseline       │  694 K │\n",
+       "│ 13 │ baseline.baseline.policy               │ AttentionModelPolicy  │  694 K │\n",
+       "│ 14 │ baseline.warmup_baseline               │ ExponentialBaseline   │      0 │\n",
+       "└────┴────────────────────────────────────────┴───────────────────────┴────────┘\n",
+       "
\n" + ], + "text/plain": [ + "┏━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━┓\n", + "┃\u001b[1;35m \u001b[0m\u001b[1;35m \u001b[0m\u001b[1;35m \u001b[0m┃\u001b[1;35m \u001b[0m\u001b[1;35mName \u001b[0m\u001b[1;35m \u001b[0m┃\u001b[1;35m \u001b[0m\u001b[1;35mType \u001b[0m\u001b[1;35m \u001b[0m┃\u001b[1;35m \u001b[0m\u001b[1;35mParams\u001b[0m\u001b[1;35m \u001b[0m┃\n", + "┡━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━┩\n", + "│\u001b[2m \u001b[0m\u001b[2m0 \u001b[0m\u001b[2m \u001b[0m│ env │ SDVRPEnv │ 0 │\n", + "│\u001b[2m \u001b[0m\u001b[2m1 \u001b[0m\u001b[2m \u001b[0m│ policy │ AttentionModelPolicy │ 694 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m2 \u001b[0m\u001b[2m \u001b[0m│ policy.encoder │ AttentionModelEncoder │ 595 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m3 \u001b[0m\u001b[2m \u001b[0m│ policy.encoder.init_embedding │ VRPInitEmbedding │ 896 │\n", + "│\u001b[2m \u001b[0m\u001b[2m4 \u001b[0m\u001b[2m \u001b[0m│ policy.encoder.net │ GraphAttentionNetwork │ 594 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m5 \u001b[0m\u001b[2m \u001b[0m│ policy.decoder │ AttentionModelDecoder │ 98.8 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m6 \u001b[0m\u001b[2m \u001b[0m│ policy.decoder.context_embedding │ VRPContext │ 16.5 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m7 \u001b[0m\u001b[2m \u001b[0m│ policy.decoder.dynamic_embedding │ SDVRPDynamicEmbedding │ 384 │\n", + "│\u001b[2m \u001b[0m\u001b[2m8 \u001b[0m\u001b[2m \u001b[0m│ policy.decoder.pointer │ PointerAttention │ 16.4 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m9 \u001b[0m\u001b[2m \u001b[0m│ policy.decoder.project_node_embeddings │ Linear │ 49.2 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m10\u001b[0m\u001b[2m \u001b[0m│ policy.decoder.project_fixed_context │ Linear │ 16.4 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m11\u001b[0m\u001b[2m \u001b[0m│ baseline │ WarmupBaseline │ 694 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m12\u001b[0m\u001b[2m \u001b[0m│ baseline.baseline │ 
RolloutBaseline │ 694 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m13\u001b[0m\u001b[2m \u001b[0m│ baseline.baseline.policy │ AttentionModelPolicy │ 694 K │\n", + "│\u001b[2m \u001b[0m\u001b[2m14\u001b[0m\u001b[2m \u001b[0m│ baseline.warmup_baseline │ ExponentialBaseline │ 0 │\n", + "└────┴────────────────────────────────────────┴───────────────────────┴────────┘\n" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "
Trainable params: 1.4 M                                                                                            \n",
+       "Non-trainable params: 0                                                                                            \n",
+       "Total params: 1.4 M                                                                                                \n",
+       "Total estimated model params size (MB): 5                                                                          \n",
+       "
\n" + ], + "text/plain": [ + "\u001b[1mTrainable params\u001b[0m: 1.4 M \n", + "\u001b[1mNon-trainable params\u001b[0m: 0 \n", + "\u001b[1mTotal params\u001b[0m: 1.4 M \n", + "\u001b[1mTotal estimated model params size (MB)\u001b[0m: 5 \n" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "07f138c5315e4403abbe0cfed220bfb3", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over trained model (same states as previous plot)\n", + "policy = model.policy.to(device)\n", + "out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n", + "\n", + "# Plotting\n", + "print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\n", + "for td, actions in zip(td_init, out['actions'].cpu()):\n", + " env.render(td, actions)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Test function\n", + "\n", + "By default, the dataset is generated or loaded by the environment. You may load a dataset by setting `test_file` during the env config:\n", + "\n", + "```python\n", + "env = SDVRPEnv(\n", + " ...\n", + " test_file=\"path/to/test/file\"\n", + ")\n", + "```\n", + "In this case, we test directly on the generated test dataset" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "val_file not set. Generating dataset instead\n", + "test_file not set. Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'test_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "a30f0c12c3964a608e2f6e55a8fdb18b", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Testing: | | 0/? 
[00:00┏━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━┓\n", + "┃ Test metric DataLoader 0 ┃\n", + "┡━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━┩\n", + "│ test/reward -7.363526344299316 │\n", + "└───────────────────────────┴───────────────────────────┘\n", + "\n" + ], + "text/plain": [ + "┏━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━┓\n", + "┃\u001b[1m \u001b[0m\u001b[1m Test metric \u001b[0m\u001b[1m \u001b[0m┃\u001b[1m \u001b[0m\u001b[1m DataLoader 0 \u001b[0m\u001b[1m \u001b[0m┃\n", + "┡━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━┩\n", + "│\u001b[36m \u001b[0m\u001b[36m test/reward \u001b[0m\u001b[36m \u001b[0m│\u001b[35m \u001b[0m\u001b[35m -7.363526344299316 \u001b[0m\u001b[35m \u001b[0m│\n", + "└───────────────────────────┴───────────────────────────┘\n" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/plain": [ + "[{'test/reward': -7.363526344299316}]" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "trainer.test(model)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Test generalization to new dataset\n", + "\n", + "Here we can load a new dataset (with 50 nodes) and test the trained model on it" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "# Test generalization to 50 nodes (not going to be great due to few epochs, but hey)\n", + "env = SDVRPEnv(generator_params=dict(num_loc=50))\n", + "\n", + "# Generate data (100) and set as test dataset\n", + "new_dataset = env.dataset(50)\n", + "dataloader = model._dataloader(new_dataset, batch_size=100)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Plotting generalization\n" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Tour lengths: 
['11.84', '12.49', '12.20']\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over trained policy (same states as previous plot, with 20 nodes)\n", + "init_states = next(iter(dataloader))[:3]\n", + "td_init_generalization = env.reset(init_states).to(device)\n", + "\n", + "policy = model.policy.to(device)\n", + "out = policy(td_init_generalization.clone(), env, phase=\"test\", decode_type=\"greedy\")\n", + "\n", + "# Plotting\n", + "print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\n", + "for td, actions in zip(td_init_generalization, out['actions'].cpu()):\n", + " env.render(td, actions)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Loading model\n", + "\n", + "Thanks to PyTorch Lightning, [we can easily save and load a model to and from a checkpoint](https://lightning.ai/docs/pytorch/stable/common/checkpointing_basic.html)! This is declared in the `Trainer` using the model checkpoint callback. For example, we can load the last model via the `last.ckpt` file located in the folder we specified in the `Trainer`. " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Checkpointing" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing.
It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/core/saving.py:188: Found keys that are not in the model state dict but in the checkpoint: ['baseline.baseline.policy.encoder.init_embedding.init_embed.weight', 'baseline.baseline.policy.encoder.init_embedding.init_embed.bias', 'baseline.baseline.policy.encoder.init_embedding.init_embed_depot.weight', 'baseline.baseline.policy.encoder.init_embedding.init_embed_depot.bias', 'baseline.baseline.policy.encoder.net.layers.0.0.module.Wqkv.weight', 'baseline.baseline.policy.encoder.net.layers.0.0.module.Wqkv.bias', 'baseline.baseline.policy.encoder.net.layers.0.0.module.out_proj.weight', 'baseline.baseline.policy.encoder.net.layers.0.0.module.out_proj.bias', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.0.2.module.0.weight', 'baseline.baseline.policy.encoder.net.layers.0.2.module.0.bias', 'baseline.baseline.policy.encoder.net.layers.0.2.module.2.weight', 'baseline.baseline.policy.encoder.net.layers.0.2.module.2.bias', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.1.0.module.Wqkv.weight', 'baseline.baseline.policy.encoder.net.layers.1.0.module.Wqkv.bias', 
'baseline.baseline.policy.encoder.net.layers.1.0.module.out_proj.weight', 'baseline.baseline.policy.encoder.net.layers.1.0.module.out_proj.bias', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.1.2.module.0.weight', 'baseline.baseline.policy.encoder.net.layers.1.2.module.0.bias', 'baseline.baseline.policy.encoder.net.layers.1.2.module.2.weight', 'baseline.baseline.policy.encoder.net.layers.1.2.module.2.bias', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.2.0.module.Wqkv.weight', 'baseline.baseline.policy.encoder.net.layers.2.0.module.Wqkv.bias', 'baseline.baseline.policy.encoder.net.layers.2.0.module.out_proj.weight', 'baseline.baseline.policy.encoder.net.layers.2.0.module.out_proj.bias', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.2.2.module.0.weight', 'baseline.baseline.policy.encoder.net.layers.2.2.module.0.bias', 'baseline.baseline.policy.encoder.net.layers.2.2.module.2.weight', 
'baseline.baseline.policy.encoder.net.layers.2.2.module.2.bias', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.num_batches_tracked', 'baseline.baseline.policy.decoder.context_embedding.project_context.weight', 'baseline.baseline.policy.decoder.dynamic_embedding.projection.weight', 'baseline.baseline.policy.decoder.pointer.project_out.weight', 'baseline.baseline.policy.decoder.project_node_embeddings.weight', 'baseline.baseline.policy.decoder.project_fixed_context.weight']\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. Generating dataset instead\n" + ] + } + ], + "source": [ + "# Environment, Model, and Lightning Module (reinstantiate from scratch)\n", + "model = AttentionModel(env,\n", + " baseline=\"rollout\",\n", + " train_data_size=100_000,\n", + " test_data_size=10_000,\n", + " optimizer_kwargs={'lr': 1e-4}\n", + " )\n", + "\n", + "# Note that by default, Lightning will call checkpoints from newer runs with \"-v{version}\" suffix\n", + "# unless you specify the checkpoint path explicitly\n", + "new_model_checkpoint = AttentionModel.load_from_checkpoint(\"checkpoints/last.ckpt\", strict=False)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now we can load both the model and environment from the checkpoint!" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Tour lengths: ['9.12', '7.16', '9.55']\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over trained model (same states as previous plot, with 20 nodes)\n", + "policy_new = new_model_checkpoint.policy.to(device)\n", + "env = new_model_checkpoint.env.to(device)\n", + "\n", + "out = policy_new(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n", + "\n", + "# Plotting\n", + "print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\n", + "for td, actions in zip(td_init, out['actions'].cpu()):\n", + " env.render(td, actions)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Additional resources\n", + "\n", + "[**Documentation**](https://rl4co.readthedocs.io/) | [**Getting Started**](https://github.com/ai4co/rl4co/tree/main#getting-started) | [**Usage**](https://github.com/ai4co/rl4co/tree/main#usage) | [**Contributing**](#contributing) | [**Paper**](https://arxiv.org/abs/2306.17100) | [**Citation**](#cite-us)\n", + "\n", + "Have feedback about this notebook? Feel free to contribute by either opening an issue or a pull request! ;)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "env", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.8" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/2-full-training/index.html b/examples/2-full-training/index.html new file mode 100644 index 00000000..d5cc9ba6 --- /dev/null +++ b/examples/2-full-training/index.html @@ -0,0 +1,4469 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Training: Checkpoints, Logging, and Callbacks - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/2b-train-simple.py b/examples/2b-train-simple.py new file mode 100644 index 00000000..777e2a00 --- /dev/null +++ b/examples/2b-train-simple.py @@ -0,0 +1,67 @@ +import torch + +from lightning.pytorch.callbacks import ModelCheckpoint, RichModelSummary +from lightning.pytorch.loggers import WandbLogger + +from rl4co.envs import TSPEnv +from rl4co.models.zoo import AttentionModel +from rl4co.utils.trainer import RL4COTrainer + + +def main(): + # Set device + device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + + # RL4CO env based on TorchRL + env = TSPEnv(generator_params=dict(num_loc=20)) + + # Model: default is AM with REINFORCE and greedy rollout baseline + # check out `RL4COLitModule` and `REINFORCE` for more details + model = AttentionModel( + env, + baseline="rollout", + train_data_size=100_000, # really small size for demo + val_data_size=10_000, + ) + + # Example callbacks + checkpoint_callback = ModelCheckpoint( + dirpath="checkpoints", # save to checkpoints/ + filename="epoch_{epoch:03d}", # save as epoch_XXX.ckpt + save_top_k=1, # save only the best model + save_last=True, # save the last model + monitor="val/reward", # monitor validation reward + mode="max", + ) # maximize validation reward + rich_model_summary = RichModelSummary(max_depth=3) # model summary callback + callbacks = [checkpoint_callback, rich_model_summary] + + # Logger + logger = WandbLogger(project="rl4co", name="tsp") + # logger = None # uncomment this line if you don't want logging + + # Main trainer configuration + trainer = RL4COTrainer( + max_epochs=2, + accelerator="gpu", + devices=1, + logger=logger, + callbacks=callbacks, + ) + + # Main training loop + trainer.fit(model) + + # Greedy rollouts over trained model + # note: modify this to load your own data instead! 
+ td_init = env.reset(batch_size=[16]).to(device) + policy = model.policy.to(device) + out = policy(td_init.clone(), env, phase="test", decode_type="greedy") + + # Print results + print(f"Tour lengths: {[f'{-r.item():.3f}' for r in out['reward']]}") + print(f"Avg tour length: {-torch.mean(out['reward']).item():.3f}") + + +if __name__ == "__main__": + main() diff --git a/examples/2d-meta_train.py b/examples/2d-meta_train.py new file mode 100644 index 00000000..1f3fb8d4 --- /dev/null +++ b/examples/2d-meta_train.py @@ -0,0 +1,80 @@ +from lightning.pytorch.callbacks import ModelCheckpoint, RichModelSummary +from lightning.pytorch.loggers import WandbLogger + +from rl4co.envs import CVRPEnv +from rl4co.models.zoo.am import AttentionModelPolicy +from rl4co.models.zoo.pomo import POMO +from rl4co.utils.trainer import RL4COTrainer +from rl4co.utils.meta_trainer import ReptileCallback + +def main(): + # Set device + device_id = 0 + + # RL4CO env based on TorchRL + env = CVRPEnv(generator_params={'num_loc': 50}) + + # Policy: neural network, in this case with encoder-decoder architecture + # Note that this is adapted the same as POMO did in the original paper + policy = AttentionModelPolicy(env_name=env.name, + embed_dim=128, + num_encoder_layers=6, + num_heads=8, + normalization="instance", + use_graph_context=False + ) + + # RL Model (POMO) + model = POMO(env, + policy, + batch_size=64, # meta_batch_size + train_data_size=64 * 50, # equals to (meta_batch_size) * (gradient decent steps in the inner-loop optimization of meta-learning method) + val_data_size=0, + optimizer_kwargs={"lr": 1e-4, "weight_decay": 1e-6}, + ) + + # Example callbacks + checkpoint_callback = ModelCheckpoint( + dirpath="meta_pomo/checkpoints", # save to checkpoints/ + filename="epoch_{epoch:03d}", # save as epoch_XXX.ckpt + save_top_k=1, # save only the best model + save_last=True, # save the last model + monitor="val/reward", # monitor validation reward + mode="max", # maximize validation reward + ) 
+ rich_model_summary = RichModelSummary(max_depth=3) # model summary callback + + # Meta callbacks + meta_callback = ReptileCallback( + num_tasks = 1, # the number of tasks in a mini-batch, i.e. `B` in the original paper + alpha = 0.9, # initial weight of the task model for the outer-loop optimization of reptile + alpha_decay = 1, # weight decay of the task model for the outer-loop optimization of reptile. No decay performs better. + min_size = 20, # minimum of sampled size in meta tasks (only supported in cross-size generalization) + max_size= 150, # maximum of sampled size in meta tasks (only supported in cross-size generalization) + data_type="size_distribution", # choose from ["size", "distribution", "size_distribution"] + sch_bar=0.9, # for the task scheduler of size setting, where lr_decay_epoch = sch_bar * epochs, i.e. after this epoch, learning rate will decay with a weight 0.1 + print_log=True # whether to print the sampled tasks in each meta iteration + ) + callbacks = [meta_callback, checkpoint_callback, rich_model_summary] + + # Logger + logger = WandbLogger(project="rl4co", name=f"{env.name}_pomo_reptile") + # logger = None # uncomment this line if you don't want logging + + # Adjust your trainer to the number of epochs you want to run + trainer = RL4COTrainer( + max_epochs=15000, # (the number of meta_model updates) * (the number of tasks in a mini-batch) + callbacks=callbacks, + accelerator="gpu", + devices=[device_id], + logger=logger, + limit_train_batches=50 # gradient decent steps in the inner-loop optimization of meta-learning method + ) + + # Fit + trainer.fit(model) + + +if __name__ == "__main__": + main() + diff --git a/examples/3-creating-new-env-model/3-creating-new-env-model.ipynb b/examples/3-creating-new-env-model/3-creating-new-env-model.ipynb new file mode 100644 index 00000000..ff299312 --- /dev/null +++ b/examples/3-creating-new-env-model/3-creating-new-env-model.ipynb @@ -0,0 +1,941 @@ +{ + "cells": [ + { + "attachments": {}, + 
"cell_type": "markdown", + "metadata": {}, + "source": [ + "# New Environment: Creating and Modeling\n", + "" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In this notebook, we will show how to extend RL4CO to solve new problems from zero to hero! 🚀\n", + "\n", + "\"Open\n", + "\n", + "### Contents\n", + "\n", + "1. [Environment](#environment-creation)\n", + "2. [Modeling](#modeling)\n", + "3. [Training](#training-our-model)\n", + "4. [Evaluation](#evaluation)\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Problem: TSP\n", + "\n", + "We will build an environment and model for the Traveling Salesman Problem (TSP). The TSP is a well-known combinatorial optimization problem that consists of finding the shortest route that visits each city in a given list exactly once and returns to the origin city. The TSP is NP-hard, and it is one of the most studied problems in combinatorial optimization." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Installation" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "## Uncomment the following line to install the package from PyPI\n", + "## You may need to restart the runtime in Colab after this\n", + "## Remember to choose a GPU runtime for faster training!\n", + "\n", + "# !pip install rl4co" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [], + "source": [ + "from typing import Optional\n", + "import torch\n", + "import torch.nn as nn\n", + "\n", + "from tensordict.tensordict import TensorDict\n", + "from torchrl.data import (\n", + " Bounded,\n", + " Composite,\n", + " Unbounded,\n", + " Unbounded,\n", + ")\n", + "\n", + "from rl4co.utils.decoding import rollout, random_policy\n", + "from 
rl4co.envs.common import RL4COEnvBase, Generator, get_sampler\n", + "from rl4co.models.zoo import AttentionModel, AttentionModelPolicy\n", + "from rl4co.utils.ops import gather_by_index, get_tour_length\n", + "from rl4co.utils.trainer import RL4COTrainer" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Environment Creation" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We will base environment creation on the `RL4COEnvBase` class, which is based on [TorchRL](https://github.com/pytorch/rl). More information in [documentation](https://rl4co.readthedocs.io/en/latest/_content/api/envs/base.html)!" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Reset\n", + "\n", + "The `_reset` function is used to initialize the environment to an initial state. It returns a TensorDict of the initial state." + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict:\n", + " # Initialize locations\n", + " init_locs = td[\"locs\"] if td is not None else None\n", + " if batch_size is None:\n", + " batch_size = self.batch_size if init_locs is None else init_locs.shape[:-2]\n", + " device = init_locs.device if init_locs is not None else self.device\n", + " self.to(device)\n", + " if init_locs is None:\n", + " init_locs = self.generate_data(batch_size=batch_size).to(device)[\"locs\"]\n", + " batch_size = [batch_size] if isinstance(batch_size, int) else batch_size\n", + "\n", + " # We do not enforce loading from self for flexibility\n", + " num_loc = init_locs.shape[-2]\n", + "\n", + " # Other variables\n", + " current_node = torch.zeros((batch_size), dtype=torch.int64, device=device)\n", + " available = torch.ones(\n", + " (*batch_size, num_loc), dtype=torch.bool, device=device\n", + " ) # 1 means not visited, i.e. 
action is allowed\n", + " i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device)\n", + "\n", + " return TensorDict(\n", + " {\n", + " \"locs\": init_locs,\n", + " \"first_node\": current_node,\n", + " \"current_node\": current_node,\n", + " \"i\": i,\n", + " \"action_mask\": available,\n", + " \"reward\": torch.zeros((*batch_size, 1), dtype=torch.float32),\n", + " },\n", + " batch_size=batch_size,\n", + " )" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Step\n", + "\n", + "Environment `_step`: this defines the state update of the TSP problem given a TensorDict (td in the code) of the current state and the action to take:" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "def _step(self, td: TensorDict) -> TensorDict:\n", + " current_node = td[\"action\"]\n", + " first_node = current_node if td[\"i\"].all() == 0 else td[\"first_node\"]\n", + "\n", + " # Set not visited to 0 (i.e., we visited the node)\n", + " # Note: we may also use a separate function for obtaining the mask for more flexibility\n", + " available = td[\"action_mask\"].scatter(\n", + " -1, current_node.unsqueeze(-1).expand_as(td[\"action_mask\"]), 0\n", + " )\n", + "\n", + " # We are done there are no unvisited locations\n", + " done = torch.sum(available, dim=-1) == 0\n", + "\n", + " # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here\n", + " reward = torch.zeros_like(done)\n", + "\n", + " td.update(\n", + " {\n", + " \"first_node\": first_node,\n", + " \"current_node\": current_node,\n", + " \"i\": td[\"i\"] + 1,\n", + " \"action_mask\": available,\n", + " \"reward\": reward,\n", + " \"done\": done,\n", + " },\n", + " )\n", + " return td" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### [Optional] Separate Action Mask Function\n", + "\n", + "The `get_action_mask` function simply returns a mask of the valid actions for the
current updated state. This can be used in `_step` and `_reset` for larger environments with several constraints and may be useful for modularity" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "def get_action_mask(self, td: TensorDict) -> TensorDict:\n", + " # Here: your logic \n", + " return td[\"action_mask\"]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### [Optional] Check Solution Validity\n", + "\n", + "Another optional utility, this checks whether the solution is feasible and can help identify bugs " + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "def check_solution_validity(self, td: TensorDict, actions: torch.Tensor):\n", + " \"\"\"Check that solution is valid: nodes are visited exactly once\"\"\"\n", + " assert (\n", + " torch.arange(actions.size(1), out=actions.data.new())\n", + " .view(1, -1)\n", + " .expand_as(actions)\n", + " == actions.data.sort(1)[0]\n", + " ).all(), \"Invalid tour\"" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Reward function\n", + "\n", + "The `_get_reward` function is used to evaluate the reward given the solution (actions)." + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "metadata": {}, + "outputs": [], + "source": [ + "def _get_reward(self, td, actions) -> TensorDict:\n", + " # Sanity check if enabled\n", + " if self.check_solution:\n", + " self.check_solution_validity(td, actions)\n", + "\n", + " # Gather locations in order of tour and return distance between them (i.e., -reward)\n", + " locs_ordered = gather_by_index(td[\"locs\"], actions)\n", + " return -get_tour_length(locs_ordered)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Environment Action Specs\n", + "\n", + "This defines the input and output domains of the environment - similar to Gym's `spaces`. 
\n", + "This is not strictly necessary, but it is useful to have a clear definition of the environment's action and observation spaces and if we want to sample actions using TorchRL's utils\n", + "\n", + "> Note: this is actually not necessary, but it is useful to have a clear definition of the environment's action and observation spaces and if we want to sample actions using TorchRL's utils" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [], + "source": [ + "def _make_spec(self, generator):\n", + " \"\"\"Make the observation and action specs from the parameters\"\"\"\n", + " self.observation_spec = Composite(\n", + " locs=Bounded(\n", + " low=self.generator.min_loc,\n", + " high=self.generator.max_loc,\n", + " shape=(self.generator.num_loc, 2),\n", + " dtype=torch.float32,\n", + " ),\n", + " first_node=Unbounded(\n", + " shape=(1),\n", + " dtype=torch.int64,\n", + " ),\n", + " current_node=Unbounded(\n", + " shape=(1),\n", + " dtype=torch.int64,\n", + " ),\n", + " i=Unbounded(\n", + " shape=(1),\n", + " dtype=torch.int64,\n", + " ),\n", + " action_mask=Unbounded(\n", + " shape=(self.generator.num_loc),\n", + " dtype=torch.bool,\n", + " ),\n", + " shape=(),\n", + " )\n", + " self.action_spec = Bounded(\n", + " shape=(1,),\n", + " dtype=torch.int64,\n", + " low=0,\n", + " high=self.generator.num_loc,\n", + " )\n", + " self.reward_spec = Unbounded(shape=(1,))\n", + " self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Data generator\n", + "\n", + "The generator allows to generate random instances of the problem. Note that this is a simplified example: this can include additional distributions via the `rl4co.envs.common.utils.get_sampler` method!" 
+ ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "torch.Size([32, 20, 2])\n" + ] + } + ], + "source": [ + "class TSPGenerator(Generator):\n", + " def __init__(\n", + " self,\n", + " num_loc: int = 20,\n", + " min_loc: float = 0.0,\n", + " max_loc: float = 1.0,\n", + " ):\n", + " self.num_loc = num_loc\n", + " self.min_loc = min_loc\n", + " self.max_loc = max_loc\n", + " self.loc_sampler = torch.distributions.Uniform(\n", + " low=min_loc, high=max_loc\n", + " )\n", + "\n", + " def _generate(self, batch_size) -> TensorDict:\n", + " # Sample locations\n", + " locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2))\n", + " return TensorDict({\"locs\": locs}, batch_size=batch_size)\n", + " \n", + "# Test generator\n", + "generator = TSPGenerator(num_loc=20)\n", + "locs = generator(32)\n", + "print(locs[\"locs\"].shape)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Render function\n", + "\n", + "The `render` function is optional, but can be useful for quickly visualizing the results of your algorithm!" 
+ ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [], + "source": [ + "def render(self, td, actions=None, ax=None):\n", + " import matplotlib.pyplot as plt\n", + " import numpy as np\n", + "\n", + " if ax is None:\n", + " # Create a plot of the nodes\n", + " _, ax = plt.subplots()\n", + "\n", + " td = td.detach().cpu()\n", + "\n", + " if actions is None:\n", + " actions = td.get(\"action\", None)\n", + " # if batch_size greater than 0 , we need to select the first batch element\n", + " if td.batch_size != torch.Size([]):\n", + " td = td[0]\n", + " actions = actions[0]\n", + "\n", + " locs = td[\"locs\"]\n", + "\n", + " # gather locs in order of action if available\n", + " if actions is None:\n", + " print(\"No action in TensorDict, rendering unsorted locs\")\n", + " else:\n", + " actions = actions.detach().cpu()\n", + " locs = gather_by_index(locs, actions, dim=0)\n", + "\n", + " # Cat the first node to the end to complete the tour\n", + " locs = torch.cat((locs, locs[0:1]))\n", + " x, y = locs[:, 0], locs[:, 1]\n", + "\n", + " # Plot the visited nodes\n", + " ax.scatter(x, y, color=\"tab:blue\")\n", + "\n", + " # Add arrows between visited nodes as a quiver plot\n", + " dx, dy = np.diff(x), np.diff(y)\n", + " ax.quiver(\n", + " x[:-1], y[:-1], dx, dy, scale_units=\"xy\", angles=\"xy\", scale=1, color=\"k\"\n", + " )\n", + "\n", + " # Setup limits and show\n", + " ax.set_xlim(-0.05, 1.05)\n", + " ax.set_ylim(-0.05, 1.05)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Putting everything together" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "metadata": {}, + "outputs": [], + "source": [ + "class TSPEnv(RL4COEnvBase):\n", + " \"\"\"Traveling Salesman Problem (TSP) environment\"\"\"\n", + "\n", + " name = \"tsp\"\n", + "\n", + " def __init__(\n", + " self,\n", + " generator = TSPGenerator,\n", + " generator_params = {},\n", + " **kwargs,\n", + " ):\n", + " 
super().__init__(**kwargs)\n", + " self.generator = generator(**generator_params)\n", + " self._make_spec(self.generator)\n", + " \n", + " _reset = _reset\n", + " _step = _step\n", + " _get_reward = _get_reward\n", + " check_solution_validity = check_solution_validity\n", + " get_action_mask = get_action_mask\n", + " _make_spec = _make_spec\n", + " render = render\n" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "batch_size = 2\n", + "\n", + "env = TSPEnv(generator_params=dict(num_loc=20))\n", + "reward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy)\n", + "env.render(td, actions)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Modeling\n", + "\n", + "Now we need to model the problem by transforming input information into the latent space to be processed. Here we focus on `AttentionModel`-based embeddings with an encoder-decoder structure. In RL4CO, we divide embeddings in 3 parts:\n", + "\n", + "- `init_embedding`: (encoder) embed initial states of the problem\n", + "- `context_embedding`: (decoder) embed context information of the problem for the current partial solution to modify the query \n", + "- `dynamic_embedding`: (decoder) embed dynamic information of the problem for the current partial solution to modify the query, key, and value (i.e. if other nodes also change state)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Init Embedding\n", + "\n", + "Embed initial problem into latent space. In our case, we can project the coordinates of the cities into a latent space." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 30, + "metadata": {}, + "outputs": [], + "source": [ + "class TSPInitEmbedding(nn.Module):\n", + " \"\"\"Initial embedding for the Traveling Salesman Problems (TSP).\n", + " Embed the following node features to the embedding space:\n", + " - locs: x, y coordinates of the cities\n", + " \"\"\"\n", + "\n", + " def __init__(self, embed_dim, linear_bias=True):\n", + " super(TSPInitEmbedding, self).__init__()\n", + " node_dim = 2 # x, y\n", + " self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n", + "\n", + " def forward(self, td):\n", + " out = self.init_embed(td[\"locs\"])\n", + " return out" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Context Embedding\n", + "\n", + "Context embedding takes the current context and returns a vector representation of it. In TSP, we can take the embedding of the first node visited (since we need to complete the tour) as well as the embedding of current node visited (in the first step we just have a placeholder since they are the same)." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [], + "source": [ + "class TSPContext(nn.Module):\n", + " \"\"\"Context embedding for the Traveling Salesman Problem (TSP).\n", + " Project the following to the embedding space:\n", + " - first node embedding\n", + " - current node embedding\n", + " \"\"\"\n", + "\n", + " def __init__(self, embed_dim, linear_bias=True):\n", + " super(TSPContext, self).__init__()\n", + " self.W_placeholder = nn.Parameter(\n", + " torch.Tensor(2 * embed_dim).uniform_(-1, 1)\n", + " )\n", + " self.project_context = nn.Linear(\n", + " embed_dim*2, embed_dim, bias=linear_bias\n", + " )\n", + "\n", + " def forward(self, embeddings, td):\n", + " batch_size = embeddings.size(0)\n", + " # By default, node_dim = -1 (we only have one node embedding per node)\n", + " node_dim = (\n", + " (-1,) if td[\"first_node\"].dim() == 1 else (td[\"first_node\"].size(-1), -1)\n", + " )\n", + " if td[\"i\"][(0,) * td[\"i\"].dim()].item() < 1: # get first item fast\n", + " context_embedding = self.W_placeholder[None, :].expand(\n", + " batch_size, self.W_placeholder.size(-1)\n", + " )\n", + " else:\n", + " context_embedding = gather_by_index(\n", + " embeddings,\n", + " torch.stack([td[\"first_node\"], td[\"current_node\"]], -1).view(\n", + " batch_size, -1\n", + " ),\n", + " ).view(batch_size, *node_dim)\n", + " return self.project_context(context_embedding)\n", + " " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Dynamic Embedding\n", + "\n", + "Since the states do not change except for visited nodes, we do not need to modify the keys and values. 
Therefore, we set this to 0" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [], + "source": [ + "class StaticEmbedding(nn.Module):\n", + " def __init__(self, *args, **kwargs):\n", + " super(StaticEmbedding, self).__init__()\n", + "\n", + " def forward(self, td):\n", + " return 0, 0, 0" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Training our Model" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n" + ] + } + ], + "source": [ + "# Instantiate our environment\n", + "env = TSPEnv(generator_params=dict(num_loc=20))\n", + "\n", + "# Instantiate policy with the embeddings we created above\n", + "emb_dim = 128\n", + "policy = AttentionModelPolicy(env_name=env.name, # this is actually not needed since we are initializing the embeddings!\n", + " embed_dim=emb_dim,\n", + " init_embedding=TSPInitEmbedding(emb_dim),\n", + " context_embedding=TSPContext(emb_dim),\n", + " dynamic_embedding=StaticEmbedding(emb_dim)\n", + ")\n", + "\n", + "\n", + "# Model: default is AM with REINFORCE and greedy rollout baseline\n", + "model = AttentionModel(env, \n", + " policy=policy,\n", + " baseline='rollout',\n", + " train_data_size=100_000,\n", + " val_data_size=10_000) " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Rollout untrained model " + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Problem 1 | Cost: 11.545\n", + "Problem 2 | Cost: 8.525\n", + "Problem 3 | Cost: 12.461\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over untrained model\n", + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "td_init = env.reset(batch_size=[3]).to(device)\n", + "policy = model.policy.to(device)\n", + "out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n", + "actions_untrained = out['actions'].cpu().detach()\n", + "rewards_untrained = out['reward'].cpu().detach()\n", + "\n", + "for i in range(3):\n", + " print(f\"Problem {i+1} | Cost: {-rewards_untrained[i]:.3f}\")\n", + " env.render(td_init[i], actions_untrained[i])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Training loop" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. 
Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | TSPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 710 K \n", + "2 | baseline | WarmupBaseline | 710 K \n", + "--------------------------------------------------\n", + "1.4 M Trainable params\n", + "0 Non-trainable params\n", + "1.4 M Total params\n", + "5.682 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "e355955596da4bda95ed46208d002f10", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over trained policy (same states as previous plot)\n", + "policy = model.policy.to(device)\n", + "out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n", + "actions_trained = out['actions'].cpu().detach()\n", + "\n", + "# Plotting\n", + "import matplotlib.pyplot as plt\n", + "for i, td in enumerate(td_init):\n", + " fig, axs = plt.subplots(1,2, figsize=(11,5))\n", + " env.render(td, actions_untrained[i], ax=axs[0]) \n", + " env.render(td, actions_trained[i], ax=axs[1])\n", + " axs[0].set_title(f\"Untrained | Cost = {-rewards_untrained[i].item():.3f}\")\n", + " axs[1].set_title(r\"Trained $\\pi_\\theta$\" + f\"| Cost = {-out['reward'][i].item():.3f}\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can see that solutions are way better than with the untrained model, even just after 3 epochs! 🚀" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "rl4co", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.8" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/3-creating-new-env-model/index.html b/examples/3-creating-new-env-model/index.html new file mode 100644 index 00000000..72557cee --- /dev/null +++ b/examples/3-creating-new-env-model/index.html @@ -0,0 +1,4916 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + New Environment: Creating and Modeling - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/advanced/1-hydra-config/1-hydra-config.ipynb b/examples/advanced/1-hydra-config/1-hydra-config.ipynb new file mode 100644 index 00000000..a02d31bc --- /dev/null +++ b/examples/advanced/1-hydra-config/1-hydra-config.ipynb @@ -0,0 +1,430 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Hydra Configuration\n", + "\n", + "\"Open\n", + "\n", + "[Hydra](https://hydra.cc/docs/intro/) makes it extremely convenient to configure projects with lots of parameter settings like the RL4CO library. \n", + "\n", + "While you don't need Hydra to use RL4CO, it is recommended to use it for your own projects to make it easier to manage the configuration of your experiments.\n", + "\n", + "Hydra uses config files in `.yaml` format for this. These files can be found in the [configs/](../../../configs/) folder, where the subfolders define configurations for specific parts of the framework which are then combined in the [main.yaml](../../../configs/main.yaml) configuration. In this tutorial we will have a look at how to use these different configuration files and how to add new parameters to the configuration." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "from hydra import compose, initialize\n", + "from omegaconf import OmegaConf\n", + "\n", + "ROOT_DIR = \"../../\" # relative to this file" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "# context initialization\n", + "with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n", + " cfg = compose(config_name=\"main\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Hydra stores the configurations in a dictionary like object called OmegaConf" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "omegaconf.dictconfig.DictConfig" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "type(cfg)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The different subfolders in the configs folder are represented as distinct keys in the omegaconf" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['mode',\n", + " 'tags',\n", + " 'train',\n", + " 'test',\n", + " 'compile',\n", + " 'ckpt_path',\n", + " 'seed',\n", + " 'matmul_precision',\n", + " 'model',\n", + " 'callbacks',\n", + " 'logger',\n", + " 'trainer',\n", + " 'paths',\n", + " 'extras',\n", + " 'env']" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "list(cfg.keys())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Keys can be accessed using the dot notation (e.g. 
`cfg.model`) or via normal dictionaries:" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "True\n" + ] + } + ], + "source": [ + "print(cfg.model == cfg[\"model\"])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The dot notation is however more convenient especially in nested structures" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "True\n" + ] + } + ], + "source": [ + "print(cfg.model._target_ == cfg[\"model\"][\"_target_\"])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "For example, lets look at the model configuration (which corresponds the [model/default.yaml](../../../configs/model/default.yaml) configuration). " + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "generate_default_data: true\n", + "metrics:\n", + " train:\n", + " - loss\n", + " - reward\n", + " val:\n", + " - reward\n", + " test:\n", + " - reward\n", + " log_on_step: true\n", + "_target_: rl4co.models.AttentionModel\n", + "baseline: rollout\n", + "batch_size: 512\n", + "val_batch_size: 1024\n", + "test_batch_size: 1024\n", + "train_data_size: 1280000\n", + "val_data_size: 10000\n", + "test_data_size: 10000\n", + "optimizer_kwargs:\n", + " lr: 0.0001\n", + "\n" + ] + } + ], + "source": [ + "print(OmegaConf.to_yaml(cfg.model))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "If we want to change parts of the configuration, it is generally a good practice to make the changes via the command line when executing the respective python script (in the case of RL4CO for example [rl4co/tasks/train.py](../../../rl4co/tasks/train.py)). 
For example, if we want to use a different model configuration, we can do something like:\n", + "\n", + "```bash\n", + "python train.py model=pomo model.batch_size=32\n", + "```\n", + "\n", + "Here we use the model/pomo.yaml configuration for the model and also change the batch size during training to 32. \n", + "\n", + "> Note: check out the see [override syntax documentation](https://hydra.cc/docs/1.1/advanced/override_grammar/basic/) on the Hydra website for more!" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "generate_default_data: true\n", + "metrics:\n", + " train:\n", + " - loss\n", + " - reward\n", + " val:\n", + " - reward\n", + " - max_reward\n", + " - max_aug_reward\n", + " test: ${metrics.val}\n", + " log_on_step: true\n", + "_target_: rl4co.models.POMO\n", + "num_augment: 8\n", + "batch_size: 32\n", + "val_batch_size: 1024\n", + "test_batch_size: 1024\n", + "train_data_size: 1280000\n", + "val_data_size: 10000\n", + "test_data_size: 10000\n", + "optimizer_kwargs:\n", + " lr: 0.0001\n", + "\n" + ] + } + ], + "source": [ + "with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n", + " cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"model.batch_size=32\"])\n", + " print(OmegaConf.to_yaml(cfg.model))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "It is also possible to add new parameters to a config using the `+` prefix. Using `++` will add a new parameter if it does not exist and _overwrite_ it if it does. 
" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "generate_default_data: true\n", + "metrics:\n", + " train:\n", + " - loss\n", + " - reward\n", + " val:\n", + " - reward\n", + " - max_reward\n", + " - max_aug_reward\n", + " test: ${metrics.val}\n", + " log_on_step: true\n", + "_target_: rl4co.models.POMO\n", + "num_augment: 8\n", + "batch_size: 32\n", + "val_batch_size: 1024\n", + "test_batch_size: 1024\n", + "train_data_size: 1280000\n", + "val_data_size: 10000\n", + "test_data_size: 10000\n", + "optimizer_kwargs:\n", + " lr: 0.0001\n", + "num_starts: 10\n", + "\n" + ] + } + ], + "source": [ + "with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n", + " cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"model.batch_size=32\",\"+model.num_starts=10\"])\n", + " print(OmegaConf.to_yaml(cfg.model))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Likewise, we can also remove unwanted parts of the configuration. 
For example, if we do not want to use any experiment configuration, we can remove the changes to the configuration made by [experiments/base.yaml](../../../configs/experiment/base.yaml) using the `~` prefix:" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "generate_default_data: true\n", + "metrics:\n", + " train:\n", + " - loss\n", + " - reward\n", + " val:\n", + " - reward\n", + " - max_reward\n", + " - max_aug_reward\n", + " test: ${metrics.val}\n", + " log_on_step: true\n", + "_target_: rl4co.models.POMO\n", + "num_augment: 8\n", + "\n" + ] + } + ], + "source": [ + "with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n", + " cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"~experiment\"])\n", + " print(OmegaConf.to_yaml(cfg.model))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "As you can see, parameters like \"batch_size\" were removed from the model config, as those were set by the experiment config base.yaml. Through the hashbang\n", + "```\n", + "# @package _global_\n", + "```\n", + "in the [configs/experiments/base.yaml](../../../configs/experiment/base.yaml), this configuration is able to make changes to all parts of the configuration (like model, trainer, logger). So instead of adding a new key to the omegaconf object, configurations with a ```# @package _global_``` hashbang typically alter other parts of the configuration. 
\n", + "\n", + "Another example of such a configuration is the debug/default.yaml, which sets all parameters into a lightweight debugging mode:" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "generate_default_data: true\n", + "metrics:\n", + " train:\n", + " - loss\n", + " - reward\n", + " val:\n", + " - reward\n", + " test:\n", + " - reward\n", + " log_on_step: true\n", + "_target_: rl4co.models.AttentionModel\n", + "baseline: rollout\n", + "batch_size: 8\n", + "val_batch_size: 32\n", + "test_batch_size: 32\n", + "train_data_size: 64\n", + "val_data_size: 1000\n", + "test_data_size: 1000\n", + "optimizer_kwargs:\n", + " lr: 0.0001\n", + "\n" + ] + } + ], + "source": [ + "with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n", + " cfg = compose(config_name=\"main\", overrides=[\"debug=default\"])\n", + " print(OmegaConf.to_yaml(cfg.model))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Summary\n", + "\n", + "- Reference config files using the CLI flag ```=``` (e.g. ```model=am```)\n", + "- Add parameters (or even entire keys) to the config using the \"+\" prefix (e.g. ```+model.batch_size=32```)\n", + "- Remove parameters (or even entire keys) to the config using the \"~\" prefix (e.g. 
```~logger.wandb```)\n", + "- The ```# @package _global_``` hashbang allows global access from any config file\n", + "- Turn on debugging mode using ```debug=default```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "rl4co", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.8" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/advanced/1-hydra-config/index.html b/examples/advanced/1-hydra-config/index.html new file mode 100644 index 00000000..1e13605d --- /dev/null +++ b/examples/advanced/1-hydra-config/index.html @@ -0,0 +1,3592 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Hydra Configuration - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/advanced/2-flash-attention-2/2-flash-attention-2.ipynb b/examples/advanced/2-flash-attention-2/2-flash-attention-2.ipynb new file mode 100644 index 00000000..f04ab213 --- /dev/null +++ b/examples/advanced/2-flash-attention-2/2-flash-attention-2.ipynb @@ -0,0 +1,410 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Using Flash Attention 2 ⚡" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In this notebook we will compare [Flash Attention 2](https://github.com/Dao-AILab/flash-attention) with the [`torch.nn.functional.scaled_dot_product_attention`](https://pytorch.org/docs/stable/generated/torch.nn.functional.scaled_dot_product_attention.html) function and a simple implementation." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Installation\n", + "\n", + "Follow instructions here:\n", + "https://github.com/Dao-AILab/flash-attention" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "## Uncomment the following line to install the package from PyPI\n", + "## You may need to restart the runtime in Colab after this\n", + "## Remember to choose a GPU runtime for faster training!\n", + "\n", + "# !pip install rl4co" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/.local/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. 
See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", + " from .autonotebook import tqdm as notebook_tqdm\n" + ] + } + ], + "source": [ + "import torch\n", + "import torch.utils.benchmark as benchmark\n", + "\n", + "\n", + "# Simple implementation in PyTorch\n", + "from rl4co.models.nn.attention import scaled_dot_product_attention_simple\n", + "# PyTorch official implementation of FlashAttention 1\n", + "from torch.nn.functional import scaled_dot_product_attention\n", + "# FlashAttention 2\n", + "from rl4co.models.nn.flash_attention import scaled_dot_product_attention_flash_attn\n", + "\n", + "from rl4co.envs import TSPEnv\n", + "from rl4co.models.zoo.am import AttentionModel\n", + "from rl4co.utils.trainer import RL4COTrainer\n", + "from rl4co.models.common.constructive.autoregressive import GraphAttentionEncoder\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Testing differences with simple tensors" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "True\n", + "True\n", + "tensor(0.0005, device='cuda:0', dtype=torch.float16) tensor(1.2159e-05, device='cuda:0', dtype=torch.float16)\n", + "tensor(0.0005, device='cuda:0', dtype=torch.float16) tensor(6.3777e-06, device='cuda:0', dtype=torch.float16)\n" + ] + } + ], + "source": [ + "bs, head, length, d = 64, 8, 512, 128\n", + "\n", + "query = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\")\n", + "key = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\")\n", + "value = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\")\n", + "\n", + "# Simple implementation in PyTorch\n", + "out_simple = scaled_dot_product_attention_simple(query, key, value)\n", + "\n", + "# PyTorch official implementation of FlashAttention 1\n", + "out_pytorch = scaled_dot_product_attention(query, key, value)\n", + "\n", + "# 
FlashAttention 2\n", + "out_flash_attn = scaled_dot_product_attention_flash_attn(query, key, value)\n", + "\n", + "\n", + "print(torch.allclose(out_simple, out_pytorch, atol=1e-3))\n", + "print(torch.allclose(out_flash_attn, out_pytorch, atol=1e-3))\n", + "\n", + "print(torch.max(torch.abs(out_simple - out_pytorch)), torch.mean(torch.abs(out_simple - out_pytorch)))\n", + "print(torch.max(torch.abs(out_flash_attn - out_pytorch)), torch.mean(torch.abs(out_flash_attn - out_pytorch)))\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Testing Graph Attention Encoders with Flash Attention 2" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "GraphAttentionEncoder(\n", + " (init_embedding): TSPInitEmbedding(\n", + " (init_embed): Linear(in_features=2, out_features=128, bias=True)\n", + " )\n", + " (net): GraphAttentionNetwork(\n", + " (layers): Sequential(\n", + " (0): MultiHeadAttentionLayer(\n", + " (0): SkipConnection(\n", + " (module): MultiHeadAttention(\n", + " (Wqkv): Linear(in_features=128, out_features=384, bias=True)\n", + " (out_proj): Linear(in_features=128, out_features=128, bias=True)\n", + " )\n", + " )\n", + " (1): Normalization(\n", + " (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", + " )\n", + " (2): SkipConnection(\n", + " (module): Sequential(\n", + " (0): Linear(in_features=128, out_features=512, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=512, out_features=128, bias=True)\n", + " )\n", + " )\n", + " (3): Normalization(\n", + " (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", + " )\n", + " )\n", + " (1): MultiHeadAttentionLayer(\n", + " (0): SkipConnection(\n", + " (module): MultiHeadAttention(\n", + " (Wqkv): Linear(in_features=128, out_features=384, bias=True)\n", + " (out_proj): Linear(in_features=128, out_features=128, 
bias=True)\n", + " )\n", + " )\n", + " (1): Normalization(\n", + " (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", + " )\n", + " (2): SkipConnection(\n", + " (module): Sequential(\n", + " (0): Linear(in_features=128, out_features=512, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=512, out_features=128, bias=True)\n", + " )\n", + " )\n", + " (3): Normalization(\n", + " (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", + " )\n", + " )\n", + " (2): MultiHeadAttentionLayer(\n", + " (0): SkipConnection(\n", + " (module): MultiHeadAttention(\n", + " (Wqkv): Linear(in_features=128, out_features=384, bias=True)\n", + " (out_proj): Linear(in_features=128, out_features=128, bias=True)\n", + " )\n", + " )\n", + " (1): Normalization(\n", + " (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", + " )\n", + " (2): SkipConnection(\n", + " (module): Sequential(\n", + " (0): Linear(in_features=128, out_features=512, bias=True)\n", + " (1): ReLU()\n", + " (2): Linear(in_features=512, out_features=128, bias=True)\n", + " )\n", + " )\n", + " (3): Normalization(\n", + " (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", + " )\n", + " )\n", + " )\n", + " )\n", + ")" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "env = TSPEnv(generator_params=dict(num_loc=1000))\n", + "\n", + "num_heads = 8\n", + "embed_dim = 128\n", + "num_layers = 3\n", + "enc_simple = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n", + " sdpa_fn=scaled_dot_product_attention_simple)\n", + "\n", + "enc_fa1 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n", + " sdpa_fn=scaled_dot_product_attention)\n", + "\n", + "enc_fa2 = GraphAttentionEncoder(env, 
num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n", + " sdpa_fn=scaled_dot_product_attention_flash_attn)\n", + "\n", + "# Flash Attention supports only FP16 and BFloat16\n", + "enc_simple.to(\"cuda\").half()\n", + "enc_fa1.to(\"cuda\").half()\n", + "enc_fa2.to(\"cuda\").half()" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "def build_models(num_heads=8, embed_dim=128, num_layers=3):\n", + " enc_simple = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n", + " sdpa_fn=scaled_dot_product_attention_simple)\n", + "\n", + " enc_fa1 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n", + " sdpa_fn=scaled_dot_product_attention)\n", + "\n", + " enc_fa2 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n", + " sdpa_fn=scaled_dot_product_attention_flash_attn)\n", + "\n", + " # Flash Attention supports only FP16 and BFloat16\n", + " enc_simple.to(\"cuda\").half()\n", + " enc_fa1.to(\"cuda\").half()\n", + " enc_fa2.to(\"cuda\").half()\n", + " return enc_simple, enc_fa1, enc_fa2" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Times for problem size 10: Simple 0.633, FA1 0.511, FA2 0.554\n", + "Times for problem size 20: Simple 0.646, FA1 0.535, FA2 0.565\n", + "Times for problem size 50: Simple 0.663, FA1 0.547, FA2 0.580\n", + "Times for problem size 100: Simple 0.664, FA1 0.547, FA2 0.580\n", + "Times for problem size 200: Simple 0.670, FA1 0.509, FA2 0.585\n", + "Times for problem size 500: Simple 0.669, FA1 0.512, FA2 0.582\n", + "Times for problem size 1000: Simple 1.088, FA1 0.555, FA2 0.609\n", + "Times for problem size 2000: Simple 3.626, FA1 1.292, FA2 0.790\n", + "Times for problem size 5000: Simple 20.332, FA1 5.748, FA2 2.943\n", + "Times for 
problem size 10000: Simple 80.337, FA1 20.701, FA2 10.230\n" + ] + } + ], + "source": [ + "threads = 32\n", + "sizes = [10, 20, 50, 100, 200, 500, 1000, 2000, 5000, 10000]\n", + "\n", + "times_simple = []\n", + "times_fa1 = []\n", + "times_fa2 = []\n", + "\n", + "# for embed_dim in [64, 128, 256]:\n", + "for embed_dim in [128]:\n", + " # Get models\n", + " enc_simple, enc_fa1, enc_fa2 = build_models(embed_dim=embed_dim)\n", + "\n", + " for problem_size in sizes:\n", + "\n", + " with torch.no_grad():\n", + " # initial data\n", + " env = TSPEnv(generator_params=dict(num_loc=problem_size))\n", + " td_init = env.reset(batch_size=[2])\n", + " # set dtype to float16\n", + " td_init = td_init.to(dest=\"cuda\", dtype=torch.float16)\n", + "\n", + " t_simple = benchmark.Timer(\n", + " setup='x = td_init',\n", + " stmt='encode(x)',\n", + " globals={'td_init': td_init, 'encode': enc_simple},\n", + " num_threads=threads)\n", + "\n", + " t_fa1 = benchmark.Timer(\n", + " setup='x = td_init',\n", + " stmt='encode(x)',\n", + " globals={'td_init': td_init, 'encode': enc_fa1},\n", + " num_threads=threads)\n", + " \n", + " t_fa2 = benchmark.Timer(\n", + " setup='x = td_init',\n", + " stmt='encode(x)',\n", + " globals={'td_init': td_init, 'encode': enc_fa2},\n", + " num_threads=threads)\n", + " \n", + " times_simple.append(torch.tensor(t_simple.blocked_autorange().times).mean())\n", + " times_fa2.append(torch.tensor(t_fa2.blocked_autorange().times).mean())\n", + " times_fa1.append(torch.tensor(t_fa1.blocked_autorange().times).mean())\n", + "\n", + " print(f\"Times for problem size {problem_size}: Simple {times_simple[-1]*1e3:.3f}, FA1 {times_fa1[-1]*1e3:.3f}, FA2 {times_fa2[-1]*1e3:.3f}\")\n", + "\n", + " # eliminate cache\n", + " torch.cuda.empty_cache()" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Plot results\n", + "import matplotlib.pyplot as plt\n", + "\n", + "\n", + "fig, ax = plt.subplots(1, 1, figsize=(10, 5))\n", + "ax.plot(sizes, times_simple, label=\"Simple\")\n", + "ax.plot(sizes, times_fa1, label=\"FlashAttention 1\")\n", + "ax.plot(sizes, times_fa2, label=\"FlashAttention 2\")\n", + "\n", + "# fancy grid\n", + "ax.grid(True, which=\"both\", ls=\"-\", alpha=0.5)\n", + "ax.set_xscale(\"log\")\n", + "ax.set_yscale(\"log\")\n", + "ax.set_xlabel(\"Problem size\")\n", + "ax.set_ylabel(\"Time (ms)\")\n", + "ax.legend()\n", + "\n", + "# Instead of 10^1, 10^2... show nuber\n", + "ax.xaxis.set_major_formatter(plt.FuncFormatter(lambda x, _: f\"{x:.0f}\"))\n", + "\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Using FlashAttention can speed up inference even at small context lengths (number of nodes in the graph). Difference can be of several times for large graphs between different implementations!" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "env", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.12" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/advanced/2-flash-attention-2/index.html b/examples/advanced/2-flash-attention-2/index.html new file mode 100644 index 00000000..5cdd6cca --- /dev/null +++ b/examples/advanced/2-flash-attention-2/index.html @@ -0,0 +1,3541 @@ + + + + + + + + + + + + + + + + + + + + + + + Using Flash Attention 2 ⚡ - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/advanced/3-local-search/3-local-search.ipynb b/examples/advanced/3-local-search/3-local-search.ipynb new file mode 100644 index 00000000..bdef48dc --- /dev/null +++ b/examples/advanced/3-local-search/3-local-search.ipynb @@ -0,0 +1,185 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Local Search\n", + "\n", + "In this notebook, we will show how to improve the solution at hand using local search and other techniques. Here we solve TSP and use 2-opt to improve the solution. You can check how the improvement works for other problems in each Env's `local_search` method. \n", + "\n", + "Note that this notebook is based on [`1-quickstart`](../1-quickstart.ipynb) and we use the checkpoint file from it. If you haven't checked it yet, we recommend you to check it first.\n", + "\n", + "\"Open" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Installation\n", + "\n", + "We use LocalSearch operator provided by PyVRP. See https://github.com/PyVRP/PyVRP for more details.\n", + "\n", + "Uncomment the following line to install the package from PyPI. 
Remember to choose a GPU runtime for faster training!\n", + "\n", + "> Note: You may need to restart the runtime in Colab after this\n" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "# !pip install rl4co[routing] # include pyvrp" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "import torch\n", + "\n", + "from rl4co.envs import TSPEnv\n", + "from rl4co.models.zoo import AttentionModel" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Environment, Policy, and Model from saved checkpoint" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/sanghyeok/NCO/rl4co/.venv/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/home/sanghyeok/NCO/rl4co/.venv/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + "/home/sanghyeok/NCO/rl4co/.venv/lib/python3.10/site-packages/lightning/pytorch/core/saving.py:188: Found keys that are not in the model state dict but in the checkpoint: ['baseline.baseline.model.encoder.init_embedding.init_embed.weight', 'baseline.baseline.model.encoder.init_embedding.init_embed.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.bias', 
'baseline.baseline.model.encoder.net.layers.1.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.weight', 
'baseline.baseline.model.encoder.net.layers.2.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.num_batches_tracked', 'baseline.baseline.model.decoder.context_embedding.W_placeholder', 'baseline.baseline.model.decoder.context_embedding.project_context.weight', 'baseline.baseline.model.decoder.project_node_embeddings.weight', 'baseline.baseline.model.decoder.project_fixed_context.weight', 'baseline.baseline.model.decoder.pointer.project_out.weight']\n" + ] + } + ], + "source": [ + "# RL4CO env based on TorchRL\n", + "env = TSPEnv(num_loc=50) \n", + "\n", + "checkpoint_path = \"../tsp-quickstart.ckpt\" # checkpoint from the ../1-quickstart.ipynb\n", + "\n", + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "\n", + "# Model: default is AM with REINFORCE and greedy rollout baseline\n", + "model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Testing with Solution Improvement" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Greedy rollouts over trained model (same states as previous plot)\n", + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "td_init = env.reset(batch_size=[3]).to(device)\n", + "model = model.to(device)\n", + "out = model(td_init.clone(), phase=\"test\", decode_type=\"greedy\")\n", + "actions = out['actions']\n", + "\n", + "# Improve solutions using LocalSearch\n", + "improved_actions = env.local_search(td_init, actions, rng=0)\n", + "improved_rewards = env.get_reward(td_init, improved_actions)\n", + "\n", + "# Plotting\n", + "import matplotlib.pyplot as plt\n", + "for i, td in enumerate(td_init):\n", + " fig, axs = plt.subplots(1,2, figsize=(11,5))\n", + " env.render(td, actions[i], ax=axs[0]) \n", + " env.render(td, improved_actions[i], ax=axs[1])\n", + " axs[0].set_title(f\"Before improvement | Cost = {-out['reward'][i].item():.3f}\")\n", + " axs[1].set_title(f\"After improvement | Cost = {-improved_rewards[i].item():.3f}\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can see that the solution has improved after using 2-opt." 
+ ] + } + ], + "metadata": { + "kernelspec": { + "display_name": ".venv", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.10.13" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/advanced/3-local-search/index.html b/examples/advanced/3-local-search/index.html new file mode 100644 index 00000000..ec0efff1 --- /dev/null +++ b/examples/advanced/3-local-search/index.html @@ -0,0 +1,3235 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Local Search - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+ +
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/advanced/index.html b/examples/advanced/index.html new file mode 100644 index 00000000..9268f773 --- /dev/null +++ b/examples/advanced/index.html @@ -0,0 +1,2385 @@ + + + + + + + + + + + + + + + + + + + + + + + Advanced - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + +

Advanced

+

A collection of advanced examples and tutorials, which at the moment are a bit mixed together.

+

Index

+
    +
  • 1-hydra-config.ipynb: here we show how to use Hydra to configure your training and testing scripts.
  • +
  • 2-flash-attention-2.ipynb: this notebook benchmarks different SDPA (Scaled Dot-Product Attention) implementations, including FlashAttention 2, by timing the forward pass of a graph attention encoder across problem sizes.
  • +
+ + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/datasets/1-test-on-tsplib/1-test-on-tsplib.ipynb b/examples/datasets/1-test-on-tsplib/1-test-on-tsplib.ipynb new file mode 100644 index 00000000..fa2f9a7c --- /dev/null +++ b/examples/datasets/1-test-on-tsplib/1-test-on-tsplib.ipynb @@ -0,0 +1,660 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Testing Model on TSPLib\n", + "\n", + "In this notebook, we will test the trained model's performance on the TSPLib benchmark. \n", + "\n", + "[TSPLib](http://comopt.ifi.uni-heidelberg.de/software/TSPLIB95/) is a collection of instances related to the TSP, which is a classic optimization challenge in the field of logistics and transportation. \n", + "\n", + "\"Open" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Installation\n", + "\n", + "Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!\n", + "\n", + "> Note: You may need to restart the runtime in Colab after this\n" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "# !pip install rl4co\n", + "# !pip install tsplib95\n", + "\n", + "## NOTE: to install latest version from Github (may be unstable) install from source instead:\n", + "# !pip install git+https://github.com/ai4co/rl4co.git" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2\n", + "\n", + "import torch\n", + "from tensordict import TensorDict\n", + "\n", + "from rl4co.envs import TSPEnv\n", + "from rl4co.models.zoo.am import AttentionModelPolicy\n", + "from rl4co.models.rl import REINFORCE\n", + "from rl4co.utils.trainer import RL4COTrainer\n" + ] + }, + { + "cell_type": "markdown", + "metadata": 
{}, + "source": [ + "### Utils: download and load TSPLib instances in RL4CO" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "f89749dd9db548c3878190274c9ca633", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + " 0%| | 0.00/2.02M [00:00 torch.Tensor:\n", + " x, y = coord[:, 0], coord[:, 1]\n", + " x_min, x_max = x.min(), x.max()\n", + " y_min, y_max = y.min(), y.max()\n", + " x_scaled = (x - x_min) / (x_max - x_min) \n", + " y_scaled = (y - y_min) / (y_max - y_min)\n", + " coord_scaled = torch.stack([x_scaled, y_scaled], dim=1)\n", + " return coord_scaled \n", + "\n", + "def tsplib_to_td(problem, normalize=True):\n", + " coords = torch.tensor(problem['node_coords']).float()\n", + " coords_norm = normalize_coord(coords) if normalize else coords\n", + " td = TensorDict({\n", + " 'locs': coords_norm,\n", + " })\n", + " td = td[None] # add batch dimension, in this case just 1\n", + " return td\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Test an untrained model" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n" + ] + } + ], + "source": [ + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "\n", + "# RL4CO env based on TorchRL\n", + "env = TSPEnv(generator_params={'num_loc': 50})\n", + "\n", + "# Policy: neural network, in this case with encoder-decoder architecture\n", + "policy = AttentionModelPolicy(env_name=env.name).to(device)\n", + "\n", + "# RL Model: REINFORCE and greedy rollout baseline\n", + "model = REINFORCE(env, \n", + " policy,\n", + " baseline=\"rollout\",\n", + " batch_size=512,\n", + " train_data_size=100_000,\n", + " val_data_size=10_000,\n", + " optimizer_kwargs={\"lr\": 1e-4},\n", + " ) " + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/tmp/ipykernel_76573/1596842480.py:12: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n", + " coords = torch.tensor(problem['node_coords']).float()\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Problem: ulysses16 Cost: 160.6761 BKS: 74.1087 \t Gap: 116.81%\n", + "Problem: ulysses22 Cost: 173.5413 BKS: 75.6651 \t Gap: 129.35%\n", + "Problem: att48 Cost: 86775.2031 BKS: 33523.7109\t Gap: 158.85%\n", + "Problem: eil51 Cost: 1256.7629 BKS: 429.9833 \t Gap: 192.28%\n", + "Problem: berlin52 Cost: 15761.3652 BKS: 7544.3662 \t Gap: 108.92%\n", + "Problem: st70 Cost: 2429.2407 BKS: 678.5975 \t Gap: 257.98%\n", + "Problem: pr76 Cost: 358580.5000 BKS: 108159.4375\t Gap: 231.53%\n", + "Problem: eil76 Cost: 1801.1833 BKS: 545.3876 \t Gap: 230.26%\n", + "Problem: gr96 Cost: 1714.3306 BKS: 512.3093 \t Gap: 234.63%\n", + "Problem: rd100 Cost: 30248.6816 BKS: 7910.3960 \t Gap: 282.39%\n", + "Problem: kroD100 Cost: 80604.9609 BKS: 
21294.2930\t Gap: 278.53%\n", + "Problem: kroC100 Cost: 61475.9688 BKS: 20750.7617\t Gap: 196.26%\n", + "Problem: kroA100 Cost: 86844.4609 BKS: 21285.4414\t Gap: 308.00%\n", + "Problem: eil101 Cost: 2444.7129 BKS: 642.3096 \t Gap: 280.61%\n", + "Problem: lin105 Cost: 56784.3906 BKS: 14382.9961\t Gap: 294.80%\n", + "Problem: ch130 Cost: 26669.8164 BKS: 6110.8608 \t Gap: 336.43%\n", + "Problem: ch150 Cost: 32037.0078 BKS: 6532.2812 \t Gap: 390.44%\n", + "Problem: gr202 Cost: 2277.4905 BKS: 549.9980 \t Gap: 314.09%\n", + "Problem: tsp225 Cost: 24270.3203 BKS: 3859.0000 \t Gap: 528.93%\n", + "Problem: a280 Cost: 17521.9512 BKS: 2586.7695 \t Gap: 577.37%\n", + "Problem: pcb442 Cost: 445898.6250 BKS: 50783.5469\t Gap: 778.04%\n", + "Problem: gr666 Cost: 37270.4531 BKS: 3952.5356 \t Gap: 842.95%\n", + "Problem: pr1002 Cost: 3692658.0000 BKS: 259066.6719\t Gap: 1325.37%\n", + "Problem: pr2392 Cost: 11149681.0000 BKS: 378062.8125\t Gap: 2849.16%\n" + ] + } + ], + "source": [ + "tds, actions = [], []\n", + "\n", + "policy = policy.eval()\n", + "for problem in problems:\n", + "\n", + " with torch.inference_mode():\n", + " td_reset = env.reset(tsplib_to_td(problem)).to(device)\n", + " out = policy(td_reset.clone(), env, decode_type = \"greedy\")\n", + " unnormalized_td = env.reset(tsplib_to_td(problem, normalize=False)).to(device)\n", + " cost = -env.get_reward(unnormalized_td, out[\"actions\"]).item() # unnormalized cost\n", + " \n", + " bks_sol = (torch.tensor(problem['solution'], device=device, dtype=torch.int64) - 1)[None]\n", + " bks_cost = -env.get_reward(unnormalized_td, bks_sol)\n", + " \n", + " tds.append(tsplib_to_td(problem))\n", + " actions.append(out[\"actions\"])\n", + " \n", + " gap = (cost - bks_cost.item()) / bks_cost.item()\n", + " \n", + " print(f\"Problem: {problem['name']:<15} Cost: {cost:<14.4f} BKS: {bks_cost.item():<10.4f}\\t Gap: {gap:.2%}\")" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { 
+ "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Plot some instances\n", + "env.render(tds[0], actions[0].cpu())\n", + "env.render(tds[-2], actions[-2].cpu())\n", + "env.render(tds[-1], actions[-1].cpu())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Train\n", + "\n", + "We will train for few steps just to show the effects of training a model.\n", + "Alternatively, we can load the a pretrained checkpoint, e.g. with:\n", + "\n", + "```python\n", + "model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)\n", + "```\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. 
Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | TSPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 710 K \n", + "2 | baseline | WarmupBaseline | 710 K \n", + "--------------------------------------------------\n", + "1.4 M Trainable params\n", + "0 Non-trainable params\n", + "1.4 M Total params\n", + "5.681 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "90faeba76e5a415ca3fdbc8d2dacd4b8", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Plot some instances\n", + "env.render(tds[0], actions[0].cpu())\n", + "env.render(tds[-2], actions[-2].cpu())\n", + "env.render(tds[-1], actions[-1].cpu())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Great! We can see that the performance vastly improved even with just few minutes of training.\n", + "\n", + "There are several ways to improve the model's performance further, such as:\n", + "- Training for more steps\n", + "- Using a different model architecture\n", + "- Using a different training algorithm\n", + "- Using a different hyperparameters\n", + "- Using a different `Generator` \n", + "- ... and many more!" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "rl4co", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.10" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/datasets/1-test-on-tsplib/index.html b/examples/datasets/1-test-on-tsplib/index.html new file mode 100644 index 00000000..5794ffc7 --- /dev/null +++ b/examples/datasets/1-test-on-tsplib/index.html @@ -0,0 +1,4011 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Testing Model on TSPLib - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/datasets/2-test-on-cvrplib/2-test-on-cvrplib.ipynb b/examples/datasets/2-test-on-cvrplib/2-test-on-cvrplib.ipynb new file mode 100644 index 00000000..112028e9 --- /dev/null +++ b/examples/datasets/2-test-on-cvrplib/2-test-on-cvrplib.ipynb @@ -0,0 +1,643 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Testing Model on VRPLib\n", + "\n", + "In this notebook, we will test the trained model's performance on the VRPLib benchmark.\n", + "\n", + "[VRPLib](http://vrp.galgos.inf.puc-rio.br/index.php/en/) is a collection of instances related to the CVRP, which is a classic optimization challenge in the field of logistics and transportation. \n", + "\n", + "\"Open" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Installation\n", + "\n", + "Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!\n", + "\n", + "> Note: You may need to restart the runtime in Colab after this\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# !pip install rl4co[graph] # include torch-geometric\n", + "# !pip install vrplib # for reading instance files\n", + "\n", + "## NOTE: to install latest version from Github (may be unstable) install from source instead:\n", + "# !pip install git+https://github.com/ai4co/rl4co.git" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "# Install the `vrplib` package\n", + "# !pip install vrplib" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + 
"/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/fabric/__init__.py:41: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:3144: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('sphinxcontrib')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + " declare_namespace(pkg)\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/fabric/__init__.py:41: Deprecated call to `pkg_resources.declare_namespace('lightning.fabric')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2553: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + " declare_namespace(parent)\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/__init__.py:37: Deprecated call to `pkg_resources.declare_namespace('lightning.pytorch')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. 
See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2553: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + " declare_namespace(parent)\n" + ] + } + ], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2\n", + "\n", + "import os\n", + "import torch\n", + "import vrplib\n", + "from tensordict import TensorDict\n", + "\n", + "from rl4co.envs import CVRPEnv\n", + "from rl4co.models.zoo.am import AttentionModelPolicy\n", + "from rl4co.models.rl import REINFORCE\n", + "from rl4co.utils.trainer import RL4COTrainer\n", + "\n", + "from tqdm import tqdm" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n" + ] + } + ], + "source": [ + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "\n", + "# RL4CO env based on TorchRL\n", + "env = CVRPEnv(generator_params={'num_loc': 50})\n", + "\n", + "# Policy: neural network, in this case with encoder-decoder architecture\n", + "policy = AttentionModelPolicy(env_name=env.name).to(device)\n", + "\n", + "# RL Model: REINFORCE and greedy rollout baseline\n", + "model = REINFORCE(env, \n", + " policy,\n", + " baseline=\"rollout\",\n", + " batch_size=512,\n", + " train_data_size=100_000,\n", + " val_data_size=10_000,\n", + " optimizer_kwargs={\"lr\": 1e-4},\n", + " ) " + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Download vrp problems" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/vrplib/download/list_names.py:58: DeprecationWarning: read_text is deprecated. Use files() instead. Refer to https://importlib-resources.readthedocs.io/en/latest/using.html#migrating-from-legacy for migration advice.\n", + " fi = pkg_resource.read_text(__package__, \"instance_data.csv\")\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/importlib/resources/_legacy.py:80: DeprecationWarning: open_text is deprecated. Use files() instead. 
Refer to https://importlib-resources.readthedocs.io/en/latest/using.html#migrating-from-legacy for migration advice.\n", + " with open_text(package, resource, encoding, errors) as fp:\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/vrplib/download/list_names.py:32: DeprecationWarning: The function 'list_names' is deprecated and will be removed in the next major version (vrplib v2.0.0).\n", + " warnings.warn(msg, DeprecationWarning)\n" + ] + } + ], + "source": [ + "problem_names = vrplib.list_names(low=50, high=100, vrp_type='cvrp') \n", + "\n", + "instances = [] # Collect Set A, B, E, F, M datasets\n", + "for name in problem_names:\n", + " if 'A' in name:\n", + " instances.append(name)\n", + " elif 'B' in name:\n", + " instances.append(name)\n", + " elif 'E' in name:\n", + " instances.append(name)\n", + " elif 'F' in name:\n", + " instances.append(name)\n", + " elif 'M' in name and 'CMT' not in name:\n", + " instances.append(name)\n", + "\n", + "# Modify the path you want to save \n", + "# Note: we don't have to create this folder in advance\n", + "path_to_save = './vrplib/' \n", + "\n", + "try:\n", + " os.makedirs(path_to_save)\n", + " for instance in tqdm(instances):\n", + " vrplib.download_instance(instance, path_to_save)\n", + " vrplib.download_solution(instance, path_to_save)\n", + "except: # already exist\n", + " pass " + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "# Utils function: we will normalize the coordinates of the VRP instances\n", + "def normalize_coord(coord:torch.Tensor) -> torch.Tensor:\n", + " x, y = coord[:, 0], coord[:, 1]\n", + " x_min, x_max = x.min(), x.max()\n", + " y_min, y_max = y.min(), y.max()\n", + " \n", + " x_scaled = (x - x_min) / (x_max - x_min) \n", + " y_scaled = (y - y_min) / (y_max - y_min)\n", + " coord_scaled = torch.stack([x_scaled, y_scaled], dim=1)\n", + " return coord_scaled \n", + "\n", + "def vrplib_to_td(problem, 
normalize=True):\n", + " coords = torch.tensor(problem['node_coord']).float()\n", + " coords_norm = normalize_coord(coords) if normalize else coords\n", + " demand = torch.tensor(problem['demand'][1:]).float()\n", + " capacity = problem['capacity']\n", + " n = coords.shape[0]\n", + " td = TensorDict({\n", + " 'depot': coords_norm[0,:],\n", + " 'locs': coords_norm[1:,:],\n", + " 'demand': demand / capacity, # normalized demand\n", + " 'capacity': capacity, # original capacity, not needed for inference\n", + " })\n", + " td = td[None] # add batch dimension, in this case just 1\n", + " return td" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Test untrained" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Problem: A-n53-k7 Cost: 2777 BKS: 1010 \t Gap: 174.95%\n", + "Problem: A-n54-k7 Cost: 3130 BKS: 1167 \t Gap: 168.21%\n", + "Problem: A-n55-k9 Cost: 2812 BKS: 1073 \t Gap: 162.07%\n", + "Problem: A-n60-k9 Cost: 3151 BKS: 1354 \t Gap: 132.72%\n", + "Problem: A-n61-k9 Cost: 3060 BKS: 1034 \t Gap: 195.94%\n", + "Problem: A-n62-k8 Cost: 3483 BKS: 1288 \t Gap: 170.42%\n", + "Problem: A-n63-k9 Cost: 3736 BKS: 1616 \t Gap: 131.19%\n", + "Problem: A-n63-k10 Cost: 3110 BKS: 1314 \t Gap: 136.68%\n", + "Problem: A-n64-k9 Cost: 3721 BKS: 1401 \t Gap: 165.60%\n", + "Problem: A-n65-k9 Cost: 3548 BKS: 1174 \t Gap: 202.21%\n", + "Problem: A-n69-k9 Cost: 3600 BKS: 1159 \t Gap: 210.61%\n", + "Problem: A-n80-k10 Cost: 4776 BKS: 1763 \t Gap: 170.90%\n", + "Problem: B-n51-k7 Cost: 3286 BKS: 1032 \t Gap: 218.41%\n", + "Problem: B-n52-k7 Cost: 2852 BKS: 747 \t Gap: 281.79%\n", + "Problem: B-n56-k7 Cost: 2762 BKS: 707 \t Gap: 290.66%\n", + "Problem: B-n57-k7 Cost: 3553 BKS: 1153 \t Gap: 208.15%\n", + "Problem: B-n57-k9 Cost: 3622 BKS: 1598 \t Gap: 126.66%\n", + "Problem: B-n63-k10 Cost: 3426 BKS: 1496 \t Gap: 129.01%\n", + "Problem: B-n64-k9 Cost: 2804 
BKS: 861 \t Gap: 225.67%\n", + "Problem: B-n66-k9 Cost: 3273 BKS: 1316 \t Gap: 148.71%\n", + "Problem: B-n67-k10 Cost: 2949 BKS: 1032 \t Gap: 185.76%\n", + "Problem: B-n68-k9 Cost: 3992 BKS: 1272 \t Gap: 213.84%\n", + "Problem: B-n78-k10 Cost: 4367 BKS: 1221 \t Gap: 257.66%\n", + "Problem: E-n51-k5 Cost: 1615 BKS: 521 \t Gap: 209.98%\n", + "Problem: E-n76-k7 Cost: 2396 BKS: 682 \t Gap: 251.32%\n", + "Problem: E-n76-k8 Cost: 2402 BKS: 735 \t Gap: 226.80%\n", + "Problem: E-n76-k10 Cost: 2393 BKS: 830 \t Gap: 188.31%\n", + "Problem: E-n76-k14 Cost: 2520 BKS: 1021 \t Gap: 146.82%\n", + "Problem: E-n101-k8 Cost: 3507 BKS: 815 \t Gap: 330.31%\n", + "Problem: E-n101-k14 Cost: 3550 BKS: 1067 \t Gap: 232.71%\n", + "Problem: F-n72-k4 Cost: 1274 BKS: 237 \t Gap: 437.55%\n", + "Problem: M-n101-k10 Cost: 4036 BKS: 820 \t Gap: 392.20%\n" + ] + } + ], + "source": [ + "tds, actions = [], []\n", + "for instance in instances:\n", + " # Inference\n", + " problem = vrplib.read_instance(os.path.join(path_to_save, instance+'.vrp'))\n", + " td_reset = env.reset(vrplib_to_td(problem).to(device))\n", + " with torch.inference_mode():\n", + " out = policy(td_reset.clone(), env, decode_type=\"sampling\", num_samples=128, select_best=True)\n", + " unnormalized_td = env.reset(vrplib_to_td(problem, normalize=False).to(device))\n", + " cost = -env.get_reward(unnormalized_td, out[\"actions\"]).int().item() # unnormalized cost\n", + " \n", + " # Load the optimal cost\n", + " solution = vrplib.read_solution(os.path.join(path_to_save, instance+'.sol'))\n", + " optimal_cost = solution['cost']\n", + "\n", + " tds.append(td_reset)\n", + " actions.append(out[\"actions\"])\n", + " \n", + " # Calculate the gap and print\n", + " gap = (cost - optimal_cost) / optimal_cost\n", + " print(f'Problem: {instance:<15} Cost: {cost:<8} BKS: {optimal_cost:<8}\\t Gap: {gap:.2%}')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + 
"text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Plot some instances\n", + "env.render(tds[0], actions[0].cpu())\n", + "env.render(tds[-2], actions[-2].cpu())\n", + "env.render(tds[-1], actions[-1].cpu())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Train\n", + "\n", + "We will train for few steps just to show the effects of training a model.\n", + "Alternatively, we can load the a pretrained checkpoint, e.g. with:\n", + "\n", + "```python\n", + "model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)\n", + "```\n" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Using 16bit Automatic Mixed Precision (AMP)\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/plugins/precision/amp.py:55: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. 
Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | CVRPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 694 K \n", + "2 | baseline | WarmupBaseline | 694 K \n", + "--------------------------------------------------\n", + "1.4 M Trainable params\n", + "0 Non-trainable params\n", + "1.4 M Total params\n", + "5.553 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "5cfb34e636004181b7c6a0886f05bba7", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Plot some instances\n", + "env.render(tds[0], actions[0].cpu())\n", + "env.render(tds[-2], actions[-2].cpu())\n", + "env.render(tds[-1], actions[-1].cpu())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Great! We can see that the performance vastly improved even with just few minutes of training.\n", + "\n", + "There are several ways to improve the model's performance further, such as:\n", + "- Training for more steps\n", + "- Using a different model architecture\n", + "- Using a different training algorithm\n", + "- Using a different hyperparameters\n", + "- Using a different `Generator` \n", + "- ... and many more!" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "rl4co", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.8" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/datasets/2-test-on-cvrplib/index.html b/examples/datasets/2-test-on-cvrplib/index.html new file mode 100644 index 00000000..0c4e00f9 --- /dev/null +++ b/examples/datasets/2-test-on-cvrplib/index.html @@ -0,0 +1,3958 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Testing Model on VRPLib - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/datasets/index.html b/examples/datasets/index.html new file mode 100644 index 00000000..9d82233b --- /dev/null +++ b/examples/datasets/index.html @@ -0,0 +1,2385 @@ + + + + + + + + + + + + + + + + + + + + + + + Datasets - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + +

Datasets

+

Collection of examples for training and testing with custom datasets.

+

Index

+ + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/index.html b/examples/index.html new file mode 100644 index 00000000..4990cbeb --- /dev/null +++ b/examples/index.html @@ -0,0 +1,2449 @@ + + + + + + + + + + + + + + + + + + + + + + + 🧩 Examples and Tutorials - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + +

🧩 Examples and Tutorials

+

This is a collection of examples and tutorials for using the RL4CO library.

+

The root directory is made of quickstarts and contains the following:

+

⚡️ Quickstarts

+

This is the root directory of the examples. The following quickstarts are available:

+
    +
  • 1-quickstart.ipynb: here we train a model on a simple environment - it takes less than 2 minutes!
  • +
  • 2-full-training.ipynb: similar to the previous notebooks but with a more interesting environment, with checkpointing, logging, and callbacks.

    - 2b-train-simple.py: here we show a simple script that can be called with python 2b-train-simple.py. This is simplified and does not use Hydra - for those who prefer a simpler setup. Note that we also made a Hydra tutorial here. +- 3-creating-new-env-model.ipynb: here we show how to extend RL4CO to solve new problems and create new models from zero to hero!

    +
  • +
+

📁 Folders Index

+

Modeling

+

Under the modeling/ directory, here are some additional examples for modeling and inference.

+

Datasets

+

Under the datasets/ directory, here are some additional examples for using your custom data to train/evaluate your models

+

Advanced

+

Under the advanced/ directory, here are some additional examples for advanced topics.

+

Other

+

Under the other/ directory, here are some additional examples for other topics.

+ + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/modeling/1-decoding-strategies/1-decoding-strategies.ipynb b/examples/modeling/1-decoding-strategies/1-decoding-strategies.ipynb new file mode 100644 index 00000000..b38df09a --- /dev/null +++ b/examples/modeling/1-decoding-strategies/1-decoding-strategies.ipynb @@ -0,0 +1,679 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "5f35f43a-a799-4e5b-8c6b-51e08932b61b", + "metadata": {}, + "source": [ + "# RL4CO Decoding Strategies Notebook\n", + "\n", + "This notebook demonstrates how to utilize the different decoding strategies available in [rl4co/utils/decoding.py](../../rl4co/utils/decoding.py) during the different phases of model development. We will also demonstrate how to evaluate the model for different decoding strategies on the test dataset. \n", + "\n", + "\"Open\n" + ] + }, + { + "cell_type": "markdown", + "id": "866f4981-7358-4086-9044-6df6a4ba8fea", + "metadata": {}, + "source": [ + "### Installation" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "7538da3e-67df-4c72-9acb-345a3bc9fba1", + "metadata": {}, + "outputs": [], + "source": [ + "## Uncomment the following line to install the package from PyPI\n", + "## You may need to restart the runtime in Colab after this\n", + "## Remember to choose a GPU runtime for faster training!\n", + "\n", + "# !pip install rl4co" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "4380f62f-bde8-4fc5-aa1a-072d5be58a32", + "metadata": {}, + "outputs": [], + "source": [ + "import torch\n", + "\n", + "from rl4co.envs import TSPEnv\n", + "from rl4co.models.zoo import AttentionModel, AttentionModelPolicy\n", + "from rl4co.utils.trainer import RL4COTrainer\n", + "from rl4co.utils.ops import batchify" + ] + }, + { + "cell_type": "markdown", + "id": "566e2f04-0576-4789-ac25-706ef3ebb7ca", + "metadata": {}, + "source": [ + "### Setup Policy and Environment" + ] + }, + { + "cell_type": "code", + 
"execution_count": 5, + "id": "40c9a2ac-a2cc-4a90-a810-75a092fa4890", + "metadata": {}, + "outputs": [], + "source": [ + "%%capture\n", + "# RL4CO env based on TorchRL\n", + "env = TSPEnv(generator_params=dict(num_loc=50)) \n", + "\n", + "# Policy: neural network, in this case with encoder-decoder architecture\n", + "policy = AttentionModelPolicy(env_name=env.name, \n", + " embed_dim=128,\n", + " num_encoder_layers=3,\n", + " num_heads=8,\n", + " )\n", + "\n", + "# Model: default is AM with REINFORCE and greedy rollout baseline\n", + "model = AttentionModel(env, \n", + " baseline=\"rollout\",\n", + " batch_size = 512,\n", + " val_batch_size = 64, \n", + " test_batch_size = 64, \n", + " train_data_size=100_000, # fast training for demo\n", + " val_data_size=1_000,\n", + " test_data_size=1_000,\n", + " optimizer_kwargs={\"lr\": 1e-4},\n", + " policy_kwargs={ # we can specify the decode types using the policy_kwargs\n", + " \"train_decode_type\": \"sampling\",\n", + " \"val_decode_type\": \"greedy\",\n", + " \"test_decode_type\": \"beam_search\",\n", + " }\n", + " ) " + ] + }, + { + "cell_type": "markdown", + "id": "fdfa0c33-0f09-4316-84f9-25f6e8f8dfc0", + "metadata": {}, + "source": [ + "### Setup Trainer and train model" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "38e7840f-c3b7-4f47-b694-f00db7f25896", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. 
For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | TSPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 710 K \n", + "2 | baseline | WarmupBaseline | 710 K \n", + "--------------------------------------------------\n", + "1.4 M Trainable params\n", + "0 Non-trainable params\n", + "1.4 M Total params\n", + "5.681 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "4c79576d702f4301861fafabaae2d86c", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "batch_instance = 0\n", + "for i, actions in enumerate(actions_stacked[batch_instance].cpu()):\n", + " reward = rewards_stacked[batch_instance, i]\n", + " _, ax = plt.subplots()\n", + " \n", + " env.render(td[0], actions, ax=ax)\n", + " ax.set_title(\"Reward: %s\" % reward.item())" + ] + }, + { + "cell_type": "markdown", + "id": "0d3387ca", + "metadata": {}, + "source": [ + "### Final notes" + ] + }, + { + "cell_type": "markdown", + "id": "633b4ce9", + "metadata": {}, + "source": [ + "For evaluation, we can also use additional decoding strategies used during evaluatin, such as sampling N times or greedy augmentations, available in [rl4co/tasks/eval.py](../../rl4co/tasks/eval.py)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.8" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/examples/modeling/1-decoding-strategies/index.html b/examples/modeling/1-decoding-strategies/index.html new file mode 100644 index 00000000..c55eeaec --- /dev/null +++ b/examples/modeling/1-decoding-strategies/index.html @@ -0,0 +1,4269 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + RL4CO Decoding Strategies Notebook - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/modeling/2-transductive-methods/2-transductive-methods.ipynb b/examples/modeling/2-transductive-methods/2-transductive-methods.ipynb new file mode 100644 index 00000000..9207a48b --- /dev/null +++ b/examples/modeling/2-transductive-methods/2-transductive-methods.ipynb @@ -0,0 +1,436 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Transductive Methods\n", + "\n", + "In this notebook, we will showcase how to use the Efficient Active Search (EAS) algorithm to find better solutions to existing problems!\n", + "\n", + "> Tip: in [transductive RL](https://en.wikipedia.org/wiki/Transduction_(machine_learning)) we train (or finetune) to solve only specific ones.\n", + "\n", + "\"Open" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Installation\n", + "\n", + "Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!\n", + "\n", + "> Note: You may need to restart the runtime in Colab after this\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# !pip install rl4co[graph] # include torch-geometric\n", + "\n", + "## NOTE: to install latest version from Github (may be unstable) install from source instead:\n", + "# !pip install git+https://github.com/ai4co/rl4co.git" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "2023-08-22 16:29:17.903805: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. 
To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.\n", + "2023-08-22 16:29:17.923169: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n", + "To enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n", + "2023-08-22 16:29:18.249479: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n" + ] + } + ], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2\n", + "\n", + "import torch\n", + "\n", + "from rl4co.envs import TSPEnv, CVRPEnv\n", + "from rl4co.models.zoo.am import AttentionModel\n", + "from rl4co.utils.trainer import RL4COTrainer\n", + "from rl4co.utils.decoding import get_log_likelihood\n", + "from rl4co.models.zoo import EAS, EASLay, EASEmb, ActiveSearch\n", + "\n", + "import logging" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + " rank_zero_warn(\n", + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + " rank_zero_warn(\n", + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/core/saving.py:164: UserWarning: Found keys that are not in the model state dict but in the checkpoint: ['baseline.baseline.model.encoder.init_embedding.init_embed.weight', 'baseline.baseline.model.encoder.init_embedding.init_embed.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.bias', 
'baseline.baseline.model.encoder.net.layers.1.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.weight', 
'baseline.baseline.model.encoder.net.layers.2.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.num_batches_tracked', 'baseline.baseline.model.decoder.context_embedding.W_placeholder', 'baseline.baseline.model.decoder.context_embedding.project_context.weight', 'baseline.baseline.model.decoder.project_node_embeddings.weight', 'baseline.baseline.model.decoder.project_fixed_context.weight', 'baseline.baseline.model.decoder.logit_attention.project_out.weight']\n", + " rank_zero_warn(\n" + ] + } + ], + "source": [ + "# Load from checkpoint; alternatively, simply instantiate a new model\n", + "checkpoint_path = \"last.ckpt\" # model trained for one epoch only just for showing the examples\n", + "\n", + "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + "\n", + "# load checkpoint\n", + "# checkpoint = torch.load(checkpoint_path)\n", + "\n", + "model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)\n", + "policy = model.policy.to(device)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "# env = CVRPEnv(generator_params=dict(num_loc=50))\n", + "# policy = AttentionModel(env).policy.to(device)\n", + "\n", + "env = TSPEnv(generator_params=dict(num_loc=50))\n", + "\n", + "td = env.reset(batch_size=3).to(device)\n", + "\n", + "out = policy(td)" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAiMAAAGdCAYAAADAAnMpAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAC8FElEQVR4nOzddVxT6x8H8M82ukPpUOwEA/uaqNit2N3dfZWr1+7Cvt6rYlwbA6xrYyIWJiJI9+jY9vz+4MfksNFjZxvP+/XaS89znrN9B4ed757zBIcQQkBRFEVRFMUSLtsBUBRFURRVsdFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVqmxHUBxiEQihIeHQ19fHxwOh+1wKIqiKIoqBkIIkpOTYWVlBS634PYPpUhGwsPDYWtry3YYFEVRFEWVws+fP2FjY1PgfqVIRvT19QHkvBkDAwOWo6EoiqIoqjiSkpJga2srvo4XRCmSkdxbMwYGBjQZoSiKoiglU1QXC9qBlaIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVtFkhKIoiqIoVpU4GXnw4AF69eoFKysrcDgcXLp0qchj7t27h8aNG0NTUxPVq1fHsWPHShEqRVEURVGqqMTJSGpqKhwdHbF3795i1Q8KCkKPHj3QoUMH+Pv7Y86cOZgwYQJ8fHxKHCxFURRFUaqnxGvTdOvWDd26dSt2/f3796Nq1arYunUrAKBOnTp49OgRtm/fjq5du5b05SmKoiiKUjHl3mfE19cXLi4ujLKuXbvC19e3wGMyMzORlJTEeFAURVEUpZrKPRmJjIyEubk5o8zc3BxJSUlIT0+Xesz69ethaGgoftja2pZ3mBRFURRFsUQhR9MsXboUfD5f/Pj58yfbIVEURVEUVU5K3GekpCwsLBAVFcUoi4qKgoGBAbS1taUeo6mpCU1NzfIOjaIoiqIoBVDuLSMtW7bEnTt3GGW3bt1Cy5Yty/ulKYqiKIpSAiVORlJSUuDv7w9/f38AOUN3/f39ERISAiDnFsuoUaPE9adMmYLv379j0aJF+PTpE/bt24ezZ89i7ty5snkHFEVRFEUptRInIy9fvkSjRo3QqFEjAMC8efPQqFEj/P777wCAiIgIcWICAFWrVsW1a9dw69YtODo6YuvWrTh8+DAd1ktRFEVRFACAQwghbAdRlKSkJBgaGoLP58PAwIDtcCiKoiiKKobiXr/LvQMrRVEUVTChiOB5UDyikzNgpq+FZlVNwONy2A6LouSKJiMURVEs8X4fAXevAETwM8RlloZaWNWrLlzrW7IYGUXJl0LOM0JRFKXqvN9HYOoJP0YiAgCR/AxMPeEH7/cRLEVGUfJHW0YoiqLkTCgicPcKQN4Oe/wnZ5D25Ql4+qZQ06+MSf4W+HN4e9jb28HW1hbW1tbQ0NBgLWaKKk80GaEoipKz50HxEi0iWbEhyIoKBKICAQDJAEb5HBHv53A4MDc3h62trdSHjY0NLC0toaZGP9Yp5UPPWoqiKDmLTv6ViIgyU8H3PQsBP6qQIwBCCCIjIxEZGYkXL15IrcPj8WBpaVlgwmJrawszMzNwufQOPaVYaDJCURQlZ2b6WiCEIO3jAyTcPQydWq3B1dQFR1MXJDO11M8rFAoRGhqK0NDQAldGV1dXh42Njbg1RVrCYmpqCg6Hjuih5IcmIxRFUXJmLIgD/8Iq8L/5ARwuDJr1g5phzurmosw0CJNjYSDkY25LU4SFheLnz5+MR1paWqlfOzs7G0FBQQgKCiqwjra2doGJSm4SY2hoSBMWSmZoMkJRFCUnGRkZWL9+PTZs2ICsrCwAgG6dtuJEBAB4mjrgadph+4jGUof3EkKQkJDASE5CQ0MltjMzM0sdZ3p6Or5+/YqvX78
WWEdPT6/Q20G2trbQ1dUtdQxUxUJnYKUoipKDmzdvYvr06fj27RujvMHMg0jSsRJvy2KeEUIIYmJiJFpU8j7CwsIgFApL/RrFYWxszGhNkdbCoqWlVa4xUOwq7vWbJiMURVHlKDw8HHPnzsXZs2cl9nXv3h1XvK6yMgOrUChEVFRUoQlLREQEyvsSUbly5UJvB1lbW0NdXb1cY6DKD01GKIqiWCQQCLB3716sXLkSycnJUus8ePAAv/32m5wjK77s7GyEh4cXeksoOjq6XGPgcDiwsLAo9HaQhYUFeDxeucZBlQ5NRiiKoljy/PlzTJkyBa9fvy6wTsuWLfH48WOl7wSakZGBsLCwQltYEhISyjUGNTU1WFlZFXpLqHLlynIZ0uzu7o6ePXuiSZMm5f5ayoAulFeO6MJWFEVJk5CQgGXLluHAgQNF3t5YsmSJ0iciAKClpYVq1aqhWrVqBdZJTU2VaFHJ/yio9ag4BAIBQkJCEBISUmAdDQ2NAkcI5ZabmJiU+XciEAjQtGlTtGrVCjNnzsSAAQPobaZioC0jJUQXtqIoKj9CCE6ePIn58+cX67ZF3bp18e7dOzr5WB58Pl8iQcmfwKSnp5drDDo6OoUOaba1tS3yGvTlyxfUqlVLvG1lZYUpU6Zg0qRJMDc3L+RI1URv05SD3IWt8v/AcvNojwKG4lEUpdqysrJw8+ZN3Lx5E7du3cKnT58KrX/s2DGMHj1aTtGpBkII4uPjC21dCQ0NRXZ2drnGYWBgILVVJe+jU6dOePr0KeM4DQ0NDBkyBDNnzoSzs3OBz69qLe80GZExoYigzca7jBYRUVY6sqJ/QMumDjgALAy18GhxR6U+cSiKKrtp06bBw8ND6j4bGxsEBgbSRe/KgUgkKnJIc3h4eLkPaebxeIW+RosWLTBz5kwMHDiQcR6oYss7TUZkzDcwDkMPMTPdpOcXkfDfEWja1odhy8HQqtIIpye1RMtqpqzESFEU+w4ePIjJkycXuH/79u2YM2eO/AKiGIRCISIiIgq9JRQZGVnuQ5oBwMLCAlOmTMHkyZPhH0tUsuWdJiMydtk/DLNP+4u3iSAboftGQZT+q9OVhkV1zF2wCOvmjqf3gimqArpy5Qr69esHkUgkLjM2NhaPJjExMUFwcDD09PTYCpEqhqysLIkhzfkfsbGxMns9dXV1GNZrC7UG3aFpVUtivzK3vNPRNDJmps+cJTDlw3+MRAQAsiK/YeOCSbh8eBuWLl2KoUOH0l7UFFVB+Pr6ws3NjZGItGzZEkeOHEG9evVACMGMGTNoIqIENDQ0UKVKFVSpUqXAOunp6VKHNAcFBeHmzZsler3s7GzE+t8B/O9Aw6oWDJsPhCgjBcJ0PgybDwQBEMHPwPOgeJVteactI8WU22ckkp8BAkCUnYn4W/uR+u5WgcfY29tj4cKFGDduHLS1teUXLEVRcvX582e0bt0acXFx4rJatWrh8ePHMDU1haurKx48eICQkBBUqlSJxUip8rZx40YsWbKkWHX19fXRsGFDGFhXxzO+HjQqV0HigxPICHkDAOCoa8F29ilweDlfane6OaGPk3W5xV4einv9pvcSionH5WBVr7oAcprMuOqaMGwxULyfq2MkcUxwcDBmzJiBKlWqYOPGjUhKSpJTtBRFyUtERARcXV0ZiYiFhQW8vb1haprzLXbSpEmYMGECTURU3JcvX7Bq1SqJcg6Hgxo1amDgwIH4448/cOnSJQQFBYHP5+PRo0dYuW4r9J26QdO6DtSMfg3/JdkZyAz7NTIrfwu9KqEtIyWUt7czISL83DEEJCtn7Pv48ePh7++PV69eST3WyMgIM2bMwOzZs+mHEkWpgKSkJLRr1w7+/v7iMn19fTx48ABOTk7isuzsbERHR8PaWrm+1VLFJxKJ0L59e7x9+xaOjo5o2LAhGjZsCEdHR9SrV6/QFYzztrynfHyI2CsbxfsMWg6GSdtRKt9nhCYjpZB3HPjqSYPg/8J
XvM/DwwMODg5Yt24d7t+/L/V4HR0dTJo0CfPnz4eNjY28wqYoSoaysrLQo0cP3L59W1ymrq6OGzduoFOnTixGRrEhLS0NsbGxsLW1LdUsrrnzWAnTk/Bz13Dg/+NqNCxqwGr0dpUfTUNv05QCj8tBy2qm6ONkjfatmzP2TZ06FT9//sS9e/fw+PFj9OzZU+L4tLQ07NixAw4ODpg4cSK+fv0qr9ApipIBkUiE8ePHMxIRAPjrr79oIlJB6ejowM7OrtTTybvWt4THiMawtjCDhkV1cXlW1Dds7FlFKRORkqDJSBk1btxYomzixIn4+++/0apVK3h5ecHf3x9ubm4Sw32zs7Nx+PBh1K5dG25ubnjz5o28wqYoqgyWLVuGEydOMMo2bdqE4cOHsxQRpQpc61vi0eKOcOuX50ssIUD4B/aCkhOajJSRtGSEEIKxY8fi5MmTAABHR0ecOnUKnz59woQJEySG+4pEIpw5cwZOTk7o2bMnnjx5IpfYKYoqud27d2Pjxo2MstmzZ2PBggUsRUSpEh6Xg7GDezPKSjpUWBnRPiNlJBQKoa+vL3UBJy6XC09PTwwZMoRRHhoaiq1bt+LgwYNIS0uT+rzt2rXDsmXL0LlzZ5VY2ZOiVMG5c+cwePBgxuycgwYNwunTp+lEh5TMZGZmwtTUFKmpqQAAOzs7/PjxQymvBbTPiJzweDxGr/m8RCIRhg8fjnPnzjHKbWxssH37dvz48QMrVqyAoaGhxLH3799H165d4ezsjAsXLjAmUqIoSv4ePHiAESNGMBKRdu3a4Z9//qGJCCVTmpqaaN++vXg7JCQEX758YS8gOaB/QTIg7VZNLqFQiKFDh+Ly5csS+ypXrow1a9YgJCQEGzZskLq89KtXrzBgwADUq1cPf//9d7mvSElRlKQPHz6gT58+yMzMFJfVq1cPly5dgpaW6s79QLGnc+fOjG1Vv1VDkxEZKCwZAQCBQIBBgwbh6tWrUvcbGBhg8eLFCAoKwt69e2Fvby9R59OnTxgzZgyqV6+OvXv3Sr0tRFGU7IWGhsLV1RWJiYniMhsbG3h7e8PIyIi1uCjV1qVLF8b2rVsFz/atCmgyIgNFJSNAzsiZAQMGwNvbu8A62tramDZtGr5+/Yq///4btWvXlqgTEhJCZ3WlKDlJTExEt27dEBoaKi4zMjKCt7c3nSOIKle1a9dmnGP//fcfsrKyAOR8wT116hRboZULmozIQN26daGhoSF1n7W1NT5+/IigoCB8//4dzZo1K/L51NXVMWrUKHz48AHnz59HkyZNJOpER0djyZIlsLOzw8qVKxETE1Pm90FR1C+ZmZno27cv3r9/Ly7T0NDA5cuXUa9ePRYjoyoCDofDuFWTkpKCp0+fIi0tDQMGDJAYWq7saDIiAxoaGmjQoIHUfWFhYXjx4gWqVKkCa2trmJiYFPt5uVwu+vfvjxcvXsDHxwft2rWTqMPn87F27VrY29tjzpw5jG9wFEWVjkgkwqhRoxizKHM4HJw8eRJt27ZlMTKqIsl/q+b06dNwcXHBlStXCvwCrKxoMiIjubdq7OzscPToUca+VatWiZvXSoPD4aBLly6Fzuqanp6OnTt3wsHBARMmTKCzulJUKRFCMG/ePJw9e5ZRvnPnTgwcOLCAoyiq7HLPvZkzZ+Lvv/+GhYUFY7+Hhwd8fXOWH9HU1GQjxPJDlACfzycACJ/PZzuUAnl4eBAul0sePnxIRCIRadasGUHO4gIEANmzZ49MX8/f35+4ubkRLpfLeJ3cB5fLJUOGDCH+/v4yfV2KUnVbtmyR+HtatGgR22FRFcTr168Jj8eT+rme9zFy5Ei2Qy2W4l6/acuIjDRu3BgrV65EmzZtwOFwsG7dOsb+NWvWiCewkQU6qytFyZ6np6fETKrDhw/H+vXrWYqIqmicnJwwZ86cIuupWssITUZkxMnJCStWrBBvd+rUibFgVlRUFHbt2iXz161RowYOHTqE79+/Y86cOdD
W1paoc+3aNbRu3Rrt27eHj48PY9ImiqJy3LlzB2PGjGGUubi44OjRo3RSM0quVq9eDTs7u0Lr0D4jlFQaGhpQU1NjlOVvHdm0aRMSEhLK5fVzZ3UNDg4udFZXV1dXNG3aFOfPn6ezulLU/7158wb9+vVjTCro5OSE8+fPq9yHPqX49PT0sGfPnkLr0JYRqtiaNWuGvn37ircTExOxefPmcn3N4szq6ufnh4EDB9JZXSkKwI8fP9CtWzckJyeLy6pUqYIbN24o3FpYVMXRq1cv9O/fv8D9NBmhSmTt2rWMxY127tyJyMjIcn/d8pjVlSYtlKqJi4uDq6srIiIixGUmJibw9vaWGMlAUfK2c+dO6OnpSd2nai12NBkpZ/Xq1cPIkSPF22lpaVi7dq3cXl+Ws7qeO3cO+/fvL++QKUou0tPT0bt3b3z+/Flcpq2tjatXr6JWrVosRkZROWxsbPDnn39K3UdbRqgSc3d3Z4x2OXjwIIKCgsr0nEIRgW9gHC77h8E3MA5CUeGdUmUxqyuXy8XUqVPh7u5OO8GWs5L+fqmSEQqFGDZsGGOUGZfLxenTp9GyZUsWI6MopunTp0v9vKYtI1SJValSBZMnTxZvZ2dnY9WqVaV6LqFQiNP336HNxrsYeugpZp/2x9BDT9Fm4114v48o8vjSzOr68+dPABAnVKtXr8bUqVMhFApL9R6ownm/jyj175cqGiEEM2fOxKVLlxjl+/btQ+/evdkJiqIKwOPxcODAAYkRXbRlhCqV5cuXQ0dHR7x94sQJxpoXxTVxwe+Ysf4gIvgZjPJIfgamnvAr9gUr76yujx49Qo8ePSTq5M7qWq1aNUyYMAE/fvwQ7ztw4AAGDx6MjIwMieOo0vN+H4GpJ/zK/PulCrZu3Tp4eHgwylauXMn4wkBRiqRJkyaYOXMmo4y2jFClYmFhgdmzZ4u3CSGMeUmK4+UrPxzbvQmZEV8k9uU24rt7BZS4Sb9169a4evUqXr9+jSFDhkhk4NnZ2Thy5Ajmz5/PKL9w4YLE0upU6QlFBO5eAcj720u4ewSJD08gyd8baYEvsfjQVcTGxdPbZKV07Ngxib+7cePGwd3dnaWIKKp41qxZA2tra/G2qrWMcIgSfKolJSXB0NAQfD5fqYfaJSQkwMHBgXHxfvr0KZo3b17ksenp6ajbwAk/Ar9A3awq9Oq7QJSeBKO2IyXqnprYAi2rmZY6zq9fv2LTpk3FHvbbsGFD3LhxA1ZWVqV+TQrwDYzD0ENPxduEiBCypR8gkrwdpqOjAxsbm0IflSpVYozkquhu3LiBXr16MW4vdu/eHZcuXZKYwZiiFNHFixfFw33nrtuNQYOHollVE/C4ivt3Xtzrt1qBeyiZMzY2xuLFi7F06VJx2bJly3Dnzp0ij128eDF+BOa0iGRHByHh7iEAAFfHEAZNmfe5o5PLduskd1bXVatWYevWrThw4EChw37fvn2L1q1bw8fHBzVr1izTa1dk+X9v6YEvpSYiQM6orC9fvuDLF8lWslyampqwtrYuNGExNzevELOLvnjxAoMGDWIkIs7Ozjh79ixNRCiloVW9OYzrtETCR18cfx6OC/ynsDTUwqpedeFa35Lt8MqEtozIWVpaGqpVq8aYa+TWrVtwcXEp8BgfHx+4urpK3cfR0IHtLE9weL/yyrK2jOTn5eWFPn36FHlroFKlSrh+/TqcnZ1l9toVSd6WEWF6EiJPLIIgPrRcX1NNTa3IhMXCwkJiduHysnXrVjRr1ky8xpMsBAYGomXLlozRYdWrV8fjx49hZmYmk9egqPLm/T4CU/55gcyoQER6LkGlXgugW7MVcv9KPEY0VsiEhLaMKCgdHR2sXLkS06dPF5ctW7YMnTp1kvrhGxsbK7FehoT/H8cBYGGohWZVTWQSKyEE+/btw9y5c4vVRyE2NhYdOnTA+fPn0bVrVwA5/SCeB8UjOjkDZvpaCt+kyKaE1EwAOT/3eJ99EGVlwGryYQi
TYyFMjoMgORZamYloacFBWFgoQkNDERERUab+IwKBAMHBwQgODi6wDpfLhaWlZaEJi5WVlUw61Ono6KBt27ZwdHTEjBkzMGzYMEbH75KKjo5G165dGYmImZkZvL29aSJCKYysrCxERkYiIiIC4eHhiIiIkHi8/xaM7JREgOQs4yHKTAOQ01+Qg5z+gp3rWijt5yttGWFBVlYWateuzZhr5Pz58xJT/xJCMHDgQFy4cKHQ51M3c4BJx/HQsmuI/SObyCQ7FggEmDx5Mo4ePVriY9XU1HDs2DGYOnaEu1cAY2SIqjQpyppQRNBm411E8DOQ8v4u4q5th5qRBawnH2LU2zesMbo3/PWzy87ORmRkJEJDQxmPnz9/iv8fHh4ul2HY5ubmsLGxga2trdSExdraGlpaWoU+R3x8PCwtLZGVlQUg59bm+PHjMXXqVDg4OJQonpSUFHTs2BEvXrwQl+nq6uLevXto2rRpyd8gRZVQamqq1MQi/yMuLq7Ez12p3zLo1mzFKJN1q7gsFPf6TZMRlhw/fhyjRo0Sb9epUwfv3r0Dj8cTlx07dgxjx44t8rl4hmaoOXAhts4ehm4NZNeJVCAQICgoCJ8/f8anT58Y/+afEE0a444TYODcl1Gm6E2KbMl7i4YIspH45DQ4PHUYtXZj1CvNh41QKERUVJREwpL/IY/p/itVqlRkx9sxY8bg3LlzjOM4HA569uyJGTNmwMXFpcB+LrktceHxydi6cCJ8798W7+PxeLh69WqBtzwpqjgIIeDz+YxkoqDWjLzrHclapT5LoFu7DaNsp5sT+jhZF3AEO2gyouCEQiEcHR3x4cMHcdnyjbvh3KUfzPS1UIkkonEjJ6SkpEg93sGhGr5/DwQA6OjqIjIyCvp6unKJHcj5BistSfn27RsEAoG4nkHzATBqN4ZxCyr3dtKjxR2VtklR1i77h2H2aX/xtjCNj+izv8O400Ro2dYXl5fXh41IJEJsbGyhycrPnz/lMq+Mmpoa4xzKr1atWpg+fTpGjx7N+Dzwfh8Bd68AhCemI+7GLqS+u8U47q+//ir6lidVYeX+DRSnJUPe8yvp6RsgQ90APD0T8PSMoaZrAp267aBpUZ1Rj7aMlDNVTEYA4PLly4xVfXkGlWE98SDA5SLh7DIkB39g1NfS0sLgwYMxceJEvH//HlOnThXvO3PmDAYPHiyv0AuUnZ2NC/f9MHP/NWTHhSIz/DPUK1eBbt124GpoQ03vV38WRfzDYUv+Yb0AEHfTAymvr0GvYRcYdRgHnpYeqz8zQggSEhIYt4CkJSypqalyiUdPTw+jR4/G9OnTESw0wtQTfiAAEh+eAP/JaUbd0bOW4NjO9XKJi1IsAoEAUVFRRbZiREVFFZoEl4dKlSrB0tJS6sPKygqWlpawsLCAppY22my8i0h+BqRdsBX5Cx7twKoEevfujdoNm+DT21cAAGFSDJLfeINkpjESEUdHR0ycOBHDhw+HkZERgJypq/Py9PRUiGREXV0dWpVsoFO9OVC9OcIOTkT6lydIeuwJNUNzWE85Iq5b1iHIqqRZVRNYGmoxPmwMnPsg5fV1pLy9ibRvz+HQaxqcq3RjLUYOhwMTExOYmJjA0dFRah1CCJKSkoq8JSSLifJSUlKwd+9e7N27F4bVG0OjYXfwDM3Bf3KGUU+/UXd8Mu8EoYgo3Ac1VXoZGRnFasWIiYmR6ySBPB4P5ubmBSYZuQ9zc/MSdfpe1asupp7wAwdgJCScPPuV+fymyQiLRATgOA8F/p+MAAD/0UmIMtPA0dCGbp22qNK6F17umgo13q975IQQ3Lt3j/Fc169fR0JCAoyNjeUVfoHM9H91UiSCX/0QOGoaBdYrCVUcocPjciQ+bNSNraBTsyXSvjyBKC0R386sQ8/EV/Dw8EDVqlXZDlkqDocDQ0NDGBoaol69egXWS0lJQVhYmESrys+fP+Hj41PiDrf8b37ANz+oGVnCoPkAJL28DAizoV2jBYx
dJiMyKRPPg+JpS5wSSE5OLlZ/DHnP/KyhoVFkK4alpSUqVarE6PsnK671LeExorHEoAALFRkUQJMRFj0PikdapdrQqtIIGT9eAwA46lowajEY+k6u4GrqIBnAix8JjA/Rr1+/IiKCuUZJdnY2zp07h4kTJ8rzLUjF+JYvyBKX5yYjZRmCnNsvQBVH6Ej7sDFo1h9pX36tLOvj44N69erB3d0dc+fOldv8H7Kmp6eHWrVqoVatWozyf//9F9evXy/WcxgYGMDR0REG1tXhm6gPDbOqUK9kB666JrSrNUXSs/Oo1GshONycC0NFaYkTiUQKN5EdIQTx8fHFasmQ122+XHp6ekW2YlhaWsLY2Jj1GY1d61uic10LlfsyBpQyGdm7dy82b96MyMhIODo6Yvfu3WjWrFmB9Xfs2AEPDw+EhISgUqVKGDhwINavX1/kMD9Vl/vhaNR2JBKJCIa/jYCWdZ0C6+XK3yqSy9PTk/Vk5ODBg9DT08PKHu0w3dMfRJinZYSnLm5SHF2bi7dv/NGoUaNiP3fuInL5G1xzF5FThRE6kh82LbAg6CKePH4srpOeno5Fixbh5MmTOHTokMpMMhcfH48ZM2ZI3efg4ABHR0c4OTnB0dERjo6OsLe3B4fDkdrfRsu2PqPjL1D6ljhlIBAI4OXlhf3798PDw6PEw6BLSygUIiYmpsiWjMjISPFwbXkxNjaWvDViYYFUnj54usaoUdUOXZ3rwNBAX65xlRWPy1HJFr4SJyNnzpzBvHnzsH//fjRv3hw7duxA165d8fnzZ6mTCHl6emLJkiU4evQoWrVqhS9fvmDMmJzRFdu2bZPJm1BWuR+OmpY1Ye72Z5H1ct2/f19qvfv37yM0NBQ2NjayC7KEHBwc0LlzZzRq1AgTpyzCijwtI1DTgE78F+h9vo5pm+7g+/fvxX5eaYvI5VKVSX9y5f+wWbhgAfrlSUZyvXnzBs2bN8fMmTOxdu1a6Osr14dqfvPnz0dycjKaN28uTjgcHR3RoEGDQju+Setvk5esJwNUJGFhYTh8+DAOHTqEsLAwtGvXTiaJSN5JuAp7REVFQSQSyeCdFA+Hw4GZmVmRrRgWFhYSX3a930dgxWlfxAr+v8Dctxhsf56sEq2qqqDEo2maN28OZ2dn7NmzB0BOk6CtrS1mzpyJJUuWSNSfMWMGPn78yFh/Zf78+Xj27BkePXpUrNdU1dE0uRNdlaSHNCEENjY2CA8Pl/qcW7ZskVhdV57S09NhbGyMzMxMiX1cLlf8weXs7Iznz58X+3mlffslIiGEaXyVH6EjFApRp04dfP36tcA6NjY22Lt3L3r37l1gHUUmFAoRGBiIatWqlep+e26rGSC9c58it5qVtA+USCTCnTt34OHhgStXrjD61/z999+M+YvyS0tLk0gopLVklGYSrrJQU1ODhYVFkX0yzMzMSnVr8tKLQIyZvRzZiRGo3HuRuFwZzg9lVy6jabKysvDq1SvGQm9cLhcuLi7w9fWVekyrVq1w4sQJPH/+HM2aNcP3799x/fp1jBwpudpsrszMTMbFLCkpqSRhKg1pnRZzFdRD+tu3bwUmIkBOSxSbyYi2tjbatGkjdfG/vN+gSjryJ++tqvQf/kj99BAZ319BzcgCFsM2SK2nKng8HubNm8cYyp1faGgo+vTpg/79+2PXrl2MpcaVAY/HK9Mii8raua8kfaDi4uJw7NgxHDhwQGpiqqamBhMTE5w8ebLAlgx5f5Zqa2sXqz+Gqalpqfu5FJbMEUJw8eIlDB0/FVmJUTBqNxqirHRwNbRz9kO1WlWVWYmSkdjYWAiFQpibmzPKzc3N8enTJ6nHDBs2DLGxsWjTpg0IIRAIBJgyZQqWLVtW4OusX78e7u7uJQlNaZX0Q7Sg/iK5/Pz88OnTJ9SuXbs8wi0WFxeXIlciHjhwYImeMys+Anzfs0gJuA9BQhggzJkPQJgci+y4UKib5tyaUtV+AaNGjcLKlSsRGxtbaL0
LFy7g1q1b2LlzZ7Fm71Ulyta5rzh9oLrWs8CzZ8/g4eGBM2fOSG1xzCUQCNCrV6/yDfr/DAwMCk0uclsyDAwMyrXTZ2HJXHWtVMyaNQs3btwQ70t8eBKC5FiYdv6V2BMAEfwMOtqKZeXeFf/evXtYt24d9u3bh+bNm+Pbt2+YPXs21qxZg5UrV0o9ZunSpZg3b554OykpCba2tuUdKmtK8iFaUH+RvDw9PfHHH3+UR6jF0rlzZ0brWX7NmjVDlSpVinyesLAwnD17FqdPnxbf0uGoa8GgcS8kvbgorpfyxgcmHcerbL8AIGcBuenTpxeapLdu3RqdOnVCx44d0aJFCzlGpziUpXNf3j5QhBCI0pPA0zEEkHNxJFnpmLZyEwx/3IO/v7/c4ipsEq68j7IsXigrBSVz4bGJcJs0F6kvL0KQna/TrEiA9MAXQGfJVkZVbFVVJiVKRnLHT0dFRTHKo6KiYGFhIfWYlStXYuTIkZgwYQIAoEGDBkhNTcWkSZOwfPlyqU1zmpqa0NTULEloSq84H6LS5heRxtPTE+7u7qwNQ3NycoKJiQni4+Ol7h80aFCBx8bExOD8+fM4ffo0Hjx4IDFZkanrTGjbOyLplRcgymkdSXl/B8ZtR2FVr8YK+y1YFqZNm4aNGzcWOBX1wIEDMWfOHPkGRZXK86B4RPAzIEiORfzNfciOD4fV2F3ITohAiv91pLz/DyQrTSavxeVyizUJl4WFhUxWXpYHaR3aCSFI+/IYCXePQpgUXeCxpq6zpJaraquqsihRMqKhoYEmTZrgzp074mnMcztTFTQkLy0tTSLhyO2gpgQz0SuUwMBAhIWFwdTUFKtXr8aaNWsQHZ3zR1evXj0cOHAA27dvx8WLF/HixYtCh1uXJx6Ph44dO0osdpYrfzLC5/Nx6dIlnDp1Crdv3y5wwqsZM2agx+S5cPcKQFzNlkj79BAAIEpPgpt5hML2C5AVMzMzjB49GgcOHJC6f968ebCzs5NY/ZlSPFFJ6Uh5exPxd4+AZObMqxF/9wh4WnoQJEaBo65RqmRkwIAB6NatGyPJqFy5crlMwsWm3GQuV2ZUIOJveSA7JhhqprbgampDmJYEbmYKBALmApDxN/fCYuRW8LRzOlOq8mgrpUJK6PTp00RTU5McO3aMBAQEkEmTJhEjIyMSGRlJCCFk5MiRZMmSJeL6q1atIvr6+uTUqVPk+/fv5ObNm6RatWpk8ODBxX5NPp9PABA+n1/ScFXKP//8QxYsWEASEhIIIYRUr16d4P+tuvb29uJ6379/J76+vuwE+X/79+8Xx5b30bx5c0IIIampqeTMmTOkb9++RENDQ2rd/MdlZmYSQggRCEVk1z8XGPs7dOjA5tuVm8+fPxMOh0MAEHV1ddKmTRvGz0FLS4v13z1VuKCgIOLcur3kec7hEstxe4j94qvEfvFVYj3tb7L54Eni7u5O+vTpQ2xsbIr8O6lbt67470SVXXodKv456TfuyfgZ6DfpTdSMrSR+NsadJhLbmSeJ9ZQjxGb2aWK/+Cqp8v/HjXfhbL8llVXc63eJkxFCCNm9ezexs7MjGhoapFmzZuTp06fife3atSOjR48Wb2dnZ5PVq1eTatWqES0tLWJra0umTZsmvqAWB01GcmRnZzO2GzVqJP5DMzU1ZSkq6QIDA6V+WM6fP58MHTqU6OrqFvnBmve9BQcHM55fKBSSatWqMep9/vyZpXcrX3379iUAiJubG0lMTCT169dn/BwqVapEvn37xnaYVD5CoZDs2bNH6rnPUdMkxh0nELuFl8UXyRbrbhOBUMR4jqioKOLt7U3WrVtHBgwYQKpWrSrxXGvXrmXpHcrPk2+x4mTEtOf8Ij9DWrVqRa69CSUt1t0WH2f//58xTUTKV7kmI/JGkxHpfvvtN/Efm6amJtvhSJD2Qfn9+3fi6ekpkUgU9OBwOMTb21vq82/YsIFRd8GCBXJ+h+x49OgRAUDu379PCCEkJCSEWFk
xvwnWqFGDxMTEsBwplevLly+Mv9e8D03b+sRq0kHxBbKk39bj4+PJnTt3yKZNm4ibmxtp2LChyiejAqGItFh3m1iN20N06nUq9DNEXV2dfPjwQXzck2+x5NLrUPLkW6xEskfJHk1GKoBu3box/uiysrLYDolh4sSJUm/REEJIVlYW2bRpU5HJyKpVqwp8/sjISKKmpsZoEcjIyJDDO2OXSCQiEyZMICLRrw/S169fEz09PcbPrnXr1iQ9PZ3FSCmBQEC2bNlCtLS0JM5tPT09Mn3FetJ87U2Zf1vPe26oGpFIRG7evEmaSLvVJeXx+++/sx1yhUaTkQpg0KBBjD+6ktz6koczZ84w4tu6dat43+PHj0mVKlUK/RDp0qULEQgEhb7GwIEDGcecPn26vN+WQpCWeN64cYPweDzGz2PQoEFEKBSyECH1/v170qxZswLP7R8/fhBC6Lf14hKJROTEiROkYcOGxUpCAJDatWtXiC8oiowmIxXA2LFjGX94P3/+ZDskhpiYGHFnSwAkODiYZGdnE3d3d4mLZv6Hra1tsW4z3Lx5k3Fcx44d5fDOFNfBgwclfpYV5faVosjKyiJr166V2jHbyMiIHD16VKVbLsrTz58/ycqVK4m5uXmxkpEHDx6wHXKFR5ORCmDmzJmMP7yPHz+yHRKDQCgiterlfIup59SUfA/6ITH6AwDhcrmMWwzq6uqMTtGFEQqFEn1Tvnz5Us7vTLEtXbpU4me8d+9etsOqEPz8/IiTk5PUC2Pv3r1JWFgY2yGqhMzMTInbwPkf+vr6RbasUuWvuNfv0i0GQCkEPT09xnZKSgpLkUjyfh+BNhvvIkKvBgDgh8AANerUl1gc0d7eHg8ePED37t3FZdu2bUPz5s2L9TpcLhcTJ05klB0+fLiM0Su3tWvXYtiwYYyymTNnwsvLi6WIVF9mZiZWrFgBZ2dniRlTTU1NcerUKVy6dAlWVlbsBKhijhw5giNHjhRaJzk5GdeuXZNTRFRZ0WREiSlqMpI7TXMEPwMaVnUAAKnv70KYwYxvyJAh8Pf3R+vWrVG3bl0AgJubG6ZPn16i1xs7dixjJc+//voLWVlZhRyh2rhcLo4ePYp27dqJy0QiEdzc3PDy5UsWI1NNz549Q+PGjfHnn39KTNg3ZMgQBAQEwM3NjbUZkVWJSCTCwoULMW3aNMbCmwXZuXOnHKKiZIEmI0osfzKSnJzMUiS/5J+mOSvis0QdroYWjh79C6dOnYKRkREAoE6dOqhduzYOHTpU4g9tCwsL9O7dW7wdExODy5cvl/YtqARNTU1cvHiRsWBiWloaevbsiR8/frAXmApJS0vDggUL0KpVKwQEBDD2WVhY4MKFCzh9+jTMzMxYilC1pKenY/DgwdiyZQujvGbNmnB2dhZv51035+7du3j37p3cYqRKjyYjSkxfX5+xrQgtI/mnaTZsNQRqhr9WedawqAGL0TtRu20vRtLRqFEjnD9/XiLBKq5JkyYxtg8ePFiq51ElxsbGuH79OuNiGBUVhe7duyMhIYHFyJTfgwcP4OjoiK1bt0p8Qx89ejQ+fPiAfv36sRSd6omOjkbHjh1x/vx5Rvlvv/2GJ0+eYPDgwQByPhPzLrIKALt27ZJbnFTp0WREiSnibZr8K19y1bVQuf9ycNQ0YNB8ICxGbIK6ibVEvRo1aohv1ZRG586dYW9vL96+ffs2AgMDS/18qqJq1aq4evUq49vix48f0a9fv0KXo6ekS05OxowZM9CuXTt8+/aNsc/GxgbXr1/HsWPHYGJC1zmRlU+fPqFFixZ4+vQpo3zYsGG4desWTE1N0aFDBwDA+vXrMX/+fOjq6orrnThxArGxsXKNmSo5mowoMUVMRqStfKlh5gCrSYdg3H4MODz1AuuVBe3IWjBnZ2ecOnWKsWDl/fv3MW7cOLpYZQncunULDRo0wN69eyX2TZ48GR8+fEC3bt1YiEx13b9/H61atUJQUBCjfMWKFThx4oR
4dXcnJyd0794dU6dOhZGREUaPHi2um5GRQVtKlQBNRpSYIiYjzaqawNJQC/l7fajpmwLIWSHTspxWyBw7dixjddKjR49W6I6sefXu3VuiudrT0xMrVqxgKSLlkZiYiPHjx6NLly4IDg5m7HNwcMDdu3exf/9+GBgYsBShajpx4gQ6d+7MuKWopqaGI0eOYM2aNYzbvDweD2fOnBEn3LNmzWI81759+5CdzVy9l1IsNBlRYoqYjPC4HKzqlXO7JX9Ckru9qldd8LiyH1lgZWWFXr16ibejo6PpcNY8pk+fjvnz5zPK1q1bhwMHDsI3MA6X/cPgGxgHoYi2luTy8vJCvXr1cPToUUY5h8PBnDlz8PbtW/EtAko2CCFYs2YNRo4cyUggDAwMcOPGDYwbN07qcXk/D2vVqsVopQoLC5Pob0IpFpqMKDFFTEYAwLW+JTxGNIaFIfNWjIWhFjxGNIZrfctye23akbVwmzZtwsCBAxllU6ZNRd+lezH7tD+GHnqKNhvvwvt9BEsRKobY2FgMHz4cvXv3Rnh4OGNfrVq18OjRI2zfvp3RN4Equ6ysLIwbNw6///47o9zOzg6PHz+Gi4tLsZ9r9uzZjG06zFexcYgS3DROSkqCoaEh+Hw+bQrNIyIigjGJ0qhRo/D333+zGBGTUETwPCge0ckZMNPPuTVTHi0ijNcUCuHg4ICQkBBx2ffv31G1atVyfV1lkp6ejk6dOsHX11dcxtHQhsWwjdAwdxC3YJV34qiICCE4d+4cpk+fjpiYGMY+Ho+HhQsXYtWqVdDSkm2fJyrndtiAAQNw9+5dRnmTJk3g5eUFS8uSnYuEENStWxefPn0Slz19+rTYEypSslHc6zdtGVFiitoykovH5aBlNVP0cbJGy2qm5Z6IADkXjAkTJjDKaEdWJm1tbVy8dBlaptbiMpKVjlivLSBEJJ4jxt0roELdsomMjMTAgQMxePBgiUSkQYMGePr0KdavX08TERkRioj49uCF+6/RunVriUSkV69euH//fokTESDnVlr+viO0dURx0ZYRJSYSiRgdNrt06QIfHx8WI1IMYWFhsLOzE8//YGFhgZCQEKir54zkyT2PlH1GzMePH8Pf3x88Hg88Hg9qamri/xdV9jEyBb+ffoR4nz0gmWng6ZvCbPAaaFSyY7zGqYkt0LKaKUvvUD4IITh+/DjmzJkjMf+Kuro6li9fjqVLl0JDQ4OlCFWP9/sIuHsFIIKfgcyIL4g+/wdEqYmMOrNmzcK2bdsYn3EllZqaChsbGyQm5jy3mpoafvz4AWtr68IPpGSmuNdvtQL3UAqPy+VCV1cXqampABRjBlZFYG1tjZ49e+LKlSsAcr7xXr16VTy3Rt++fXHp0iUYGhqyHGnZ1KtXD1OnTi3zDJM8PROYu62Huonkuin554NRNT9//sTkyZNx48YNiX1NmzbF0aNH0aBBAxYiU125y0UQAGlfnyL2ymYQwa85bzgcDrZv3y7R56M0dHV1MXHiRGzevBkAIBAI4OHhgbVr15b5uSnZordplFzeWzWKdpuGTdI6sopEIowePRr37t1DdHQ0S5HJjpGREXx8fErdH0bd1A4WIzbDetrfUhMRQPbzwSgKQggOHjyIevXqSSQimpqa2LhxI3x9fWkiImN5l4vIigpEzIU/mYmImiZqDF+NGTNnFfwkJTR9+nTGHDsHDhxARoZqJ9nKiCYjSo4mI9K5urrCxsZGvO3j44PRo0fjzJkzAHKmRVcF5ubmWLduXYmOUVdXx6rVq9Fo9n5oWdeReruqPOeDYdv379/h4uKCyZMnS7QmtmrVCm/evMGiRYsYiy9SspF3uQh1MwfoNf61WjdX1wjmw9Yj07oJngfFy+w17e3tGVPzx8bGwtPTU2bPT8kGTUaUHE1GfuHz+QgMDERSUhK4XC6jIyshBCdOnBBvK3PLSFxcHE6dOoVRo0bBwsICQ4cOLfaxrVq1gr+/P1avWgX3fk4A5D8fDFt
EIhF27dqFBg0aSHSU1NHRwc6dO/HgwQPUqlWLpQhVX+5tP0II0r8+hXrlqtCu5gx1UztYjtwKTcuajHqykv+Wz44dO+jswwqGpv5KjiYjv2hqasLNzQ0vX76EpqZmoXNAKFPLiEgkwuvXr3H9+nXcuHEDz549K9by6Xnp6elhw4YNmDp1qrjJOnc+mNyOhLksDLWwqlddlRrW+/nzZ4wfPx6PHz+W2NehQwccPnwYDg4OLERWsZjpayE7MRIJtw8gI+QtrKcchV7ddoBICK6WHqOeLLVp0waNGjXC69evAQDv3r3DvXv36IR1CoQmI0oubzKSnp4OoVBYpt7nykxLSwsXLlxAkyZNEBMTU+hCcIreMpKQkICbN2/i+vXr8Pb2LlO8PXr0gIeHB2xtbSX2uda3ROe6FnKfD0ZeBAIBtm3bht9//13ifNDX18eWLVswceJEpR9ZpQwyMjLgc2IPIo6sAxFkQb9pH/B0mJ3IOchJhmV9e5DD4WD27NkYM2aMuGznzp00GVEgNBlRcvnnGklNTa3Qw59tbW1x9uxZuLi4QCgUFlhP0VpGRCIR/P39cePGDVy/fh1Pnz4tVuuHgYEBunTpAldXV0ybNo2xFk/lypWxa9cuDBkypNCLbe58MKrm3bt3GDduHF6+fCmxr1u3bjhw4IDUBI2SPW9vb8yYMePXStpcNRg692PUKe/bg25ubli0aJE4sb9y5Qq+f/9OW8QUBO0zouT09fUZ2xX9Vg0AtG/fXjyUryCKkIwkJCTg7NmzGDt2LKysrNCkSROsWLECT548KTQRadiwIZYsWYL79+8jNjYW//77L9q3b89IREaPHo2PHz/Czc2twn3rz8rKgru7O5o0aSKRiBgbG+Off/7BtWvXaCIiByEhIRgwYAC6dev2KxEB0LXvINjY2jDqlvdyEZqampg6dap4mxCCPXv2lMtrUaVAlACfzycACJ/PZzsUhTNjxgwCQPz4/Pkz2yEpBJFIRIYNG8b42eR9tGnThpWYXr9+Tf7880/Spk0bwuPxCowv70NfX5/079+fHD58mISGhkp97nPnzhEApEqVKuTmzZtyfmeK4+XLl6Rhw4ZSf479+vUjERERbIdYIWRmZpL169cTHR0did8Dl8slX758IQKhiDz5FksuvQ4lT77FEoFQVO5xRUREEHV1dXEsBgYGJCkpqdxftyIr7vWb3qZRcoo+JTxbOBwODh06hPfv3+Pt27cS++XVMpKYmIjbt2+L+35ERBRvAboGDRqge/fu6NatG1q1aiWePbYg7969w7x58/DHH39UyMXbMjIy4O7ujs2bN0vcnqtcuTL27t2LgQMHVrhWIjbcvXsX06dPZ6wJk9fAgQNRo0YNAJD77UELCwu4ubnh+PHjAHJmBz127Bhmzpwp1zgoKeSUHJUJbRkp2Nq1axnfOu7du8d2SAolMDCQGBsbS3w7MzQ0LJfXE4lExN/fn6xbt4789ttvJWr96NevHzl06BD5+fNniV83ISFB9m9GSTx+/JjUqlVL6s912LBhJCYmhu0QK4Tw8HAydOjQIs/1169fsxrny5cvGfHUqFGDCIVCVmNSZbRlpIKgLSOFc3BwgKenJ7p3786YV4DP5yMjI0Mmi57x+Xzcvn0bN27cwI0bNySWnC9I/fr10a1bN3Tv3h2tWrUq09onRkZGpT5W0QUEBCAlJQXNmjVjlKempmLFihXYuXOnxJwRlpaW2L9/P3r37i3PUCskgUCAPXv24Pfffy9ySYru3bvDyclJPoEVoEmTJmjTpg0ePXoEAPj69Stu3LiBHj16sBpXhSeX1KiMaMtIwQ4fPszI8k+fPs12SApp3bp1Et/QQkJCSvVcIpGIvHnzhmzYsIG0a9eOqKmpFav1Q09Pj/Tt25ccOHCg1K9d0URHR5OqVauSo0ePMsrv3r1LHBwcpP6cx40bV6FbiuTp0aNHBfbRkfZ4+PAh2yETQgj5999/GXF17tyZ7ZBUFm0ZqSB
oy0jxLFmyBC9fvsSFCxfEZVFRUcUeUZGUlMRo/QgLCyvWcfXq1RO3frRu3Zqu/FoCmZmZ6NevH4KCghASEgIg5/ewePFi7N+/X6K+nZ0dDh06hC5dusg71Aqrdu3aWLZsGXx8fODj41Noq+Bvv/2GNm3ayDG6gvXt2xd2dnbi8+rWrVv48OED6tWrx3JkFRdNRpQcTUaKh8Ph4NixY/j48SM+fvwIALj/5hvC1CylTvRFCMGHDx/Es54+evQIAoGgyNfR1dWFi4sLunXrhm7dusHOzq7c3pMqI4Rg0qRJ4hlTQ0JC4O3tjUmTJuHnz58S9adNm4YNGzZIDHWnypepqSmGDBmCIUOG4NGjR+jQoUOBfyfLli2Tc3QFU1NTw/Tp07F48WJx2a5du3DgwAEWo6rYOIQo/gT9SUlJMDQ0BJ/Pr9ATeklz//59tG/fXry9du1aLF++nL2AFNznz5/RuKkz0lKSYdptNvQadgaQsyjcwo524Eb8SkBCQ0OL9Zx169YVJx9t2rSBpqZmeb6FCmHDhg1YunSpeFtXVxepqakS9apXr47Dhw+jXbt28gyPyufDhw9o06YNEhMTpe5v1KgRXr16pVCjmeLj42FjY4P09HQAgLa2NkJDQ2FionqLQ7KpuNdv2jKi5OikZyUTlG0AvS5zkHZhDQSpiciKCUb695eI+v4KA1YEAKKiWz90dHQYrR/29vZyiLziuHjxIiMRASCRiHC5XMydOxd//PEHdHR05BkelU9ISAi6du3KSEQsLCwQHR0tnrxv6dKlCpWIAICJiQlGjx4tvuWXnp6OQ4cOMVpLKDmSQ/+VMqMdWAv2+fNnRkesGTNmsB2SwhIIRaTFutvEfvFVYtjKjagZWxW7413t2rXJvHnzyK1bt0hGRgbbb0Vl+fn5SZ0oK++jTp06xNfXl+1QKUJIXFwcqVOnjsSw+bdv35IePXoQAKRmzZpEIBCwHapUAQEBjNhtbW1JdnY222GplOJev+l08EqO9hkpvudB8eLVaQ3bDIOGRfUC6+ro6KBnz57Yt28fgoKC8PHjR2zduhUuLi70Nkw5CQ8PR69evZCWllZgHW1tbRw4cAAtWrSQY2SUNGlpaejZs6e4DxaQM+X6lStX0KBBA0yYMAEAsHjxYoVdvLNOnTqMDs8/f/7ExYsXWYyo4qLJiJKjyUjxRSdniP/P4XBh2HIwY7+aiQ30m/bBag9PxMXFwcvLC1OnTkWVKlXkHGnFk5aWht69exc5Sik9PR1t27bF2LFjERkZKafoqPwEAgGGDBkCX19fcRmXy8Xp06fRtm1bADmrRTs7O2PEiBFshVkss2fPZmzv2LGDnUAqONpnRMnln/q7qEmHKjIzfeYEZ+qV7KFbvyM0LWtBy6EJ1I0sAABdOreQyWRoVPGIRCKMHj0ar169KvYxZ86cQXZ2Njw8POgIGjkj/x/pdPXqVUa5h4cH+vbtK95WV1fHlStXFH44u6urK2rWrIkvX74AAJ48eYKXL1+iadOmLEdWsdCWESXH4/Ggra0t3qYtIwVrVtUEloZa4qXKORwOKvWYB/3GPaBuZAEOckbVNKtKe9OXF6GIwDcwDpf9w+AbGAehiGDVqlU4d+5ckcfa2tpi6tSpuHbtGuLi4nDixAmaiLBg+fLl+Ouvvxhlq1evxqRJkyTqWlhYyCusUuNyuRJr0+zcuZOlaCouOrRXBZiZmSEmJgYA4OjoCH9/f3YDUmDe7yMw9YQfgJwea7lyE5TyXMK8ovN+HwF3rwBxvx0AUA96jG9n10utz+Fw0Lx5c/Ts2RM9e/ZEw4YNFW5ERkWza9cuidsaU6ZMwb59+5T6d5OSkgIbGxvw+XwAOa06wcHBsLSknwVlVdzrN20ZUQF5+43QlpHCuda3hMeIxrAwZN6GsTDUoolIOcpNAvMmIhmhH/Ht/GZGPX19fQwcOBDHjh1DZGQkfH19sXz5cjg6Oir1xU4VnDlzBnPmzGGU9e/fH3v27FH
6342enh7Gjx8v3s7OzpY6yy9VfmjLiApwdHTE27dvAQDm5ua0Y18xCEUEz4PiEZ2cIXUGVkp2hCKCNhvvMhIRAT8KEf/MgyiNDzUjC1Sq2wrHVk1Bh/btFL6PQUV0+/ZtdO/eHdnZ2eKytm3bwsfHR2X6VwUFBaF69eriuVHMzMwQHBysMu+PLXTSswqEtoyUHI/LQctqpmyHUSHkDqkW8KPAf/ov9Bv3Qor/DRg0GwCd6s5QM7EBh8OBQbXGNBFRQH5+fujXrx8jEWnQoAEuX76sUhfqqlWronfv3rh06RIAIDo6GqdPn8aYMWNYjauioLdpVEDeZCQ1NVWc2VOUIsgdUs1/dgEp/t6I+GsmhOlJ0K3TBuqmtuIm/rxDrynFEBgYiG7dujG+5Njb28Pb2xtGRkbsBVZO8veH2blzJ5Tg5oFKoMmICsg/10hhk0ZRlLyZ6WtBmJqA1He3cgqICGlffAGumkQ9SnFERUWha9euiI6OFpeZmprCx8cHVlZWLEZWftq1awdHR0fxtr+/Px4+fMhiRBUHTUZUAJ34jFJkzaqaQPTuGoggS1ym16AT1PRyhlDTIdWKJzk5Gd27d0dgYKC4TEdHB9evX0etWrVYjKx8cTgcqa0jVPmjyYgKoMkIpciSk/hIeJlngiwOFwbNB+b89/9Fq3rVpR2IFURmZib69esHPz8/cZmamhrOnz+PZs2asRiZfAwdOhSVK1cWb1+6dAk/fvxgL6AKgiYjKiB/MkJnYaUUyb59+5Ce+itB1qnzm3i2WzqkWrHkzoZ7584dRvnRo0fh6urKUlTypaWlhcmTJ4u3RSIR9uzZw2JEFQNNRlQAbRmhFFVaWprEWh8HNq/BTjcnnJrYAo8Wd6SJiIIghGDu3Lk4c+YMo3zz5s0YOXIkS1GxY+rUqVBT+9Wn6fDhw/RztZzRZEQF5E9GXnwNh1BEe4BT7Dt69Kh4dmAA6NmzJ0Z0/w19nKzRspopvTWjQDZu3Ihdu3YxyubNm4cFCxawFBF7rKysMGTIEPE2n8/HP//8w2JEqo8mIyogOEnI2F5/xR9tNt6F9/sIliKiqJxZLDdvZs6wunTpUpaioQrz119/Sfxuhg8fLvH7q0jyd2TdtWsXnTahHNFkRMl5v4/AyVfRjDKSlY5IfgamnvCjCQnFmlOnTiEkJES83bZtW7Rq1YrFiChprl69iokTJzLKunTpgqNHj4LLrbiXCGdnZ7Rs2VK8/fnzZ9y8eZPFiFRbxT3TVIBQRODuFQCOhjajXJSdIV4Ezt0rgN6yoeROJBJhw4YNjLJly5axFA1VEF9fXwwePBhC4a/WVWdnZ5w/f57OhgvJ1pH8/Z8o2aHJiBLLnWabq8GcLIpkpef8CyCCn4HnQfEsREdVZJcvX8bHjx/F240aNUKXLl1YjIjK7+PHj+jZsyfS09PFZTVq1MC1a9ck+qFVVP3794e1tbV428fHB58+fWIxItVFkxElljt9toZFDZj2mAfTXgtgM8sTBs36S61HUfJACMH69esZZUuXLlX6lV1VSWhoKLp27Yr4+F9fVCwsLODj48OYY6OiU1dXx/Tp0xll+Tv5UrJBkxElZqavBUFSLOJ89iDhv6PQqd4CPG0DcHh0mm2KPXfv3sWLFy/E2zVr1kT//v0LOYKSp4SEBLi6uuLnz5/iMgMDA3h7e6Nq1aosRqaYJk2axFgQ8O+//0ZCQgKLEakmmowoqYyMDNw+5YGIw1OQFnAfBs36SdyuodNsU2zI3yqyaNEi8Hg8lqKh8kpPT0fv3r3x4cMHcZmGhgYuX77MWJOF+sXU1JQxz0paWhqOHDnCYkSqqVTJyN69e1GlShVoaWmhefPmeP78eaH1ExMTMX36dFhaWkJTUxM1a9bE9evXSxVwRUcIwcWLF1G3bl38vnIlRNkZ4GobwKBRD0Y9Os02xYbnz58zZu+0sbGpcBNmKSqBQAA3Nzc8evRIXMbhcHDy5Em0b9+evcCUwKxZsxj
be/bsgUAgEG+fPHlS3iGpnBInI2fOnMG8efOwatUq+Pn5wdHRUWJlx7yysrLQuXNn/PjxA+fOncPnz59x6NAhRqcgqng+fPiAzp07o3///ggKChKXj548A1aVjRh16TTbFBvyt4rMnz+fjspQAIQQTJ06FVeuXGGU79mzBwMHDmQpKuVRv359dOrUSbwdHByMy5cvA8hJRKZMmQJC6KjFMiEl1KxZMzJ9+nTxtlAoJFZWVmT9+vVS63t4eBAHBweSlZVV0pcS4/P5BADh8/mlfg5lFh8fT2bOnEl4PB5BziAZ8cPU1JQkJycTgVBEnnyLJZdeh5In32KJQChiO2yqgvnw4YPEuZmSksJ2WBQhZOXKlRKfHStXrmQ7LKVy5coVxs/vt99+I0+ePCGampoEAImLi2M7RIVU3Ot3iVpGsrKy8OrVK7i4uIjLuFwuXFxc4OvrK/WYK1euoGXLlpg+fTrMzc1Rv359rFu3jjGuPb/MzEwkJSUxHhWRUCiEh4cHatSogd27d0v9mc2fPx96enrgcTloWc2UTrNNsWbjxo2M7VmzZkFXV5elaKhc+/btw5o1axhlEydOhLu7O0sRKacePXqgWrVq4u2HDx+ie/fuyMzMBADGBH9UyZUoGYmNjYVQKIS5uTmj3NzcHJGRkVKP+f79O86dOwehUIjr169j5cqV2Lp1K9auXVvg66xfvx6Ghobih62tbUnCVAn3799H48aNMW3aNMTFxUmtY2JighkzZsg5MoqS9OPHD8Z9cz09PXpuKoBz585J/B769OmDffv20aHWxRAaGop//vkHly5dwr179yTmyklMTBT/nyYjZaNWdJWyEYlEMDMzw8GDB8Hj8dCkSROEhYVh8+bNWLVqldRjli5dinnz5om3k5KSKkxCEhwcjIULF+Lff/8tsu78+fOhr68vh6goqnBbtmxhtNxNmTIFJiZ0FBeb/vvvPwwfPpzRl6FNmzY4deoUY0VaqmBWVla4cuUKzp8/X2Td4OBgOUSkukp0RlaqVAk8Hg9RUVGM8qioKFhYWEg9xtLSEurq6oyhfXXq1EFkZCSysrKkdm7T1NSEpqZmSUJTekKhEOvWrcO6deuQkVH0JGXGxsb0myelEKKiohhDHTU0NDB37lwWI6LevHmDvn37IisrS1xWr149XLlyBdra2oUcSeXF5XLxzz//4MePH3j16lWhdWnLSNmU6DaNhoYGmjRpwhi6JxKJcOfOHcaCQnm1bt0a3759Y6x2+OXLF1haWtJe9nnweDxMmTIFBw4cwKBBg2BgYFBo/Xnz5hVZh6LkYefOnYwEesyYMbCysmIxoootKCgIrq6ujL52tra28Pb2hrGxMYuRKScdHR1cuXKlyBGgtGWkjEraM/b06dNEU1OTHDt2jAQEBJBJkyYRIyMjEhkZSQghZOTIkWTJkiXi+iEhIURfX5/MmDGDfP78mVy9epWYmZmRtWvXyrw3rqoQiURk+vTpEr3fcx9GRkYkMTGR7TApiiQmJhIDAwPxucnlcsm3b9/YDqvCio6OJjVq1GB8XpiYmJCAgAC2Q1N6fn5+REdHp8DP5ebNm7MdokIq7vW7xDcOhwwZgpiYGPz++++IjIyEk5MTvL29xZ1aQ0JCGMtO29rawsfHB3PnzkXDhg1hbW2N2bNnY/HixaVMn1Tf6tWrsXfv3gL3z5s3D4aGhnKMiKKk8/DwYHwDHzx4MGPEASU/KSkp6N69O75+/Sou09bWxrVr11CnTh0WI1MNjRo1gqenJ/r16yd1ThHaMlI2HCLtp6pgkpKSYGhoCD6fr/K3JrZt24b58+czyiwtLREREQEAMDIywo8fP2gyQrEuPT0dVapUYUx46O/vT6cVZ0FWVhZ69eqFmzdvist4PB4uX76MHj16FHIkVVJbtmzBwoULpe7LyMiocP0di1Lc6zddm0aBHD16VCIR6dGjBx48eCDenjNnDk1EKIVw9OhRRiLSo0cPmoiwQCQSYdy4cYx
EBAAOHz5ME5FyMH/+fIwfP17qvryLD1IlQ5MRBXHu3DlMnDiRUdauXTv8+++/qF69Ojp06ABDQ0PMnj2bpQgp6pfs7Gxs3ryZUbZ06VKWoqnYFi5cKLE2yvr16zFmzBh2AlJxHA4H+/btk7qeDx1RU3o0GVEAPj4+GDZsGGPEUZMmTRjD8EaPHo3Zs2fDyMiIpSgp6pfTp08z7pH/9ttvaN26NYsRVUxbtmzBtm3bGGW0T17509DQwPnz51GjRg1GOU1GSo/OfMOyR48eoV+/fsjOzhaX1alTB97e3oz7awMGDGDUoSi2iEQibNiwgVFGW0Xk7/jx4xJ9F9zc3LBt2zY6u6ocmJiY4OrVq2jRogUSEhIAAI9ef4SxUxjM9LXQrKoJXZajBGgywiJ/f3/07NkT6enp4rIqVarg1q1bqFSpEqOunp6evMOjKKm8vLwQEBAg3nZycoKrqyuLEVU83t7eGDduHKPMxcUFx44dY4xmpMpXzZo1cf78eXTu0gVCgQCn/3uN29r+AABLQy2s6lWXrpxeTPSsZcmXL1/QpUsX8Pl8cZmFhQVu375d5OQ6FMUWQgjWrVvHKFu6dCn9Ji5Hz549w4ABAyAQCMRljRs3xoULF+hIDhZkVq4NI5epAABh0q8O3ZH8DEw94Qfv9xFshaZUaDLCgpCQELi4uCAmJkZcZmxsjJs3b9I5GiiF9t9//+H58+fi7Ro1amDAgAEsRlSxfP78GT169EBaWpq4rFq1arh+/Tpdp4oFQhGBu1cA9By7wqBZfwiSYiDKTIMoKx25c2a4ewVAKFL4GTRYR5MROYuKikLnzp0ZQ8B0dXVx48YNNGjQgMXIKKpo69evZ2wvWrSIse4UVX7Cw8PRtWtXxireZmZm8PHxkVhJnZKP50HxiODnLIVg1G40NMyrgf/sPML2jUHCvWPITo5FBD8Dz4PiWY5U8dFkRI4SExPRtWtXfPnyRVymoaGBy5cvo3nz5ixGRlFFe/nyJW7fvi3etrKywsiRI1mMqOJITEyEq6srYwSTvr4+vL29aWsqi6KTf63JxOHyYOwyGSn+1yHKTEXSs3MI2z8esVe34tlLPxajVA40GZGT1NRU9OzZE2/evBGX8Xg8nDlzBp06dWIxMooqnvytIvPnz6d9FOQgIyMDffr0wbt378Rl6urquHTpEho1asRiZJSZvhZjO/3LE4jSk38ViIRI/fAf5rp1gYuLC27cuCF1KnmKJiNykZmZif79++Px48eM8r/++gt9+/ZlJyiKKoGPHz/i4sWL4m0TExNMmjSJxYgqBqFQiOHDhzNmYeZwODh+/Dg6duzIYmQUADSragJLQy3kdt/WtK4NnTptAY7kpfXOnTvo3r076tevjyNHjjBWuqZoMlLuBAIBhg8fLjFV8+7du2kTN6U0Nm7cyPhGN2vWLDrcvJwRQjB9+nRcuHCBUb5z504MGTKEpaiovHhcDlb1qgsA4ADQMHNA5d6LYD35MAyc+4KjoS1xTEBAACZMmAB7e3usWbMGsbGxco5aMdGF8soRIQQTJkzA0aNHGeVr1qzBihUrWIqKokomJCQE1apVEw8l1dXVRUhICExMTFiOTLW5u7tj9erVjLKlS5dKDK2m2Of9PgLuXgHizqxAzjwjC9rb4MeTq9i5c2eB69Zoa2tj9OjRmDt3LmrWrCmvkOWm2NdvogT4fD4BQPh8PtuhFJtIJCJz584lABiP+fPnE5FIxHZ4FFVsM2fOZJzD8+bNYzsklbd//36Jz45x48bRzw4FJhCKyJNvseTS61Dy5FssEQh//a6ysrKIp6cnadKkicTvNffB4XBI7969yb1791Tq91zc6zdNRsrJH3/8IXGyjR8/XqVOMkr1pKenk8OHD4u3o6Ojiba2tvgcVldXJ6GhoSxGqPouXLhAuFwu47OjZ8+eJDs7m+3QqDISiUTk3r17pFevXgUmJQBI06ZNiaenJ8nKyir0+fz8/OQUeenRZIRFO3fulDi
5Bg0aRAQCAduhUVSh3r17RzQ0NMjz588JIYQsX76ccR5PmDCB5QhV2/3794mmpibjZ96yZUuSmprKdmiUjH369IlMnjyZaGlpFZiU2NnZkS1bthR47bO1tSVnz56Vc+QlQ5MRlhw7dkzihHJ1dSWZmZlsh0ZRRTp37hwBQGxtbcm3b9+IoaGh+Dzmcrnky5cvbIeost6+fcv4eQMgderUIXFxcWyHRpWj6Oho4u7uTszMzApMSvT19cm8efNIcHAw41h7e3sCgGzcuFFhW92Le/2mo2lk6OLFixKLV7Vp0wbnz5+HhoYGS1FRVPHlTsj38+dPODs7M9ZOGjRokMSS6ZRsBAcHw9XVlfHztrGxgY+PD+0orOIqV66M33//HcHBwTh06BDq1KkjUSc5ORnbtm2Dg4MDhg4dipcvXwLI6UwOAIsXL8a0adMY6xUpG5qMyMjt27fh5uYGkUgkLmvUqBGuXr0KHR0dFiOjqOL7/Pmz+P+5y6LnGj9+PMLCwhAUFIQvX75AKBTKOzyVFBsbi65duyI8PFxcZmRkBG9vb9ja2rIYGSVPWlpamDBhAt6/f49r165JnUdGKBTi9OnTcHZ2Rrt27Rh/o/v370fv3r2RnJwscZwyoMmIDDx9+hR9+/ZFVlaWuKxmzZrw9vaGoaEhi5FRVMnkTUby69KlC2xsbODg4ICDBw/SNWlkIDU1FT169GD83LW0tHD16lXUq1ePxcgotnC5XHTv3h137tzB69evMWLECKipqUnUe/DgASIimCsC37hxA7/99hvCwsLkFa7M0GSkjN6+fYtu3bohNTVVXGZnZ4fbt2/DzMyMxcgoqmQIIYUmI7mGDx+OTZs2ySEi1ZadnY1BgwYxVkHmcrk4c+YMWrduzWJklKJwcnLC8ePHERQUhEWLFhXry+2bN2/QvHlzxtIjyoAmI2Xw7ds3dOnSBYmJieIyMzMz3Lp1izavUkonNjZW4tZMfl26dMHRo0fB5dKPjrIg/58Q8caNG4zyAwcOoHfv3ixFRSkqGxsbbNy4EaGhodi5cyeqVKlSaP2wsDC0adMG3t7e8glQBugnSimFhobCxcUFUVFR4jJDQ0PcvHlTJWfRo1RfUa0iTZs2pZ2xZWTJkiX4559/GGVr167FhAkTWIqIUgZ6enro3r07tLUlp5nPLyUlBT179sTBgwcZ5UIRgW9gHC77h8E3MA5CkWJMwi55I4oqUkxMDDp37sxYzltHRwfXrl2Do6Mji5FRVOkVloxUr14d165do+vRyMD27dslbnNNnz4dy5YtYykiSlncvn0bgwcPLrIFM5dQKMTkyZPx/ft3rFu3DjcDoqROW7+qV1241rcsr7CLhbaMlBCfz4erqys+ffokLlNXV8fFixfpfV5KqeUO683P3NwcPj4+tA+UDHh6emLevHmMskGDBmHnzp3gcDgFHEVRQGBgILZu3QpjY+MSdx7fuHEjOnTvi8nHnjISEQCI5Gdg6gk/eL+PKOBo+aAtIyWQlpaGXr16wc/PT1zG5XJx6tQpdOnShcXIKKrspLWM6Ovr48aNG3BwcGAhItVy8+ZNjBkzhlHWoUMHHD9+nI5MoopUrVo1cR8jgUCA0NBQfP/+Hd+/f0dQUBDj/zExMRLHP/Dxgub7QFTuvxw8nV8dYQlyVhx29wqASx1zqPHYaaOgq/YWU1ZWFvr27SvR4ezIkSMSE51RlDKqU6eORIuft7e31PkOqJJ5+fIl2rdvzxh15+TkhHv37tHh/5TMJScnIygoSJykPHkdgGtP3kCQGAlweajcdyl4usYQZaZBzaASiEiIxPt/4+Lh7ejYwE6msRT3+k1bRopBKBRi1KhREonI9u3baSJCqQSBQIDAwEDxNofDwfHjx2kiIgNfv35F9+7dGYlI1apVcePGDZqIUOVCX18fDRs2RMOGDQEADv5heGHlDyISIs57F6IvrIUgLhQ6tVrBpMs0xF7ZhMywT0gS7GQtZpqMFEAoIngeFI+
opHQc27Qcl8+cYexftWoV5syZw05wFCUjuee5//sAZGdni8t37NiBIUOGsBiZaoiMjETXrl0ZzeaVK1eGj48PLCwsWIyMqii8vb1x58ELZEUbQb1yFWT+DIAgMad/SMbP94j4ey6ESdHgGVSGuUHRo3TKC01GpPB+HwF3rwCEJ6Yj8d5fSHp+gbF/1qxZWLVqFUvRUZRs5J7nEfwMpH37NfHW4PEzMGvWLBYjUw25nd2DgoLEZbq6urh+/Tpd44eSm5YtW2LEiBGIi4sDV9sAEP1axkGU9mstJC19YzSryt46SHQ0TT7e7yMw9YQfIvgZSHr6r0Qi4tJ7MLZv3057vlNKLe95DgCC+FAAgG79Tnhm2pX1nvXKLjMzE3379mXMgqmmpoYLFy6gadOmLEZGVTSGhob4/fffAQCi9CSIMlOl1qtT1QY8LnvXNZqM5CEUEbh7BYAASHl3G4kPmJMS6dRsiWTn8SCgiQilvPKe57my48OhZe8EU9eZ4HA4cPcKUJjJkJSNUCjEiBEjcO/ePUb533//TUfdUayYMmVKkSPi6lVjd9Zwmozk8TwoXvxNUcveCWomNuJ9WvZOqNRrESJTsvE8KJ6tEKkyUtTZB+Up73meS5jGR1bkN6QHPgcBEMHPoOd5KRBCMHv2bJw7d45Rvm3bNgwbNoylqKiKTkNDA+vWrSu0TuXKleUUjXS0z0ge0cm/PqDVDCqhcr+liP53NXh6Jqjcfzk4auoS9SjlkbePRC5FmX1QnvKfv4KkGGT+fAdRZgpiLq6DXqPuMO4wnp7nxZTbCTg6OQPXj+/Dwb17GfsXLVqEuXPnshQdReUYNGgQtmzZgpcvX0rdz/akhjQZycNMX4uxrVHJHuqVq0CYmgBBYiQ0zKpKrUcpvtw+EvnbQXJnH/QY0bjCJCT5z984nz0QZaSIt1NeX0fmz/dIcfEEnKzlHZ5SyZvgJr/xQbz3bsb+UaNGYcOGDSxFR1G/cLlcbNq0qcDh+my3jNDbNHk0q2oCS0MtRo8Qo5ZDkB35DRHHZiPhv6Mw0yas9jimSk4oIlh9+R2yEiORHviCMXIkNzmpSH0k8p/nJp0mQcO8GqNOdmwIJvR3wYEDB6AE8yKyIm8n4LSvzxDvw2wRadqmIw4fPkw7u1MKo0OHDujevbvUfWy3jNBkJA8el4NVveoCgPiDWtO6NjRt6gJEhKTnFxB8cCq8b1xnL0iqUCkpKXj16hVOnjyJlStXYtCgQahZpx6ereqJ8AMTEH3OHYkPjzOOqWh9JPKf5+om1rAYsQX6Tfsw6mVkZGDKlCkYNGhQsRfmqijydgLOCA1A7JWNABGJ92tY1gLHZS64PNr4TCmWjRs3gsuVvPTTZETBuNa3hMeIxrAw/NWUbdB8gPj/0eGh6NmzJwYOHIiwsDA2QqzwCCEIDQ3F7du3sWfPHsyYMQMuLi6wsbGBvr4+mjZtihEjRmDt2rU4d+4cvn/5CAh/TeiVHfcTJM+FI1dF6iOR/zznqKnDpNNE1Bq1FgbGzJa/8+fPw8nJCY8fP2YjVIWUtxMwh6cGjvqvzws1ExuYDfwd0emcCpPgUsqjfv36GD16tEQ527dp6No0BcjbKa2SrgYm9mmHjx8/Muro6+vjzz//xLRp0+hCV+UgIyMDX79+xadPnxiPz58/M6bWLg3rKUegZmjOKDs1sQVaVjMt0/Mqm7znuZm+FppVNUFUZARGjhyJu3fvMuryeDysXr0aS5culTjfvby80KtXL3mGzqrL/mGYfdofwpQEpH9/Aahp5kwFIMyGxYgtUDPM+Za5080JfWi/G0rBhIaGokaNGsjI+PUFLDU1FTo6OjJ/reJev2kyUkxHjx7F+PHjpe5r2rQpDhw4gMaNG8s5KuVHCEFMTIxEwvHp0yf8+PFDJv0VDAwMkKVhgMzEGBBBFkxcZ0C39m/gaub84XEAWBhq4dHijqxO+qNIhEIhNm3ahJUrV0IoFDL2tW/fHidOnIC19a+
LbO3atbFs2TKMGjVK3qHKlUgkgp+fH/Yf/xfHz15EVuRX6NRshUp9l0CYmghRejI0KtuL61fEBJdSDkuXLhV3rtbV1UVKSkoRR5QOTUZkLDMzE1WrVkVEhPSZKblcLmbNmoU//vgD+vr6co5O8WVnZ+P79+9Sk47ExESZvIa9vT1q166NWrVqoXbt2qhduzZsbW2xZcsWHDhwAACgU7MVKvdbJj4mN/WoSKNpSsLX1xdDhw5FcHAwo9zExAR//fUXevfujczMTOjq6kJDQwPPnz9H/fr1WYq2fCQnJ+PWrVu4du0arl+/jsjISPE+DYsaMB+2Hlx15gglmuBSio7P56NatWqIi4uDubUdLt73Q7OqJjI/X2kyUg42bdqExYsXF1rHxsYGu3fvRt++feUTlIJJSEjA58+fJRKOwMBACASCMj+/tra2ONnIm3TUqFEDurq6jLqPHz/G6NGjGavR1hm3CWmV64q3K+I8IyWVmJiIyZMn4+zZsxL7Zs6ciZEjR6JZs2YAclpIXrx4AT09PXmHKVPfvn3D1atXce3aNdy/f5+xiGCuSuaW0Bq4EWp6Jowh4zTBpZSB9/sITFmyBsHXPKBhWROWo7aVy+chTUbKAZ/Ph62tLZKTk4us27t3b+zevRt2dnZyiEy+hEIhQkJCpLZyREdHy+Q1LC0tJRKO3JYOaT3B88rMzMTvv/+OzZs3M27z1KhRAx8CPuJlcCKjjwT95lo0QgiOHDmCWbNmIT09nbHPyMiI0bo1bNgwnDhxQqmGtGZlZeHRo0e4du0arl69ii9fvhRaX1dXF48ePUKkmjmdSI9SOrnD0kWCbIQfngL1SnYwG7iqXBLp4l6/6bizEjA0NMTkyZOxZcuWQutxuVxER0fj1KlTWLBggdJ2bk1JScGXL18kEo4vX74gMzOzzM+vrq6OGjVqSCQctWrVgqGhYame09/fHyNHjsT79+8l9k2ZMgXqajx6D78UOBwOJkyYgNatW8PNzQ1v374V78t/m83T0xNt27bF5MmT5RxlyV29ehV///03bt68iaSkpGIdw+FwcPLkSTg5OQEAOte1kOgETBNcSlEJRQQrzz5H2o/3yIr8mrOSLzcnFSDIadlz9wpA57oWcj2PactICYWGhsLBwUFqsy0ALFiwACtWrCj1xbQg4eHhsLKykulzAjnfeMPDw6W2coSGhsrkNUxMTFCnTh2JpKNq1apQU5NNPiwQCLBx40asXr1a6u0gTU1NhIWFwdSUJiJllZGRgYULF2LPnj0F1tHQ0ICvr6/Cd+qOj4/H6tWrsW/fPomOugXZvHkzFixYUM6RUZRspKam4vXr13j58iVevHiBh0+e4ueP74w6ek7dYdp1GqNMVp2vactIObGxscHw4cNx7NgxqfsPHz6MsWPHyiQZIYTg/v37WLduHZo3b441a9aU+rkyMjLw7ds3qcNkZdGLmsvlwsHBQeqtlUqVKpX5+Qvz5csXjBo1Cs+ePSuwzpAhQ2giIiNaWloYP348bt68WeDtjKysLAwaNAivXr2CkZGRfAMsARMTE+zatQuTJk3CxIkT8fTp00LrT5gwAfPnz5dTdBRVMpmZmXj37h1evHiBFy9e4OXLl/jw4QNEIsl5lZgk2yTkPe8STUZKYcGCBYxkhMvlin/ZiYmJ6NatG3x9fUvdkkEIwfXr17Fu3To8efIEAIq1vgUhBLGxsQUOky36hCyavr6+1ISjevXq0NTULPPzl4RIJMLevXuxePFiiX4M+U2ZMkVOUam2jx8/YtWqVfj333+LrPv9+3eMGzcO58+fV+j+I4QQPHv2TGIeofw6dOiAvXv3KvR7oSoOoVCIgIAAcYvHixcv8PbtW2RlZZX4uQQJ4RJl8l6DjSYjpVCvXj306NED165dA4/Hg7e3NwYOHAg+nw8ACAkJQY8ePfDgwYMSDfMVCoU4f/481q1bhzdv3ojL7e3t0ahRI/F2dnY2goKCpLZyxMfLZsZHOzs7iYS
jdu3asLS0VIgP45CQEIwdO1ZiYi5pHB0d0aJFCzlEpdqys7Nx48aNIjt35nXx4kXs2LFDYVetDQoKwqRJk3D79u1C69WoUQPnzp2DhoaGnCKjqF9EIhECAwMZLR5+fn5IS0sr8XPp6+uDU8kBqFwNGpY1oWFRnTEBZO6wdHmvwUb7jJTSgwcP0K5dO/Tv3x/nz5/HvXv30LVrV0ZW2rlzF6zc9TfiM4SFdmzLysrCyZMnsWHDBqkf9C1atED79u0Zw2QL6rNSElpaWqhZs6ZEwlGzZk2JYbKKhBCCAwcOwMfHB76+voiKiiq0voeHB20ZkbEPHz7g1KlT8PT0RFBQUKF11dTU8ODBA7Rs2VJO0RVNJBJhz549WLZsWZGz+RobG+Pp06eoWbOmnKKjlFlAQACMjIzK1DL+8+dPRovHy5cvxV92S0JLSwuNGjVC06ZN4ezsDGdnZ9SsWRM3A6Iw9YRfzuvlqc/maBqajJQSIQQtW7bEH3/8gS5dugAATp8+jaFDhzLq6dZ3gWn32eBwOBJD/tLT03H48GFs3rwZP3/+LLdYLSwspLZy2NnZFTlMVtERQvDPP/9gzJgxUvfr6ekhPDycTkRXTnJvcXh6euLMmTMFDu22sbHB69evYWxiyvrIk0+fPmH8+PHiW6B5tW3bFuPHjxev3aGmpoabN2+iQ4cOco2RUj6hoaFYvXo1Tp06hdjYWGhraxfruOjoaEbS8eLFi1JNkaCmpoYGDRqIk46mTZuiXr16UFdXl1rf+32EXIal02REDp4+fYpmzZoxLuibN2/GokWLGPUMWw+FUZvh4qxzS5/q+Hr/IrZv3y6zeTnU1NQKHCaryB0Iyyo4OBhNmzZFbGys1P1Tp07Fvn375BxVxSQQCHDnzh14enriwoULEh2jm7bpCJ7rEkQm/2o9lOecHNnZ2diyZQvc3d0lhqbr6elh06ZNmDx5MsLDw2Frawsgp0N6QctAUBSQM9Hjxo0bsXPnTmRkZKBjx464c+eO1LqJiYl49eqVOPl48eJFqb6Icjgc1KlTh9Hi4ejoCC2tkvXzkLY2FZ2BtRCKmoxIIxCKYNOmP6KeXmaUV+q1AFpVGiH55RWkvL4KYUbpFnozNjaWaOHIHSZbUAasqtLS0tC6dWv4+/uLy6ytrRmrKb958wYNGzZkIbqKLT09HVevXoWnpyeuX78uvn1p1HYUDFsOFteT12yl/v7+GDduHF6/fi2xz9XVFQcOHBBPUCgUCqGpqYl58+Zh06ZN5RYTJUkeF0dZycjIwJ49e7Bu3TokJCSIy9evX48lS5aIh9TmbfH4+vVrqV7LwcGB0eLRuHFjpWntpckIS3wD4+B24DFiLq1H+tecYYLqZlWhYVkLaQH/gWSXbrKwdevWYcKECahUqZJCdCBlGyEEw4YNw+nTp8Vlurq68PX1xfLly+Hl5YVWrVrRZe8VQGxcPJpPWofwV7eQ8TMA5kP+gJbdrwQxt8Pcw0UdoMaT7W3DzMxMrFmzBhs3bpSYf8bY2Bg7duzAyJEjJf6mZs+ejW3btinthIXKSF63DcpKKBTi+PHj+P3336W2arRv3x6xsbEICAgo1QhGa2trRotH06ZNYWIi386kskSTEZbkLi0uys5A1Onl4GkbwLjrdIiS4yBIjER2YgQECZGwU09CYuTPAhfey8/Ozg5v3rxR6VsuJSFtnaBz585hwIABePjwIdq2bYt//vkHI0eOZClCKpdvYByGHspJzDOjvyPt02OoGVSGKCMZhi0GgQgF4D85jS3zxmLCgC6ye11fX4wfP17qkN0BAwZgz549sLCwkHqsSCRS+v5UbBGKCP57F4yNq5fCwcEB3do2h5NjQ9jb2xf4RSp3evK8FyNRVgayIr5A276hXNb5KapVhhCCa9euYcmSJfjw4YNMXtPU1JSRdDg7O8PSUnESL1mgk56xJHdsNlddC+aD3MHR0AaHywP0K0HTqpa43pH/z26XmpqK79+/IzAwEIG
Bgfj27Zv4/8HBweJZIUNCQjB16lR4enpW+JYRb29vLFmyhFG2fPlyDBgwAADQpk0b9OjRA4MGDWIjPCoPkUiEM54nIEw1BU/XGGkfHyDp6bmcnRwutB2aIO76TmRFBUJz7bLCn6yYUlNTsXz5cuzatQv5v2uZm5tj79694nOlIDQRKZ28rRtJKYa4vW0dDm7L2aevr48GDRpIPAwMjeDuFQACgIiEyAh6jZQP/yHtyxMYtR4KbfuG5T49eVGtMk+fPsXixYvx4MGDUr+Gvr4+mjRpIk4+nJ2dC03QKhqajMhYs6omsDTUQiQ/A1wtyZVL84/h1tXVFf9R5pednY3g4GBGovLp0yfUqVOnvN+Gwvr69SuGDh3KuMj07NkTf/zxh3ibw+HA09OzxJ25KNnjcrmI+P4RoX8fgqZtfXA18owwICJEHJsDEBG42gaoblf25Q7u3LmDiRMnSh1uPHr0aGzbtk2pm7wVWf7WDf3GPZD28SEywwIAAMnJyXjy5InEKCYzCyskcg0AYTayEyJAsn7NnZEdHwqRIBsRfOB5ULzM15UihODKqyDM/NsXwqx0kKx0qFeyBYenjkh+BsbvvIwqQVfw5M6NEj1v7pDavC0eNWvWpEluIUp1m2bv3r3YvHkzIiMj4ejoiN27d4uXEC9M7tDXPn364NKlS8V+PWW6TQP8+qMEyn8Md0WSnJyMFi1aICAgQFxWq1YtPHv2TOZrAVGy8z3oB6pVrwYUcv9cz64eEoPelfqbL5/Px4IFC3D48GGJfba2tjh48CBcXV1L9dxU0YQigjYb7zJaFiJPLkZmxGdAKLlWVEloWNVC5b5LsXeiC/o4WUMoFCIlJQXJyclITk5GUlKS+P/SHkXtz9+XyGrSQXDUNMF/7ImUt7cAUvJ+HxcuXEC/fv3K9L5VRbndpjlz5gzmzZuH/fv3o3nz5tixYwe6du2Kz58/w8zMrMDjfvz4gQULFuC3334r6UsqHdf6lvAY0Vii2c9CATtjKQuRSIRRo0YxEhEDAwNcvnyZJiIKzqFqFbR37YN71y8WWKdl4/qlTkS8vLwwZcoUhIdLTmk9bdo0bNiwQWlGHiir50HxjM86ADkX8TImIgCQFf4ZYR7jMPKkAYTZWaWadbQkMsM+IzXgPwj4UeBoaINklnzk49ixY1G/fn3UqFGjHCJUTSVORrZt24aJEydi7NixAID9+/fj2rVrOHr0qMR9/FxCoRDDhw+Hu7s7Hj58KLHkuCpyrW9JlxaXoTVr1jBa03JvxdSqVavggyiFsf3P39GokGSkU4tGBe4rSExMDGbPno1Tp05J7KtRowYOHz6Mtm3blvh5qZKLTPqViKQH+SHt0yOQUrQoFIiIkMxPlN3zFULNsDLMB/+67UsE2VjpYg2nShxERUUhOjoaUVFRUv8fExMDQgj4fD769++Pp0+fKvRs1oqkRMlIVlYWXr16haVLl4rLuFwuXFxc4OvrW+Bxf/zxB8zMzDB+/Hg8fPiwyNfJzMxkTEqUlJRUkjAVBo/Lkfk9zoro0qVLWL16NaNszZo16NGjBzsBUSXm5OSELl264ObNm1L3lySpJITgzJkzmDlzpsRkd1wuF/Pnz4e7u3uxZ8Ckyi4+5dfnddy17RCm5sy7oVapCgSxP1iKSpKenh709fXFD6KmhY9x2eBoaIOroQOuhjZ4usaMYzhq6qhXwwFNi/FZLhQKERsby0hSHBwcyuvtqJQSJSOxsbEQCoUwNzdnlJubm+PTp09Sj3n06BGOHDnCmJiqKOvXr4e7u3tJQqNUVEBAgMTw3IEDB2LZMtmMvKDkZ9GiRWVORsLDwzF16lRcuXJFYl+DBg1w5MgRODs7lylOquRMdHMWEBSmJ0OUned2jaiMt2m4PHAIkWhlMTIygouLC6ysrBjJhYGBAWM770NPT0+iA2luX5dIfgakdZ4s6aJxPB4P5ubmMDc3lzoogSpYuY6mSU5OxsiRI3Ho0CFUqlSp2MctXbo
U8+bNE28nJSWJp2emKo6EhAT06dOHMa14gwYN8Ndff9HhcEqoY8eOaNSokcQsqDweD9WqVSv0WEIIjh49ivnz50ssGKauro4VK1ZgyZIldFVdllgY5rRC8bT1YTZoNfhPzkLTph7Svz6Bsctk6NZtB0F8GPpaJOHH+xd4/PgxkpOTC33Olu1c8PDuTSQmxMPNzY2xsnJiYiL+++8/nD59Gi4uLqWOm8flYFWvuph6wg8cSB9wsKpXXXp7XQ5KNJomKysLOjo6OHfuHPr27SsuHz16NBITE3H5MnMKdH9/fzRq1Igxi2HujHRcLhefP38u8kMIUL7RNFTZCYVC9OzZE97e3uIyY2NjvHz5kjZ7KjFpi0lWr1690Gmyg4KCMGnSJMbFKJezszOOHj2K+vXryzxWqvikjaYhwuyclg1OTmuEpaEWHi3uCB6XA4FAAH9/f9y/fx8PHjzAw4cPGVOq57p16xZcXFwgFAqxfPlybNy4kbGfy+Vi/fr1WLhwYZm+oCjL7K/KqNxmYG3evDmaNWuG3bt3A8hJLuzs7DBjxgyJDqwZGRn49u0bo2zFihVITk7Gzp07UbNmzWJ9k6HJSMWzZMkSxgcPl8uFj49Pmb4FUewTCASoUaMGfvz4IS7r2bMnvLy8JOoKhULs3bsXS5culRhBoaWlhbVr12LOnDl0ynYFIW0W1VwcFD6lgUgkwrt378TJyYMHDxATE4MGDRrg9evX4t/xv//+i7FjxyI1lTnCZdCgQTh69Cj09CTndiouZVoXR5kU+/pNSuj06dNEU1OTHDt2jAQEBJBJkyYRIyMjEhkZSQghZOTIkWTJkiUFHj969GjSp0+fEr0mn88nAAifzy9puJQSOnXqFEFOi6n4sXXrVrbDomRk9+7djN/t/PnzJeoEBASQVq1aSZwHAEi7du3I169fWYicKsqNd+GkxbrbxH7xVfGjxbrb5Ma78BI9j0gkIh8+fCAeHh7kw4cPjH3v3r0j1atXlzgv6tatS758+SLLt0PJQHGv3yVORgjJ+TCxs7MjGhoapFmzZuTp06fife3atSOjR48u8FiajFCFef36NdHW1mZ8yIwYMYKIRCK2Q6NkJCUlhZiamop/vwcPHhTvy8rKIn/++SfR0NCQuNjo6+sTDw8PIhQKWYyeKopAKCJPvsWSS69DyZNvsUQglP3fbkJCAunZs6fEOWJgYEC8vLxk/npU6ZVrMiJvNBmpGKKjo4m9vT3jw6VJkyYkLS2N7dAoGfv999/Fv+M/D58jT77FkhcvX5FGjRpJbQ3p1q0bCQkJYTtsSoEIhUKyatUqqefL6tWradKqIIp7/aYT5VMKITs7G0OGDEFwcLC4rHLlyrh48SKdL0IF1ek0CBy1nP5i+17y4TpyGpybOUuMtDExMcE///yDa9eu0RF1FAOXy8Xq1avh5eUl0Rdh9erV6Nu3r8TIK0px0WSEUggLFizAf//9J95WU1PD+fPn6QVIBXm/j8DS68HQbdAZUNdC1NlVSPI9K7F2zcCBA8XzzNCh3FRBevbsiZcvX6Ju3bqMci8vLzg7O+PDhw8sRUaVBE1GKNb99ddf2LVrF6Ns165dFWIdo4pGKCLi5eK1bOsD2RkQxIcy6qjrm+Dff8/h33//lZhgkaKkqVGjBp49e4aBAwcyyr9+/YrmzZvj3LlzLEVGFRdNRihWPXv2DFOmTGGUTZw4UaKMUg15F1TTqd0a6pXsGft167vAfNw+WDdqL//gKKWmp6eHs2fPYsOGDYyZVlNTUzFo0CAsWbIEQqGQxQipwtBkhGJNREQE+vfvj6ysLHFZy5YtsXv3btosr6Kik39NKsXhcFG5/3Jw1DTBM6gMs0HuqNRjDnhaeox6FFVcHA4Hixcvhre3N0xMmFO4b9y4Ea6uroiLi2MpOqowNBmhWJGZmYkBAwYwln23srLC+fPnoampyWJkVHky09dibKsbW6HygJWwGrcX2g5NCqxHUSXRuXNnvHz5Ek5
OTozy27dvo0mTJhIdpSn20WSEkjtCCGbMmMFY6VlDQwMXLlyApSWdelmVNatqAktDLeRt99Ku4gSupg6AnJk6LUuwMBlFFaRq1ap4/PgxRowYwSgPDg5Gq1atcPz4cZYio6ShyQgld/v378fhw4clypo3b85SRJS85C5MBgD5b8TRhckoWdPR0cE///yDXbt2QU3t17qwGRkZGDVqFGbNmoXs7GwWI6Ry0WSEkquHDx9i1qxZjLKZM2di7NixLEVEyZtrfUt4jGgMC0PmrRgLQ61C1y+hqNLgcDiYOXMm7ty5AzMzM8a+3bt3o1OnToiKimIpOipXiRfKYwNdKE81/Pz5E02bNkV0dLS4rEOHDvDx8YG6ujqLkVFsoAuTUfIWFhaGAQMG4NmzZ4zy3P5qLVq0YCky1VXc6zdtGaHkIj09HX379mUkIvb29jhz5gxNRCooHpeDltVM0cfJGi2rmdJEhCp31tbWuH//PiZOnMgoDw8PR7t27XDw4EGJY/z9/fH+/Xt5hVhh0WSEKneEEEyaNAl+fn7iMm1tbVy6dAmVK1dmMTKKoioaTU1NHDx4EAcPHoSGhoa4PCsrC5MnT8bEiRORmZkpLn/06BFGjBjBKKNkjyYjVLnbvn07Tpw4wSg7evSoxLA7iqIoeZk4cSIePHgAa2trRvnhw4fRtm1bhIbmzAz84sULvHnzBqtWrWIjzAqDJiNUubp9+zYWLlzIKFu0aBHc3NxYioiiKCpH8+bN8erVK7Rt25ZR/vz5czRp0gT379/H8+fPAQCbNm3CgwcP2AizQqAdWKly8/37dzg7OyM+Pl5c5urqiqtXr4LH47EYGUVR1C/Z2dlYuHAhdu7cySjn8XiMKeTt7e3x9u1beh0qAdqBlWJVSkoK+vTpw0hEqlevDk9PT5qIUBSlUNTV1bFjxw4cP34c2tra4vL8a9kEBwdLTE1AyQZNRiiZEYoIfAPjcOl1KHoNHMboga6np4dLly7B2NiYxQgpiqIKNmLECDx58gRVqlQpsM7ff/+N8+fPyy+oCkKt6CoUVTTv9xFw9wpABD8D/CdnkPjQi7H/+PHjqFevHkvRURRFFU0oFOLLly/Q19cvtN7kyZPRqlUrunyFDNGWEarMvN9HYOoJP0TwM5D27TkSHzJHzgyfOg99+/ZlJziKoqgiEEJw5MgR1KpVC0OGDMG7d+8KrR8XF4dx48ZBCbpcKg2ajFBlIhQRuHsFgAAQJEUj1msLgF9/oNo1WuCbtSuEIvpHS1GUYuJwOHB1dcWYMWNgZ2dXrGO8vb3h4eFRzpFVHDQZocrkeVA8IvgZAACefiUYNO8v3qduaotKPeYhMjkLz4PiC3oKilJJuX2oLvuHwTcwjibkCs7a2horVqzA9+/fcePGDfTr16/IzvYLFizA58+f5RShaqN9RqgyiU7OEP+fw+FCTc8UlfouQ8Ldw6jcf4V4afi89ShK1eXtQ5XL0lALq3rVpQsBKjgejwdXV1e4uroiIiICf/31Fw4dOoQfP35I1E1PTxd3euXy1OhaS2VA5xmhysQ3MA5DDz0FAKQG3Aff9wysxu8DEWaDw/u15sypiS3QspopW2FSlNzk9qHK/8Gae1miKxMrH5FIhNu3b+PgwYO4fPkyBAIBY//QyXMQZN+TJp9S0HlGKLloVtUEloZaSP/6DLFXt0K9kj0AiBMRDnL+KJtVNWExSoqSj9w+VCKREKkB9xB7dau4k2NucuLuFUBv2SgZLpeLLl264Ny5cwgNDcWGDRvg4OAg3n/q4C78CPBnHBPJz8DUE37wfh8h52iVE01GqDLhcTnoXSkW0ZfXA0QE9cr24n253wRX9apLmyupCuHRpwh8uX8J4YemINZrC1I//If07y/F+wmACH4G7UOlxMzNzbF48WJ8/foVPjdvwaRBO4DDRezVrRBlpQMAiEhIk88SoskIVSZPnjzB2jnjAGFOs6VG5arifRaGWrRJmqoQ0tLSsHPnTgzo0AT
xPnsgSPz1bTjh9gGJ+rQPlfLjcrnQd2gE/e4LYTPtGPScXJH8+gZS3t1BxF+zIMpIoclnCdAOrFSp+fn5oXv37khLSxOXeczsCzUjc9qBi6oQ+Hw+9u3bh+3btyMmJkZqHQE/Gtnx4VA3sRKXmelryStEqhzlJpU8XSMYNO2N+DuHkXjvKAAg1msLKg/8HRwOlyafxUCTEapUPn78iK5du4LP54vL9PT00K+tE7hc2uBGqbbY2Fjs2LEDe/bsYfwN5KVpVRvatVoj8b8jSA96BXUTK3CQ02JI+1CphrxJZVbUd6T43xBvp39/Cf6jUzD6bThNPouBXjWoEvv+/TtcXFwQGxvLKG/QoAFNRCiVFh4ejnnz5sHe3h5//vmn1ETEqXkbmLutg8WIzeBwcloGU9/foX2oVFBuB34OAE2rWjBqN4axn//kFDTD/WjyWQz0ykGVSFhYGFxcXBAeHi6xr0GDBixERFHlLygoCFOmTEHVqlWxfft2xq3JXL169cLTp0/x+ulDHFs+BpZG2sgMDQAAZEV+g0FGJO1DpWJ4XA5W9aoLIKfDvkGzftCp/RujTujFzQj89pWF6JQLTUaoYouJiUHL39ojKChI6v6GDRvKOSKKKl8fP37EqFGjUKNGDRw4cABZWVmM/RwOB0OGDMGbN29w5coVNG/eHADgWt8SDxd1gHbCN3HdzuqfaCKiglzrW8JjRGNYGGqBw+HAtNts8RQHAJCWkox+/fohOTmZxSgVH01GqGIhhGD2inWI5RhCq2oT/Bq4+0uarpXkgRSlhPz8/DBw4EDUq1cPx48fh1AoZOxXU1PDuHHj8OnTJ5w+fVpqIh4S/ANxMdHi7ZMnTkhMlkWpBtf6lni0uCNOTWyB3aNa4OTpf2FoaCjeHxAQQBfWKwJNRqhiEREgqEpPmA1yh36TnoDE/JLA2e8cOp6eUmqPHj1Ct27d0KRJE5w/f17i4qGlpYUZM2YgMDAQR44cQc2aNQt8rsePHzO2IyMjcevWrXKJm2Ifj8tBy2qm6ONkjUGdnHHy5ElxnyEAOHfuHDZt2sRihIqNJiNUgbKyshAXF4fg4GCc8nmMHwGvkR7kB2FaEvScuoGjoQOjdmPA0zUGT78SYrLU6Xh6SukQQnDz5k20a9cOv/32G7y9vSXq6OnpYfHixfjx4wd2795drJVd8ycjAPD333/LJGZK8fXo0QOrV69mlC1btowmpAWgQ3srED8/P9y8eRPJycniR0pKCmM77yP//fEcHBi0HAQTl8kwajsKXE0daFrWRNKLiwDoZE6U8hCJRLhy5Qr+/PNPvHz5UmodExMTzJ49GzNnzoSxsXGJnl9aMnLp0iUkJibCyMioNCFTSmbFihV49eoVrly5AiDnnHNzc8OrV69QpUoVdoNTMHShvAokMzMTgwcPFv9hlBRP1ximPedDu4qTxL7sxEioG1nQBfEohScQCHDmzBmsX78eHz58kFrHwsIC8+fPx+TJk6Gvr1/i10hISICJifThnAcOHMCkSZNK/JyUcuLz+XB2dsbXr79G1DRq1AiPHz+GtrY2i5HJB10oj5KgqamJc+fOYdCgQSU+tkuXrnCcdRA6UhIRANAwsqAL4lEKLTMzE4cOHULt2rUxYsQIqYmIvb099u7di6CgICxYsKBUiQgA+Pr6Frjv2LFjpXpOSjkZGhri4sWL0NXVFZe9fv0akydPph1a86DJSAWjpqaGGTNmFLvJWU1NDZs2bcKNG9fx57DWACTH0dDJnChFlrtuTLVq1TBp0iQEBgZK1KlZsyb++usvfP36FdOmTYOWVtlmzJR2iyaXr68vvnz5Uqbnp5RLvXr1JJLQ48ePY+/evewEpIBoMlJBBAQEYPny5XBwcEC7du2QkJBQ5DFVqlTBo0ePsHDhQnC5XMZ4+rzogniUIuLz+Vi3bh3s7e0xZ84chIWFSdRxdHTE2bNnERAQgDFjxkBdXV0mr11YMgIA//zzj0xeh1IeAwcOxOL
Fixllc+fOxcOHD1mKSLHQPiMqLCwsDKdOncLJkyfh7+9fomMHDx6MgwcPMsbK5xKKCJ4HxSM6OYMuiEcpnOKsG9OyZUssX74c3bt3Zwy/lIXs7GwYGhoiPT29wDq2trb48eMHXT6hghEKhXB1dcXt27fFZebm5nj16hWsra1ZjKz8FPv6TZQAn88nAAifz2c7FIWXmJhIjhw5Qjp06EA4HA5BzoQgxX5oa2uTQ4cOEZFIxPZboagSCQsLI3PnziU6OjoFnt+dOnUid+/eLdfz+9mzZ8X6W7t9+3a5xUAprtjYWGJvb884F1q0aEEyMjLYDq1cFPf6TdNyFZCZmYmLFy9i4MCBMDc3x/jx4/Hff/9J7RzF5XLRpUsX/P333xJNhvXq1cOLFy8wYcIEmX9bpHJalHwD43DZPwy+gXFlniBO2u+3IirOujG9e/fG06dPcfv2bXTo0KFcz++8t2jyD9/s2bMnqlevDoDOOVJRmZqa4uLFi4x+SU+fPsWcOXPYC0oB0HlGlJRIJMKDBw9w8uRJnDt3DomJiYXWd3Z2xvDhwzFkyBBYWFgAACZOnCjeP3nyZGzbtg06OjrlGXaF5f0+Au5eAYjg/5qHxdJQC6t61S12X5vk5GT4+vri4cOHePjwIaZMmQI3N7fyClnhBQQEYMOGDfD09JSYrh3ISbwHDx6MpUuXynXdpMePH6NmzZrYsWMHBAIBevfuLd7XpUsXXL58GTdv3sRff/2F1NRUxigLqmJo1KgRDh48iFGjRonL9u/fD2dnZ4wbN47FyNhDkxElQgjB27dvcfLkSZw6dQqhoaGF1q9evTqGDx+OYcOGSZ22Ojg4GIaGhjh06FCphvtSxeP9PgJTT/hJTKAfyc/A1BN+BXb+jY6OxqNHj8TJh7+/v/ii27hxYwwePFgO0SsePz8//Pnnn7h48aLU1iE1NTWMGjUKS5YsQY0aNeQeX79+/eDp6QkNDQ2JzokJCQk5ncFdXeHq6ir32CjFMXLkSLx48QK7d+8Wl02dOhUNGjSAs7Mzi5GxgyYjSiA4OBienp44efJkgZM05TIzM4ObmxuGDx8OZ2fnQpujLSws8Pr1a1StWlXWIVP/JxQRuHsFSFnJJ+dmMQeAu1cAXOqY42dIsDjxePjwIT5//lzg8+7YsUNmnR+VpUPyo0eP8Oeff0qdrh3IWTdmwoQJWLhwYbGmay8vw4cPF/8//xD64oxioyqOrVu3wt/fX5y0ZmVloX///nj16hXMzMxYjk6+aDKioOLi4vDvv//i5MmTePToUaF1dXV10b9/fwwfPhydOnWCmlrxfq3Hjh2jvfnL2fOgeMatGQAQZaUjKzYEXHVNZP78gOjQD7DaORIxURHFes4qVaogMDAQsbGxMDQ0hIGBAQwNDcUPTU3NYscni9tH5YkQglu3buHPP//EgwcPpNbR09PD9OnTMXfuXJibm8s5wsLlT0aKup1KVSzq6uo4e/YsmjRpgvDwcABAaGgohgwZglu3bhX7s1wVVJx3qgTS09Ph5eWFEydOwNvbG9nZ2QXWVVNTQ9euXTF8+HD07t27VPedaSJS/vKu1UMIQer7u4i/cwAkMx15Vz6W7HJZsB8/fmDs2LEF7tfQ0GAkJ/mTldztnynAqdex4GjqgKdrBA3zagCKvn0kDyKRCJcvX8a6devKZd0Yecm/Bg1tGaHys7CwwLlz59CuXTvxZ/69e/ewePFibN26leXo5IcmIywTCoW4e/cuTp48iQsXLiA5ObnQ+q1atcLw4cMxePBgVKpUSU5RUqVlpv+rx3zCnYNIfuUl3ta0qQdRZiqyY37I9DWzsrIQExODmJiYYh+jYV4NlmN2AmDePupc10Kut2zksW6MPOno6EBdXV18kaEtI5Q0LVu2xO7duzFlyhRx2bZt29C0aVMMHTqUxcjkhyYjLCCE4NWrVzh58iROnz6NyMjIQuvXqVNH3BGV9u9QLs2qmsDSUAuR/AzoNeiMZL9rABE
BADLDP8F63F6YaHPgov4Zpzw9izwXygtHnTmrLgEQwc/A86B4uSx8mJmZiX/++QcbN26UOl07kLNuzKJFizBu3LgyT9cuLxwOB0ZGRuLEkLaMUAWZNGkSXrx4gSNHjojLxo8fj3r16sl1NBhbaDIiY4V1BgwMDMTJkydx8uTJItemsLKywtChQzF8+HA4OTnReT+UFI/LwapedTH1hB80zR2g59gFKf7/74ApEiL+7mEcvnwFrvUnYdPGjbh48SLOnz8PLy8vqfNlADlzVbi5uYHP54PP5yMpKUn8/4K2RSJRoXEKU+Kllue9zVQe0tLScOjQIWzevFnqdO0AUKtWLSxduhTDhg2T2XTt8mRsbCxORmjLCFUQDoeDPXv24O3bt3jx4gWAnFv3/fr1w4sXLwpcBVpV0GREhqR1BqzES4ez6BNe/3cVz549K/R4AwMDDBw4EMOHD0e7du3A4/HKO2RKDnLX9HH3CoDgt5FI/fgQJDMVAJD+/SVEIa+B+pZQU1PDlStXMGXKFBw+fBgXLlzA8ePHcefOHcYQ1pcvX+L8+fPQ0NAo1usTQpCamspITnw//sS6S68gykpDypubQAH9h/LeZpIlPp+PvXv3Yvv27YiNjZVax9HREcuXL0f//v2V+m8hb78R2jJCFUZLSwvnz59HkyZNxAns9+/fMXz4cFy9elWp/w6KVL4TwcqGMkwHf+NdOKmy+CqxX3yV2M79l5j2nE+0qjYh4HALnRJaQ0OD9OvXj5w7d46kp6ez/TaociQQisiTb7Fk/MLVjHOgZs2aJDMzk1y9epUAIO7u7ozjfv78STZu3Ejq168vPubkyZNljqXFutukcp8lBADRa9iF2P///LVffJVUWXyVtFh3mwiEsp02PSYmhixfvpwYGhoW+DfRsmVLcvXqVZVZkqBr166M95ednc12SJSC+++//wiPx2OcNytWrGA7rFIp7vWbJiMykPvBnvtBrl65SqEJCIfDIe3btyeHDh0i8fHxbIdPyVlWVhapW7cu45xYuXIlsba2JgCIi4uL1ONEIhF5/fo1mTdvHunbt2+Z4zjm85xwNXUJAKLfpBcjEamy+Cq58S68zK+Rqzjrxri4uJT7ujFsGDJkCON9xsbGsh0SpQS2bdsm8Tdy8eJFRp2fP38q7HUxV3Gv3/Q2jQzkn0tCu1ozqSMkqteuh0njRsPNzQ22trZyjJBSJOrq6tixYwe6dOkiLluzZo34/76+vhAIBBJzDHA4HDg5OcHJyQkCgQCEkFL3JRIIBDj0x1yI/n+7iKOhLd5nIcN5Rr5//45Nmzbhr7/+QlZWltQ6vXv3xrJly9C8efMyv54ikjbxmalp+XcKppTbnDlz8OLFC5w6dUpcNmrUKDx//hy1a9cGkDPiplatWpg8eTJbYcoMnWhCBvJ38tOt89uvDZ461CtVgZ5TN7gOGYvGjRsjIyMDGRnl2zGQUlxZWVlwcnJCmzZtpO5PTU3F69evC30ONTW1MnVqXrNmDWNBt6Eta2CnmxNOTWyBR4s7ljkRCQgIwMiRI1GzZk0cOHBAIhHhcrlwc3PDmzdvcPnyZZVNRAA68RlVOhwOB4cOHWKMpElOTka/fv2QnJyMuLg4HDx4EAcPHmQxStmhLSMykL+Tn4ZZVRj+NgKCxCikvruF7NgfyI79gT3+N7AnTz1zc3PY29vDzs4O9vb2jP/b2dnB2NiYjqJRIS9fvkT37t2LNf/HgwcPym19igcPHmDt2rWMsrr2ZujjZF3m53716hXWrVunsOvGsIFOfEaVlq6uLi5cuICmTZuKk9hPnz5hzJgxaNiwIVJTU+Hn54dXr16hSZMm7AZbRqVqGdm7dy+qVKkCLS0tNG/eHM+fPy+w7qFDh/Dbb7/B2NgYxsbGcHFxKbS+MsqdSyJv2mDUyg2Vus9GpV4LAZ704YhRUVF4/vw5zp07h61bt2LWrFno27cvGjVqBFNTUxgYGGDfvn3yeRNUuWvatCkuXbo
kcXGSJv8Ca7ISHx+P4cOHSwz1LWwG36KGBQM58Xbr1g1NmzbFhQsXJBIRLS0tzJw5E4GBgThy5EiFSUQA2jJClU21atVw6tQpxhfTCxcuMG7tqkLrSImTkTNnzmDevHlYtWoV/Pz84OjoiK5duyI6Olpq/Xv37mHo0KH477//4OvrC1tbW3Tp0qXAOQWUUe5cEgCQvx1Dr247WAxdDyOTks2WyuPxsGHDBkybNk1GUVKKoFWrVrh3716Ri2A9evSoWElASRBCMGHCBKmrPevp6Uk95vPnz1i1alWBz+fj44O2bduibdu2Uhew09fXx+LFi/Hjxw/s2rWL1QXs2EJbRqiycnV1ZSQfAMQreAOAp6cnUlJS5B2WTJU4Gdm2bRsmTpyIsWPHom7duti/fz90dHRw9OhRqfVPnjyJadOmwcnJCbVr18bhw4chEolw586dMgevSHLnkrAwZN6ysTDUwl+Lh8Hf7yUaNGhQrOfS0dHBjRs3MH369PIIlWKZo6MjHj58WGgn5ri4OHz69Emmr3vgwAFcvHhR6j5pLSMvXrxAmzZtJL44iEQiXLx4Ec2aNYOrq6vUVhwTExO4u7sjODgYGzZsULgF7OSJrtxLlYVIJMLHjx9hbW0NAwMDqXVSUlJw+vRpOUcmYyUZopOZmUl4PJ7E8KJRo0aR3r17F+s5kpKSiJaWFvHy8iqwTkZGBuHz+eLHz58/FXpob165c0lceh1KnnyLZczTwOfzSffu3Qsd9pv7aN68OfH09CRZWVksvhuqPAUHB5OaNWsWeA54eHjI7LXevXtHtLS0Cnyt//77j1Hfx8eH6OrmDPudOHEiIYSQ7OxscuLECVKvXr0Cn8fCwoJs3ryZJCcnyyx2ZffixQvGz2jJkiVsh0QpCW9vb2JsbFysa4azszPb4UpVLvOMhIWFEQDkyZMnjPKFCxeSZs2aFes5pk6dShwcHAqd4GvVqlVSf9jKkIwURSAQkDlz5hTr5AJArK2tyZ9//kliYmLYDp0qB1FRUcTJyUnq737YsGEyeY20tLRCEwgA5Pnz5+L6np6eRF1dXbxv3Lhx5ODBg8TBwaHA4+3t7cm+ffvoxH1SfPv2jfGzmjx5MtshUUrk0aNHpGrVqsW6Xvj5+bEdrgSFTEbWr19PjI2NyZs3bwqtp8wtI8Xl4eEhMcNeYQ8tLS0yYcIE8u7dO7ZDp2QsISGBtG7dWuJ3bmNjI5MJwKZNm1bk+RUQEEAIIWTnzp3FPicBkFq1apFjx47RFrxCxMXFMX5mQ4YMYTskSskkJSWRcePGFfn3OHXqVLZDlVAuyUhZbtNs3ryZGBoakhcvXpTkJQkhij8Da2n5+PgQAwMDxsk0duxYUqtWrUJPuI4dO5IrV64QoVDI9lugZCQlJYV06dJF4ncdFBRUpue9ePFisZKKHz9+kOXLlxc7CXFyciJnz54lAoFANj8AFSYQCBg/uy5durAdEqWkLl68SCpVqlTg36WBgQFJSUlhO0yGcpsOvlmzZmTGjBnibaFQSKytrcn69esLPGbjxo3EwMCA+Pr6lvTlCCGqm4wQQsiHDx8YTXAXLlwgQqGQ3Lhxg7i6uhZ6QahWrRrZsWOHSv5cKqKMjAwyYMAAxu/42LG/C+yDVJSQkBDx/WYtLS2ip6dX4Lk0atSoYiUhrVq1IteuXVO5KdvLW94vHYp6b59SDhEREYX2PTx69CjbITKUWzJy+vRpoqmpSY4dO0YCAgLIpEmTiJGREYmMjCSEEDJy5EhGB60NGzYQDQ0Ncu7cORIRESF+lKSDmyonI4QQEh0dTdq0afP/i88xxr6PHz+SqVOnFrqmh76+Ppk9ezb59u0bS++AkpXs7GwyduxY8e/WzLk7YwG7FutuF3vNmHfv3pHHjx+T8PBwIhQKScuWLUt0C0ZaEzBNQkrHzs5O/HOsUaMG2+FQSk4kEhEPDw+p14UWLVqwHR5DuS6Ut3v3bmJnZ0c0NDRIs2bNyNOnT8X72rV
rR0aPHi3etre3l/rBtmrVqmK/nqonI4TkfCseOXIk2b17t9T98fHxZPPmzYwPtfwPDodDevXqRe7cuUMvGkpMKBSSfiMnEQBEzcRGYjXdki5il5ktJOtP32OcK/Xr1ycjRowocUIybdo0kpmZWY7vXjU5OjqKf4aVKlViOxyFUNjIQ6p4Pn/+X3t3HtbEtf4B/JsEAogIirKKC7SiCEoF2VrUCldca6tVW73ickWl7rQuxbVXQWt7rV5FraIW61bFrSpiVdxFVDZF1NsKraKAisoOgeT8/uBHypiAgCSTwPt5Hp7HnDmZeeeY5c2ZM+fcZ25ubgrv04TEJI1p29p+fwsYUzJns4bJy8uDsbExcnNzq73PujFgjOHRo0c1TgxVXl6Oo0ePYu3atbh8+XK19RwdHTFr1iyMGTMGBgYG1dYjmkcqY3h/1VncO/kTci/vRtvpuyAyNJFvF6Bi/prL8/tCJKx5uYCVUanYeikdL6/ux6uLO+XlfUYE4OX/riM5ObnO8bm7u+PgwYOwtn776eObij59+uDChQsAKqbEl0gkTXqph+iUTHxzLJWzwKhlAy7Q2JSUlZUhJCQEK1askE+EZu4xFPq9A+R1+Gzb2n5/00J5GkQgELxxhkodHR0MHz4cly5dQnx8PPz9/SEWixXqpaSkICAgADY2Nli4cGGjmvG2sbue/gJPnr2ArKQAArEBitNucrYzAJm5Jbie/qLG/ayMSsWPF9MhY0Dh3YucbZeiD9cqEbG2toaPjw+mT5+ODRs24MyZMzh48CCsrKzqfF5NWdWJz8rLy1FYWMhjNPyKTslE4K4ETiICAFm5JQjclYDolEyeItNOurq6WLZsGa5cuQKrdh0BAE8Tz0BW9nf7akPbUjKixXr06IGIiAj89ddfWLp0qdIpxnNychAaGooOHTpg9OjRiIuL4yFSUluMMfyydxceb52C/JtHwSTFKHmYorTu66tFVyUpl2HrpfSKfz/7E2XP/vx7o1AEaf5z+UNdXV04ODhg2LBhCA4Oxs6dO3Hjxg3k5eUhIyMDZ86cwfr16zFt2jT4+PjA2tq6Sf+qr4/Xp4RvquvTSGUM3xxLhbSsBCUZqZxtlV303xxLhVSm8R32Gse1pxusJ/4XzZ37g5UWouj+36tya0PbUjLSCFhYWGDZsmV4+PAhIiIi8N577ynUKS8vx969e+Hh4QEPDw/s3bsXZWVlPERLqpOcnIxevXph3eLZkBW+kpcXppxFaebvCvVfXy26qp9j/4T8M4fJYPCOOyAQAQDE5nYw6TMebYYtxordZ1BYWIg7d+7g4MGDCAkJwdixY+Hq6gojI6OGPL0mjaaEr3A9/QUePXqE7N3z8fSXxSjN4r6ua9vrRxRdT3+Bp8UCmPpNR+thi1H8O/eHp6a3LSUjjYienh78/f0RHx+PixcvYvjw4RAKFf+L4+LiMHr0aHTs2BGhoaF4/vy5kr0RdXn16hVmzpyJHj16KBkHJEDz9wZAx8SiSknFNWC3jq2q3edfL4rk/xab2cJs+GK0nbELrfrPgNnwJTB2/xTN3nVHqaE5dHWVrypNGg4lIxUuXLqEzJ1zIMl+AFZeimcHlyP7wDLkxu6H5Gm6fLXnmnr9iHJV2yw/7iCkxXl4dXWfwg8ZTW1bSkYaIYFAAG9vb0RGRiItLQ1fffWV0mXrHz9+jIULF8LGxgYBAQFISVF+OYCohkwmQ0REBOzt7bF+/XqFVXr1rOxhOe4HmPb7AiKDil6KyosjS4c41Dh4tX2rZgplIgMjGHX34wyGVVaPNDy6TANs27YNiyeP5PT6SQteQGxmi1dX9iJzxww83jQBOafC8PvNiyguLuYvWC1U2VMqLc5H6eO7KH2UgtxLu/Di9Cal9TQNJSONXPv27fHdd98hIyMDGzduhL29vUKdkpIShIeHw8nJCT4+Pjh27FiDL19PuJKSkuDt7Y3x48fj6dOnnG2tW7fG9u3bcejkWbS3d+RsszDWx6Z
/9njjqPixnh3whhttIBRU1COq15R7RsrKyjBz5kxMmjQJ5VUuDQt09ND6o3lo2dsfrQfNAQBI85+jIOkk5gaMhqmpKQYPHozNmzfj0aNHfIWvNdw6toKlsT5KH97C36NEAP323QHUrkeVTzp8B0DUw9DQEIGBgZgyZQp+++03rFu3DtHR0Qr1YmJiEBMTAzs7O8yYMQMTJkxo1LdTq9vLly+xePFibNq0SSHhEwqFCAwMxPLly+VfXn6OVhXXgvNLYGZU8UHyptt5AUCsI0SAd0f8eDG92joB3h0h1qHfI+rQVHtGcnJyMHLkSMTExHDKRUZtYDZsIcQW7wAADLv0QnlOBl5d2SOvU1xcjBMnTuDEiRMAgO7du2Pw4MEYNGgQ3NzcIBKJ1HciWkAkFGDpEAeMPLCGU67fvnute1T5RJ9ETYxQKET//v1x8uRJ3L17F4GBgWjWTLGr/sGDB5g9ezbatm2L2bNn48GDBzxE23jIZDJs374d9vb2CAsLU0hEvLy8EB8fjw0bNnB+RYuEAnjamWKoszU87Uzr9EHy9UAHTOnVUaGHRCgApvTqiK8HOrzVOZHaa4o9IykpKXBzc1NIRN5//338/OsZhV4/+4ET0GfAx9XuLzk5GSEhIfDy8oKFhQXGjRuHAwcOIDc3VxXha6X+jpYwfnn/7wKRLvSsu9S6R5VXqp9/7e01hRlY+USzu6pWfHw88/DwUNquZmZm7KefflLpooelZVIWfvEBW3zkNgu/+ICVltECi+qWkpLC+X+fOXMm3yGp1JEjR5SuhRQQECCfwVfZDKzFxcXVvleq+9PR0WFfffUVLRzKGMvIyOC0jVNPL62ZgZWSESJXVlbGIiMjmbe3d41vfkdHR7Z161ZWVFTEd8gaLScnhwUGBjKBQKDQhkKhkM2cOZO9fPmS7zCJGjx+/Jjz/+/v7893SCohk8nYv//9b4XXu0gkYhs2bKjVD5msrKwafxhV/WvTpg3bunUrrR79/yIiIjjts2LFCr5DomSEvJ34+Hjm7+/PxGJxtR8EpqamLDg4mGVkZPAdrkaRSqVs69at1S71/cEHH7CkpCS+wyRqVFRUxHkNDBkyhO+QGlxBQQH79NNPlX5OxMTE1GlfycnJNa4yDYB17NiRPXv2TEVno51eX3376tWrfIdEyQhpGFlZWWzZsmXM3Ny8xm7Szz//nLNgYlN148YNpQtXAWDm5uZs586ddJmrCZLJZJzE3tvbm++QGtSff/7JWQywai9qWlpavfZ5/PhxJhQKa0xInJ2dWUJCQgOfjXaSyWSsbdu28rYxMjJiZWVlfIdFyQhpWCUlJSwiIoK99957NX44uLu7sz179jCJRCJ/blNYnfP58+dsypQpSi/JiEQiNnv2bPbq1Su+wyQ8qprQOzo68h1Og7lw4YLSXsBPPvmE5efnv9W+16xZ88ZLNSKRiAUHB7Pi4uIGOiPtdP/+fU67DB48mO+QGGOUjBAVkclk7OLFi2z48OE1/mqxtrZmISEhbN/F28wj9AxrP/+4/M8j9Aw7efsJ36fSIMrLy9mPP/7IWrVqpbQdevXqxW7dusV3mEQD2Nvby18Xbdu25TucBrFp0yamo6Oj8LpfunRpgwwolclkbPLkyZx9W1hYKH2vde7cWSMuS/Bl48aNnPb44Ycf+A6JMUbJCFGDP//8k3311VfMxMSk2qREoCNmzbv1Y5YTN8iTkQ7//6ftCUlcXBxzdXVVet6WlpZs9+7ddEmGyFW9S8TQ0JDvcN5KaWkpmzp1qsLrvlmzZiwyMrJBjyWRSFjfvn3lx9iyZQs7fPiw0qREIBCw2bNns4KCggaNQRsMHz6c0xbJycl8h8QYo2SEqFFBQQHbuHEj69y5c43dqfrtu7N2Xx6SJyQeoWe08pLNs2fP2KRJk6q9JBMUFESvVaKgf//+nNdK1UuZ2uTp06esV69eCq/9Dh06qOwL8MWLF6xTp04MADt58qS8bMKECUo/a2xtbdn
Zs2dVEosmkkqlnN7ZNm3aaMytzrX9/qZJz8hbq5zd9c6dOzh58iT69+9fbV2BjhhAxTtGk1eQVEYqlWLz5s3o1KkTwsPD5Yt6VerTpw+Sk5Pxn//8h2atJQpen/hMG2dhTU5ORs+ePXHx4kVOee/evXHjxg1069ZNJcdt2bIljh8/jpYtW6Jdu3bysu3btyM6OlpeViktLQ0+Pj6YMmVKk5gULTk5GS9e/P1Z2rdvX6WLpGoy7YqWaLSqs7tuOHQezd8bBIGunny7fkcXMJmU8xxNXUHyddeuXYObmxsCAwMVZs+0srLC3r17ERMTg65du/IUIdF02j4La2RkJLy8vPDXX39xyr/44gucPn0arVu3Vunx3333XRw6dAg2Njaccj8/P6SkpGDatGkKz9myZQscHR0RFRWl0tj4dvbsWc5jHx8fniKpP0pGiEr06OYI036BsP4iAiZ9JkK/fTeIjEyRc+IHTkKiqStIVnr27Bn+9a9/wdPTEwkJCZxtOjo6mDt3Lu7du4fPPvsMAoFmrvlANIO2rk8jk8mwZMkSjBgxAkVFRfJyHR0d/PjjjwgLC4Ourq5aYunTpw+MjIwUyo2MjLBhwwZcuHAB77zzDmdbRkYGBg0aBH9/f+Tk5KglTnWjZISQalSuIKmj3xzG7sNg/lko9Cw7oTD1PHKi1gIyqUavICmVShEWFoZOnTph+/btCtt9fHxw69YtrF69WumHIyGv08aekfz8fAwfPhzLly/nlLdp0wYxMTGYPHkyT5Ep16tXL9y6dQtz585VuEzx888/w8HBAZGRkTxFpxoSiYRz2ax9+/bo2LEjjxHVDyUjRCUqV5AEIF8xUsfEAkI9QxTeOYfnJ9dh0UB7jVxB8urVq3B1dcX06dMVfr1aW1tj//79OH36NLp06cJPgEQraVvPSFpaGry8vHDkyBFOubOzM27cuAFvb29+AnsDAwMDrF69GrGxsQqXTZ8+fYoRI0bg008/RVZWFk8RNqzr169zeqx8fHy0speWkhGiMv0dLbHpnz1gYVxxKUYgEMiXDC9MicGBHxZBKpXWtAu1evr0KSZMmID3338fSUlJnG26urqYP38+7t27hxEjRmjlm53wS5t6RmJiYtCzZ0+kpKRwykeMGIHLly+jffv2PEVWe25uboiPj8eSJUugo6PD2Xbw4EE4ODhg586dCgPRtU1juEQDAHRrL1G5qjOw/nPyTM4teBMmTOD9FrSysjL23//+lxkbGyu9TfAf//gHu3fvHq8xEu135swZzusqNDSU75AUyGQytn79eiYSiRTeBytWrNDaeXOSkpJYjx49lL6/BwwYwB4+fMh3iPX2+sKmmZmZfIfEQfOMEI104MABhQ+DiRMn8paQXLp0iXXr1k3ph5SNjQ2LjIzU2g9golni4+M5r6958+bxHRJHaWkpmzRpksL7oHnz5uzo0aN8h/fWysrK2KpVq5ienp7CORoZGbHNmzfz/sOorgoKCpiurq78PBwcHPgOSQHNM0I0kouLi0LZ9u3bMWXKFMhkMrXFkZWVBX9/f3h7e+PWrVucbWKxGMHBwbh79y6GDx9Ol2RIg3h9zIgmXabJzs5G3759ER4ezim3s7PDtWvX8NFHH/EUWcPR0dHB/PnzkZycDC8vL862/Px8TJ06FT4+Pnjw4AFPEdbd5cuXUVZWJn+stZdoQGNGiJp16NABrVop3kETHh6OqVOnqjwhKS8vx9q1a2Fvb4+ff/5ZYbufnx9u376NkJAQGBoaqjQW0rRo6qRn8fHxcHV1xZUrVzjlPj4+uH79eqObO8fe3h4XL17EunXr0KxZM8628+fPw8nJCT/88INGjWerTqMZLwLQmBGifv369at2yvjJkye/VVdpXFwcKykpUbrtwoULzMnJSelx27Vrxw4dOkSXZIjKSKVSzhICvr6+fIfE9u7dy/T19RXeD7NmzdKI5edVLS0tjfn4+Cj9TPDw8GCpqal8h1ijquNghEIhe/n
yJd8hKaAxI0RjBQcH17iGzdSpU+uVFNy9e5eZmpqyx48fc8qfPHnCxowZo/RYYrGYLVq0iBUWFjbU6RFSraqDpF1cXHiLo7y8nC1YsEDh/aCrq8u2bdvGW1x8kMlkbOvWraxFixZKPx9CQkI0ch2hnJwcTnLbs2dPvkNSisaMEI2lbNxIVZs3b8a0adPqdMtdRkYG+vXrh5ycHPksi2VlZVizZg3s7e2xe/duhecMHDgQd+7cwfLlyxW6awlRhaqXavi6TJOXl4ehQ4di1apVnHJzc3OcP38eEydO5CUuvggEAkyaNAmpqakYPHgwZ5tEIsHChQvh5uaGxMREniJU7ty5c5zPSK2+RAMaM0J44Orq+sY6mzZtwowZM2qVkOTk5KBfv3549OgRAOD58+c4f/483nvvPXz55ZfIz8/n1O/QoQOOHj2K48ePK0wdTYgqVR3EyscA1t9//x0eHh44ceIEp9zFxQU3b95UGNjZlFhbW+PXX3/F7t27YWpqytmWlJSEnj17YtGiRSgtLeUpQq6YmBjOY21PRugyDVE7mUzG2rRpU+Olmsq/6dOn13jJpqCggHl4eHCe4+joqHRfenp6bMmSJayoqEiNZ0vI3/p8+CHnGn9ZufpuJT116hQzMTFReF+MHj2a3hOvyc7OZiNHjlT6OdKlSxcWGxvLd4jM3t6eczlJU/8PacwI0WgDBgyoNgE5deoUe/LkCcvJyWEFBQXVJiMSiYT179+/VknN4MGD2R9//KHmsyTkbydvP2EtHT7gvC5dlxxlJ28/UelxZTIZW7NmDRMKhZxjCwQC9u2339Kg7RocOnSIWVhYKHyeCAQCNmfOHN7GmmVkZHDi6dOnDy9x1AaNGSEaraZxI1u3boWlpSVatWoFQ0NDpfN8yGQyTJgwAdHR0TUex9bWFseOHcOxY8dgZ2f31nETUh/RKZkI3JUAiciAU571LAeBuxIQnZKpkuOWlJRgwoQJCAoK4tw236JFCxw/fhzz5s2jeXRq8MknnyA1NRXjx4/nlDPG8MMPP8DJyQnnzp1TeRw5OTkoLi6WP25Ut/T+P0pGCC8qx40IBAIcOnQILVq0kG+LjIzEjRs3qn0uYwxBQUFKB6VW9dlnn+HOnTsKg9IIUSepjOGbY6lgAET6zbnbSgoAAN8cS4VUVvsB27WRmZmJPn36ICIiglPeqVMnxMXFYeDAgQ16vMaqZcuW2LFjB6Kjo2FjY8PZlpaWhr59+2Lq1KnIy8tTWQwPHz6Er68vnj9/DqARjhcBJSOEJ5XJyIIFC/DJJ59g7ty5nO0LFiyodvDqqlWrsG7dujce48CBA1i8eDFnRUtC1O16+gtk5pYAAPRsHGHkMgRGbsPQsm8ARM1aggHIzC3B9fQXDXbMGzduwNXVFXFxcZxyPz8/xMXFoXPnzg12rKbCz88PKSkpCAwMVNj2448/omvXrjh58qRKjm1gYICrV6/Cy8sLDx484PSMGBkZoWfPnio5rjpRMkJ4YWVlhcGDB2PZsmUAgDlz5sDc3Fy+PSYmBqdPn1Z4Xnh4OIKDg2t1DKlUiu+//x6Ojo64fPlyg8RNSF09zS+R/7vZu+5o5TsFrKQARq4fQdS8pdJ6b2PXrl3w9vbGkydPOOVfffUVTpw4oTAtPam9Fi1aYOPGjTh//rzCnXgZGRkYOHAg/P398eJFwyWWQEUyAlTcDeXi4oKMjAz5tt69ewMAbt26hfDwcNy8ebNBj60ulIwQXggEAvzyyy8Qi8UAAENDQyxZsoRTZ2bQXBxOeITYBzmQyhiOHDmCKVOm1Gr/zZs3x4ABA7B69Wrs378fnp6eDX4OhNSGmZE+5zGTlqEgJQaSzP/VWK+upFIp5s6di7Fjx3JuP9XT08POnTvx3XffQSQSvdUxSIXevXsjOTkZX375JYRC7tfozz//DAcHBxw8eLDBjld1HqTc3FzOtmvXrsHY2Bjdu3fHypUrtXb6fgGrri9cg+Tl5cHY2Bi5ubm
csQWkcZFIJOjSpQvS0tLkZa0/mgfDLr1gmHMfv+8MRplE+T3+hoaG+OCDD9CnTx98+OGHcHFxgY6OjrpCJ6RaUhnDB9/GICu3BAyAJDsNmT/NhKFjX7QeFAQBAAtjfVye3xciYf0Gk7569Qqff/65woBuKysrHD58GG5ubm9/IkSpuLg4TJw4EampqQrbPv30U2zYsIHT61sfBQUFMDIyemO9qKgoDBgw4K2O1dBq+/1NPSNEY4jFYoyY8iWn7NWln1Ga+Tvu7lzMSUQMDAzg6+uLkJAQXLlyBS9fvkR0dDQWLFgAd3d3SkSIxhAJBVg6xAEAIAAgya5YFbbw7iXIiip+5S4d4lDvROT+/ftwd3dXSETc3d1x48YNSkRUzN3dHQkJCVi8eLHC505kZCQcHBywa9euOs0o/brKyzQ1GTZsmMYlInWi8puMGwDNM9I0lEtlzH3Fb0xsbse9p1+vGYNIl+m368ba+o5n5y9crHYxPEI01cnbT5hH6Blm5DJE/tq28ZtUq3lGioqK2O7duxXKT5w4oXRNlXHjxrHi4mJVnAapQVJSEmfxuqp/AwcOZI8ePar3vnV1daudR8nQ0JA9fPiwAc+k4dA8I0TrXE9/gax8CUx6+QMAdFpaoXmPwWjzySK0m/0LzD8PhcjlU4itHaCnp8dztITUTX9HS1ye3xe2wmfyMuG90/hHF7M3PnfRokXYsWOH/DFjDKtXr8bgwYM5t5QKhUKsWbMGO3bsgL7+241BIXXXvXt3xMXFYeXKlQqfUVFRUejatSu2bNlSr16SmtbPWrJkicJtx9qGxowQjXE06TFm7UsCYwzFv1+DgV1PCESKl1vWfeaMoc7WPERIyNuRyWQwMTHhrJd07NixGufCuXTpEnr37g1DQ0O8evUKEokEkyZNwp49ezj1TExM8Msvv6Bfv34qi5/U3r179zBx4kTExsYqbPvwww8RHh4OW1vbWu/P0tISWVlZCuUODg5ITEyU3wygaWjMCNE6lXcTCAQCNOvkqTQRqVqPEG2TlpamsHBjWFhYtfULCgowfvx4MMZQUFCAU6dOoVevXgqJSJcuXXD9+nVKRDRI586dcenSJaxdu1ahV+PcuXNwcnLCunXrIJVKa7W/6saNbNy4UWMTkbqgZIRoDLeOrWBprI/qhvEJAFga68OtYyt1hkVIg0lKSlIoi46Oxh9//KG0/vz58zl3lw0ZMkRhHolBgwbh2rVrePfddxs0VvL2RCIRZs2ahdu3b6Nv376cbUVFRZg9eza8vb1x9+7dN+5L2WWasWPHyucZ0XaUjBCN8fpdB1VVPn6buw4I4VtiYqLS8k2bNimUnT17Fhs3buSUVV1fBgC+/vprHD16lC5fazhbW1ucOXMGW7ZsUfi/io2NhbOzM1auXImysrJq9/F6z4ixsTG+++47lcTLB0pGiEbp72iJTf/sAQtj7qUYC2N9bPpnD/R3tOQpMkLeXnXJyPbt2znLFuTl5WHixInV7sfAwAB79+5FaGgoTWSmJQQCAQICAnDnzh0MGjSIs00ikSA4OBju7u5Ke88AxWQkJCTkrecv0SSUjBCNU3nXwd4AD6z7zBl7AzxweX5fSkSI1qvui+bVq1fYt2+f/HFQUBAePnxY7X6kUil+++033Llzp6FDJCrWtm1bHDt2DLt27UKrVtxLzomJiejZsycWL17MmUUX4CYjPXr0wNSpU9USr7pQMkI0kkgogKedKYY6W8PTzpQuzRCtl52djczMzGq3h4WFgTGGqKgobNu2rcZ9SSQS7NixA46Ojhg0aFCN+yWaRyAQYMyYMUhNTcWIESM428rLy7FixQr06NEDcXFxkMoYYh/kILdMIH/upk2bGl2PGCUjhBCiBtX1ilRKSEjA6dOnERAQUKv9mZqaYt68eVi/fj0sLanXUBuZm5tj//79OHjwoMIll9TUVHh5ecGm90iM2nget7MqFlJs03MQXjTT7jlFlKFkhBBC1KC68SJVTZ0
6VWG13de5u7sjIiICGRkZ+Pbbb+s0VwXRTMOGDUNqair8/f055TKZDJmXI5G5fQZkJQUQGrSAnscYBO5KQHRK4+oNo2SEEELUoDbJSHp6utJyfX19TJw4ETdv3sS1a9fg7+9PM6w2Mq1atUJERASioqIUZlMtf5WJkvR4NHfyhdCgYsG8b46lQirT+DlLa42SEUIIUYPKyzROTk5oZ9eJs81s1AoIdBWXOHjnnXewZs0aPH78GNu2bYOLi4s6QiU8GjBgALb/ehHNnbmL3um0soZxr7EAKhakycwtwfX0FzxEqBqUjBBCiIoVFBTg0aNHCAkJQWjEcbxo1o6zPe/GYbCyirsnBAIBhg4dilOnTuH+/fuYM2eOwl0XpHErhC5M/abB/PNQ6JhYAiIdtPlkIYQiXU69p/klPEXY8GiddUIIUbGCggIkJSXB7p138cG3MRA1N+VsL0mLh7CZCYy6+8HW+yMcXPk53UHWhFUueaHfrhssJ65H6eN7ELduV229xoCSEUIIUTELCwtYWFgg9kEOMnNLIDLiJiNGLh+hZZ8JEOjo4gUqVrD2tDNVvjPS6FUujZGVWwKhrj4MOjhztgtQMRFkY1oag5IRQghRk8pudQM7V5iNXA5RM2PomJhDIG4GgUCgUI80TZVLYwTuSoAAFWNEKjXWpTHqNWYkLCwMHTp0gL6+Ptzd3XH9+vUa6x84cACdO3eGvr4+nJycEBUVVa9gCSFEm1V2q+u0MINBx/cgNreFUM+Qk4hUrUearqa2NEade0Z++eUXBAUFYfPmzXB3d8fatWvh5+eH+/fvw8zMTKH+1atX8fnnn2PlypUYPHgw9uzZg48//hgJCQlwdHRskJMghBBtULX7XdlNmY2x+53UX39HS/zDwQLX01/gaX4JzIwqXhuNqUekkoAxVqcbld3d3dGzZ09s2LABQMWkLDY2NpgxYwYWLFigUH/UqFEoLCzE8ePH5WUeHh5wdnbG5s2ba3XMvLw8GBsbIzc3l1anJIRoteiUTATuSgCgvPu9Mf7qJU1Xbb+/63SZRiKRID4+Hr6+vn/vQCiEr68vYmNjlT4nNjaWUx8A/Pz8qq0PAKWlpcjLy+P8EUJIY9DUut8JqY06XaZ5/vw5pFKpwhz65ubmuHfvntLnZGVlKa2flZVV7XFWrlyJb775pi6hEUKI1mhK3e+E1IZG3k3z9ddfIygoSP44Ly9PYXpcQgjRZpUrUxNC6piMtG7dGiKRCNnZ2Zzy7OxsWFhYKH2OhYVFneoDgJ6eHvT0FKdGJoQQQkjjU6cxI2KxGC4uLjh79qy8TCaT4ezZs/D09FT6HE9PT059ADh9+nS19QkhhBDStNT5Mk1QUBDGjRsHV1dXuLm5Ye3atSgsLMSECRMAAP7+/rC2tsbKlSsBALNmzULv3r3xn//8B4MGDcK+fftw8+ZNbNmypWHPhBBCCCFaqc7JyKhRo/Ds2TMsWbIEWVlZcHZ2RnR0tHyQ6sOHDyEU/t3h4uXlhT179mDRokUIDg7Gu+++iyNHjtAcI4QQQggBUI95RvhA84wQQggh2kcl84wQQgghhDQ0SkYIIYQQwitKRgghhBDCK0pGCCGEEMIrSkYIIYQQwitKRgghhBDCK0pGCCGEEMIrSkYIIYQQwitKRgghhBDCqzpPB8+Hykli8/LyeI6EEEIIIbVV+b39psnetSIZyc/PBwDY2NjwHAkhhBBC6io/Px/GxsbVbteKtWlkMhmePHkCIyMjCASCBttvXl4ebGxs8OjRI1rzRoWondWH2lo9qJ3Vg9pZPVTZzowx5Ofnw8rKirOI7uu0omdEKBSibdu2Ktt/ixYt6IWuBtTO6kNtrR7UzupB7aweqmrnmnpEKtEAVkIIIYTwipIRQgghhPCqSScjenp6WLp0KfT09PgOpVGjdlYfamv1oHZWD2pn9dCEdtaKAayEEEIIabyadM8IIYQQQvhHyQghhBBCeEXJCCGEEEJ4RckIIYQQQnj
V6JORsLAwdOjQAfr6+nB3d8f169drrH/gwAF07twZ+vr6cHJyQlRUlJoi1W51aeetW7fC29sbLVu2RMuWLeHr6/vG/xfyt7q+pivt27cPAoEAH3/8sWoDbCTq2s6vXr3CtGnTYGlpCT09PXTq1Ik+P2qhru28du1a2Nvbw8DAADY2NpgzZw5KSkrUFK12unjxIoYMGQIrKysIBAIcOXLkjc85f/48evToAT09Pbzzzjv46aefVBska8T27dvHxGIx2759O7tz5w4LCAhgJiYmLDs7W2n9K1euMJFIxFavXs1SU1PZokWLmK6uLrt9+7aaI9cudW3n0aNHs7CwMJaYmMju3r3Lxo8fz4yNjVlGRoaaI9c+dW3rSunp6cza2pp5e3uzoUOHqidYLVbXdi4tLWWurq5s4MCB7PLlyyw9PZ2dP3+eJSUlqTly7VLXdt69ezfT09Nju3fvZunp6ezUqVPM0tKSzZkzR82Ra5eoqCi2cOFCdujQIQaAHT58uMb6aWlprFmzZiwoKIilpqay9evXM5FIxKKjo1UWY6NORtzc3Ni0adPkj6VSKbOysmIrV65UWn/kyJFs0KBBnDJ3d3c2ZcoUlcap7erazq8rLy9nRkZGLCIiQlUhNhr1aevy8nLm5eXFwsPD2bhx4ygZqYW6tvOmTZuYra0tk0gk6gqxUahrO0+bNo317duXUxYUFMTef/99lcbZmNQmGZk3bx7r2rUrp2zUqFHMz89PZXE12ss0EokE8fHx8PX1lZcJhUL4+voiNjZW6XNiY2M59QHAz8+v2vqkfu38uqKiIpSVlaFVq1aqCrNRqG9b//vf/4aZmRn+9a9/qSNMrVefdv7111/h6emJadOmwdzcHI6OjggNDYVUKlVX2FqnPu3s5eWF+Ph4+aWctLQ0REVFYeDAgWqJuang47tQKxbKq4/nz59DKpXC3NycU25ubo579+4pfU5WVpbS+llZWSqLU9vVp51fN3/+fFhZWSm8+AlXfdr68uXL2LZtG5KSktQQYeNQn3ZOS0tDTEwMxowZg6ioKPzxxx/44osvUFZWhqVLl6ojbK1Tn3YePXo0nj9/jg8++ACMMZSXl2Pq1KkIDg5WR8hNRnXfhXl5eSguLoaBgUGDH7PR9owQ7bBq1Srs27cPhw8fhr6+Pt/hNCr5+fkYO3Ystm7ditatW/MdTqMmk8lgZmaGLVu2wMXFBaNGjcLChQuxefNmvkNrVM6fP4/Q0FBs3LgRCQkJOHToEE6cOIHly5fzHRp5S422Z6R169YQiUTIzs7mlGdnZ8PCwkLpcywsLOpUn9SvnSt9//33WLVqFc6cOYNu3bqpMsxGoa5t/eDBA/z5558YMmSIvEwmkwEAdHR0cP/+fdjZ2ak2aC1Un9e0paUldHV1IRKJ5GVdunRBVlYWJBIJxGKxSmPWRvVp58WLF2Ps2LGYNGkSAMDJyQmFhYWYPHkyFi5cCKGQfl83hOq+C1u0aKGSXhGgEfeMiMViuLi44OzZs/IymUyGs2fPwtPTU+lzPD09OfUB4PTp09XWJ/VrZwBYvXo1li9fjujoaLi6uqojVK1X17bu3Lkzbt++jaSkJPnfRx99hA8//BBJSUmwsbFRZ/haoz6v6ffffx9//PGHPNkDgP/973+wtLSkRKQa9WnnoqIihYSjMgFktMxag+Hlu1BlQ2M1wL59+5ienh776aefWGpqKps8eTIzMTFhWVlZjDHGxo4dyxYsWCCvf+XKFaajo8O+//57dvfuXbZ06VK6tbcW6trOq1atYmKxmEVGRrLMzEz5X35+Pl+noDXq2tavo7tpaqeu7fzw4UNmZGTEpk+fzu7fv8+OHz/OzMzM2IoVK/g6Ba1Q13ZeunQpMzIyYnv37mVpaWnst99+Y3Z2dmzkyJF8nYJWyM/PZ4mJiSwxMZEBYGvWrGGJiYnsr7/+YowxtmDBAjZ27Fh5/cpbe+fOncvu3r3LwsLC6Nbet7V+/XrWrl07Jha
LmZubG7t27Zp8W+/evdm4ceM49ffv3886derExGIx69q1Kztx4oSaI9ZOdWnn9u3bMwAKf0uXLlV/4Fqorq/pqigZqb26tvPVq1eZu7s709PTY7a2tiwkJISVl5erOWrtU5d2LisrY8uWLWN2dnZMX1+f2djYsC+++IK9fPlS/YFrkXPnzin9zK1s23HjxrHevXsrPMfZ2ZmJxWJma2vLduzYodIYBYxR3xYhhBBC+NNox4wQQgghRDtQMkIIIYQQXlEyQgghhBBeUTJCCCGEEF5RMkIIIYQQXlEyQgghhBBeUTJCCCGEEF5RMkIIIYQQXlEyQgghhBBeUTJCCCGEEF5RMkIIIYQQXlEyQgghhBBe/R+Apvp2fKwXkgAAAABJRU5ErkJggg==", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "env.render(td.cpu(), out[\"actions\"].cpu())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## EAS\n", + "\n", + "We perform few iterations of EASLay for demonstration" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + " rank_zero_warn(\n", + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + " rank_zero_warn(\n", + "INFO:rl4co.models.rl.common.base:No metrics specified, using default\n", + "INFO:rl4co.models.zoo.eas.search:Setting up Efficient Active Search (EAS) with: \n", + "- EAS Embedding: False \n", + "- EAS Layer: True \n", + "\n" + ] + } + ], + "source": [ + "logging.basicConfig(level=logging.DEBUG)\n", + "\n", + "env.generator.num_loc = 200\n", + "\n", + "dataset = env.dataset(batch_size=[2])\n", + "# eas_model = EASEmb(env, policy, dataset, batch_size=2, max_iters=20, save_path=\"eas_sols.pt\") # alternative\n", + "eas_model = EASLay(env, policy, dataset, batch_size=2, max_iters=20, save_path=\"eas_sols.pt\")\n", + "\n", + "eas_model.setup()" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "INFO:rl4co.models.common.constructive.autoregressive.policy:Instantiated environment not 
provided; instantiating tsp\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Plot initial solution\n", + "td_dataset = next(iter(eas_model.train_dataloader()))\n", + "td_dataset = env.reset(td_dataset).to(device)\n", + "out = policy(td_dataset)\n", + "\n", + "env.render(td_dataset.cpu(), out[\"actions\"].cpu())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Perform search \n" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "WARNING:rl4co.utils.trainer:gradient_clip_val is set to None. This may lead to unstable training.\n", + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n", + "INFO:rl4co.models.zoo.eas.search:Setting up Efficient Active Search (EAS) with: \n", + "- EAS Embedding: False \n", + "- EAS Layer: True \n", + "\n", + "DEBUG:fsspec.local:open file: /home/botu/Dev/rl4co-rebuttal/notebooks/dev/lightning_logs/version_181/hparams.yaml\n", + "DEBUG:fsspec.local:open file: /home/botu/Dev/rl4co-rebuttal/notebooks/dev/lightning_logs/version_181/hparams.yaml\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]\n", + "INFO:rl4co.models.rl.common.base:Instantiating optimizer \n", + "\n", + " | Name | Type | Params\n", + "------------------------------------------------\n", + "0 | env | TSPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 710 K \n", + "------------------------------------------------\n", + "710 K Trainable params\n", + "0 Non-trainable params\n", + "710 K Total params\n", + "2.841 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "75a65a8984b34ad780ce54612a4eaa01", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: 
0it [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:432: PossibleUserWarning: The dataloader, val_dataloader, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 32 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", + " rank_zero_warn(\n", + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:432: PossibleUserWarning: The dataloader, train_dataloader, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 32 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n", + " rank_zero_warn(\n", + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/loops/fit_loop.py:280: PossibleUserWarning: The number of training batches (1) is smaller than the logging interval Trainer(log_every_n_steps=50). 
Set a lower value for log_every_n_steps if you want to see logs for the training epoch.\n", + " rank_zero_warn(\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "f94c336fc12c4d59b8cccb01fd176037", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Training: 0it [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/Dev/rl4co-rebuttal/notebooks/dev/../../rl4co/models/zoo/eas/nn.py:22: UserWarning: nn.init.xavier_uniform is now deprecated in favor of nn.init.xavier_uniform_.\n", + " torch.nn.init.xavier_uniform(self.W1)\n", + "/home/botu/Dev/rl4co-rebuttal/notebooks/dev/../../rl4co/models/zoo/eas/nn.py:23: UserWarning: nn.init.xavier_uniform is now deprecated in favor of nn.init.xavier_uniform_.\n", + " torch.nn.init.xavier_uniform(self.b1)\n", + "INFO:rl4co.models.rl.common.base:Instantiating optimizer \n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/trainer/connectors/logger_connector/result.py:212: UserWarning: You called `self.log('step', ...)` in your `training_step` but the value needs to be floating point. 
Converting it to torch.float32.\n", + " warning_cache.warn(\n", + "INFO:rl4co.models.zoo.eas.search:0/20 | Reward: -15.52 \n", + "INFO:rl4co.models.zoo.eas.search:1/20 | Reward: -15.32 \n", + "INFO:rl4co.models.zoo.eas.search:2/20 | Reward: -15.30 \n", + "INFO:rl4co.models.zoo.eas.search:3/20 | Reward: -15.28 \n", + "INFO:rl4co.models.zoo.eas.search:4/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:5/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:6/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:7/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:8/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:9/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:10/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:11/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:12/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:13/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:14/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:15/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:16/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:17/20 | Reward: -15.01 \n", + "INFO:rl4co.models.zoo.eas.search:18/20 | Reward: -14.84 \n", + "INFO:rl4co.models.zoo.eas.search:19/20 | Reward: -14.74 \n", + "INFO:rl4co.models.zoo.eas.search:Best reward: -14.74\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "9e6619ed6eae4a0ab770ebb08d266915", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Validation: 0it [00:00, ?it/s]" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "INFO:rl4co.models.zoo.eas.search:Saving solutions and rewards to eas_sols.pt...\n", + "`Trainer.fit` stopped: `max_epochs=1` reached.\n" + ] + } + ], + "source": [ + "from rl4co.utils.trainer import RL4COTrainer\n", + "\n", + "trainer = 
RL4COTrainer(\n", + " max_epochs=1,\n", + " gradient_clip_val=None,\n", + ")\n", + "\n", + "trainer.fit(eas_model)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Load actions\n" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Load\n", + "actions = torch.load(\"eas_sols.pt\")[\"solutions\"][0].cpu()\n", + "actions = actions[:torch.count_nonzero(actions, dim=-1)] # remove trailing zeros\n", + "state = td_dataset.cpu()[0]\n", + "\n", + "env.render(state, actions)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Even with few iterations, the search method can clearly find better solutions than the initial ones!" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "env", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.6" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/modeling/2-transductive-methods/index.html b/examples/modeling/2-transductive-methods/index.html new file mode 100644 index 00000000..aef81a6f --- /dev/null +++ b/examples/modeling/2-transductive-methods/index.html @@ -0,0 +1,3625 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Transductive Methods - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/modeling/3-change-encoder/3-change-encoder.ipynb b/examples/modeling/3-change-encoder/3-change-encoder.ipynb new file mode 100644 index 00000000..b13cea60 --- /dev/null +++ b/examples/modeling/3-change-encoder/3-change-encoder.ipynb @@ -0,0 +1,520 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Encoder Customization\n", + "\n", + "In this notebook we will cover a tutorial for the flexible encoders!\n", + "\n", + "\"Open" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Installation\n", + "\n", + "Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!\n", + "\n", + "> Note: You may need to restart the runtime in Colab after this\n" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "# !pip install rl4co[graph] # include torch-geometric\n", + "\n", + "## NOTE: to install latest version from Github (may be unstable) install from source instead:\n", + "# !pip install git+https://github.com/ai4co/rl4co.git" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Imports " + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "from rl4co.envs import CVRPEnv\n", + "\n", + "from rl4co.models.zoo import AttentionModel\n", + "from rl4co.utils.trainer import RL4COTrainer" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## A default minimal training script\n", + "\n", + "Here we use the CVRP environment and AM model as a minimal example of training script. By default, the AM is initialized with a Graph Attention Encoder, but we can change it to anything we want." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Encoder: GraphAttentionEncoder\n" + ] + } + ], + "source": [ + "# Init env, model, trainer\n", + "env = CVRPEnv(generator_params=dict(num_loc=20))\n", + "\n", + "model = AttentionModel(\n", + " env, \n", + " baseline='rollout',\n", + " train_data_size=100_000, # really small size for demo\n", + " val_data_size=10_000\n", + ")\n", + " \n", + "trainer = RL4COTrainer(\n", + " max_epochs=3, # few epochs for demo\n", + " accelerator='gpu',\n", + " devices=1,\n", + " logger=False,\n", + ")\n", + "\n", + "# By default the AM uses the Graph Attention Encoder\n", + "print(f'Encoder: {model.policy.encoder._get_name()}')" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + 
"/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/callbacks/model_checkpoint.py:630: Checkpoint directory /datasets/home/botu/Dev/rl4co/notebooks/tutorials/checkpoints exists and is not empty.\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | CVRPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 694 K \n", + "2 | baseline | WarmupBaseline | 694 K \n", + "--------------------------------------------------\n", + "1.4 M Trainable params\n", + "0 Non-trainable params\n", + "1.4 M Total params\n", + "5.553 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "3db02ec8f6dc4913a26462bbc1a851e8", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00 Note: while we provide these examples, you can also implement your own encoder and use it in RL4CO! For instance, you may use different encoders (and decoders) to solve problems that require e.g. distance matrices as input" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "# Before we init, we need to install the graph neural network dependencies\n", + "# !pip install rl4co[graph]" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n" + ] + } + ], + "source": [ + "# Init the model with different encoder\n", + "from rl4co.models.nn.graph.gcn import GCNEncoder\n", + "from rl4co.models.nn.graph.mpnn import MessagePassingEncoder\n", + "\n", + "gcn_encoder = GCNEncoder(\n", + " env_name='cvrp', \n", + " embed_dim=128,\n", + " num_nodes=20, \n", + " num_layers=3,\n", + ")\n", + "\n", + "mpnn_encoder = MessagePassingEncoder(\n", + " env_name='cvrp', \n", + " embed_dim=128,\n", + " num_nodes=20, \n", + " num_layers=3,\n", + ")\n", + "\n", + "model = AttentionModel(\n", + " env, \n", + " baseline='rollout',\n", + " train_data_size=100_000, # really small size for demo\n", + " val_data_size=10_000, \n", + " policy_kwargs={\n", + " 'encoder': gcn_encoder # gcn_encoder or mpnn_encoder\n", + " }\n", + ")\n", + " \n", + "trainer = RL4COTrainer(\n", + " max_epochs=3, # few epochs for demo\n", + " accelerator='gpu',\n", + " devices=1,\n", + " logger=False,\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/callbacks/model_checkpoint.py:630: Checkpoint directory /datasets/home/botu/Dev/rl4co/notebooks/tutorials/checkpoints exists and is not empty.\n", + "val_file not set. 
Generating dataset instead\n", + "test_file not set. Generating dataset instead\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | CVRPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 148 K \n", + "2 | baseline | WarmupBaseline | 148 K \n", + "--------------------------------------------------\n", + "297 K Trainable params\n", + "0 Non-trainable params\n", + "297 K Total params\n", + "1.191 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "81c30fe25912497bb53cfb492810c655", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00 Tuple[Tensor, Tensor]:\n", + " \"\"\"\n", + " Args:\n", + " td: Input TensorDict containing the environment state\n", + " mask: Mask to apply to the attention\n", + "\n", + " Returns:\n", + " h: Latent representation of the input\n", + " init_h: Initial embedding of the input\n", + " \"\"\"\n", + " init_h = self.init_embedding(td)\n", + " h = None\n", + " return h, init_h" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "rl4co", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.6" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/modeling/3-change-encoder/index.html b/examples/modeling/3-change-encoder/index.html new file mode 100644 index 00000000..7c966689 --- /dev/null +++ b/examples/modeling/3-change-encoder/index.html @@ -0,0 +1,3669 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Encoder Customization - RL4CO + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+ +
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/modeling/index.html b/examples/modeling/index.html new file mode 100644 index 00000000..4784102b --- /dev/null +++ b/examples/modeling/index.html @@ -0,0 +1,2386 @@ + + + + + + + + + + + + + + + + + + + + + + + Modeling - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + +

Modeling

+

Collection of examples on models and related topics.

+

Index

+
    +
  • 1-decoding-strategies.ipynb: here we show how to use different decoding strategies at inference time, such as greedy evaluation, beam search, and various sampling methods including top-k and nucleus sampling.
  • +
  • 2-transductive-methods.ipynb: here we show how to use transductive methods (i.e., online / test-time optimization) such as EAS.
  • +
  • 3-change-encoder.ipynb: here we show how to change the encoder of a model.
  • +
+ + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/other/1-mtvrp/1-mtvrp.ipynb b/examples/other/1-mtvrp/1-mtvrp.ipynb new file mode 100644 index 00000000..ba44b756 --- /dev/null +++ b/examples/other/1-mtvrp/1-mtvrp.ipynb @@ -0,0 +1,647 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# MTVRP: Multi-task VRP environment\n", + "\n", + "\"Open\n", + "\n", + "\n", + "This environment can handle _any_ of the following variants:\n", + "\n", + "\n", + "| VRP Variant | Capacity (C) | Open Route (O) | Backhaul (B) | Duration Limit (L) | Time Window (TW) |\n", + "|-------------|--------------|----------------|--------------|--------------------|------------------|\n", + "| CVRP | ✔ | | | | |\n", + "| OVRP | ✔ | ✔ | | | |\n", + "| VRPB | ✔ | | ✔ | | |\n", + "| VRPL | ✔ | | | ✔ | |\n", + "| VRPTW | ✔ | | | | ✔ |\n", + "| OVRPTW | ✔ | ✔ | | | ✔ |\n", + "| OVRPB | ✔ | ✔ | ✔ | | |\n", + "| OVRPL | ✔ | ✔ | | ✔ | |\n", + "| VRPBL | ✔ | | ✔ | ✔ | |\n", + "| VRPBTW | ✔ | | ✔ | | ✔ |\n", + "| VRPLTW | ✔ | | | ✔ | ✔ |\n", + "| OVRPBL | ✔ | ✔ | ✔ | ✔ | |\n", + "| OVRPBTW | ✔ | ✔ | ✔ | | ✔ |\n", + "| OVRPLTW | ✔ | ✔ | | ✔ | ✔ |\n", + "| VRPBLTW | ✔ | | ✔ | ✔ | ✔ |\n", + "| OVRPBLTW | ✔ | ✔ | ✔ | ✔ | ✔ |\n", + "\n", + "\n", + "It is fully batched, meaning that _different variants can be in the same batch_ too!\n" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning_utilities/core/imports.py:14: DeprecationWarning: pkg_resources is deprecated as an API. 
See https://setuptools.pypa.io/en/latest/pkg_resources.html\n", + " import pkg_resources\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2832: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('sphinxcontrib')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + " declare_namespace(pkg)\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/fabric/__init__.py:41: Deprecated call to `pkg_resources.declare_namespace('lightning.fabric')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2317: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + " declare_namespace(parent)\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/__init__.py:37: Deprecated call to `pkg_resources.declare_namespace('lightning.pytorch')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. 
See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2317: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\n", + "Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n", + " declare_namespace(parent)\n" + ] + } + ], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2\n", + "\n", + "from rl4co.envs.routing.mtvrp.env import MTVRPEnv\n", + "from rl4co.envs.routing.mtvrp.generator import MTVRPGenerator" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let's now generate some variants! By default, we can generate all variants with the `variants_preset` variable" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['VRPLTW', 'OVRP', 'VRPLTW', 'OVRPLTW', 'OVRPL', 'VRPB', 'OVRPTW', 'OVRPB']" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Single feat: generate a distribution of single-featured environments\n", + "generator = MTVRPGenerator(num_loc=50, variant_preset=\"all\")\n", + "env = MTVRPEnv(generator, check_solution=False)\n", + "\n", + "td_data = env.generator(8)\n", + "env.get_variant_names(td_data)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "all: {'O': 0.5, 'TW': 0.5, 'L': 0.5, 'B': 0.5}\n", + "single_feat: {'O': 0.5, 'TW': 0.5, 'L': 0.5, 'B': 0.5}\n", + "single_feat_otw: {'O': 0.5, 'TW': 0.5, 'L': 0.5, 'B': 0.5, 'OTW': 0.5}\n", + "cvrp: {'O': 0.0, 'TW': 0.0, 'L': 0.0, 'B': 0.0}\n", + "ovrp: {'O': 1.0, 'TW': 0.0, 'L': 0.0, 'B': 0.0}\n", + "vrpb: {'O': 
0.0, 'TW': 0.0, 'L': 0.0, 'B': 1.0}\n", + "vrpl: {'O': 0.0, 'TW': 0.0, 'L': 1.0, 'B': 0.0}\n", + "vrptw: {'O': 0.0, 'TW': 1.0, 'L': 0.0, 'B': 0.0}\n", + "ovrptw: {'O': 1.0, 'TW': 1.0, 'L': 0.0, 'B': 0.0}\n", + "ovrpb: {'O': 1.0, 'TW': 0.0, 'L': 0.0, 'B': 1.0}\n", + "ovrpl: {'O': 1.0, 'TW': 0.0, 'L': 1.0, 'B': 0.0}\n", + "vrpbl: {'O': 0.0, 'TW': 0.0, 'L': 1.0, 'B': 1.0}\n", + "vrpbtw: {'O': 0.0, 'TW': 1.0, 'L': 0.0, 'B': 1.0}\n", + "vrpltw: {'O': 0.0, 'TW': 1.0, 'L': 1.0, 'B': 0.0}\n", + "ovrpbl: {'O': 1.0, 'TW': 0.0, 'L': 1.0, 'B': 1.0}\n", + "ovrpbtw: {'O': 1.0, 'TW': 1.0, 'L': 0.0, 'B': 1.0}\n", + "ovrpltw: {'O': 1.0, 'TW': 1.0, 'L': 1.0, 'B': 0.0}\n", + "vrpbltw: {'O': 0.0, 'TW': 1.0, 'L': 1.0, 'B': 1.0}\n", + "ovrpbltw: {'O': 1.0, 'TW': 1.0, 'L': 1.0, 'B': 1.0}\n" + ] + } + ], + "source": [ + "# Here is the list of presets and their probabilities of being generated (fully customizable)\n", + "env.print_presets()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can change the preset to generate some specific variant, for instance the VRPB" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "vrpb selected. 
Will not use feature combination!\n" + ] + }, + { + "data": { + "text/plain": [ + "['VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB']" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Change generator\n", + "generator = MTVRPGenerator(num_loc=50, variant_preset=\"vrpb\")\n", + "env.generator = generator\n", + "td_data = env.generator(8)\n", + "env.get_variant_names(td_data)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Greedy rollout and plot" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "import torch\n", + "from rl4co.utils.ops import gather_by_index\n", + "\n", + "\n", + "# Simple heuristics (nearest neighbor + capacity check)\n", + "def greedy_policy(td):\n", + " \"\"\"Select closest available action\"\"\"\n", + " available_actions = td[\"action_mask\"]\n", + " # distances\n", + " curr_node = td[\"current_node\"]\n", + " loc_cur = gather_by_index(td[\"locs\"], curr_node)\n", + " distances_next = torch.cdist(loc_cur[:, None, :], td[\"locs\"], p=2.0).squeeze(1)\n", + "\n", + " distances_next[~available_actions.bool()] = float(\"inf\")\n", + " # do not select depot if some capacity is left\n", + " distances_next[:, 0] = float(\"inf\") * (\n", + " td[\"used_capacity_linehaul\"] < td[\"vehicle_capacity\"]\n", + " ).float().squeeze(-1)\n", + "\n", + " # # if sum of available actions is 0, select depot\n", + " # distances_next[available_actions.sum(-1) == 0, 0] = 0\n", + " action = torch.argmin(distances_next, dim=-1)\n", + " td.set(\"action\", action)\n", + " return td\n", + "\n", + "\n", + "def rollout(env, td, policy=greedy_policy, max_steps: int = None):\n", + " \"\"\"Helper function to rollout a policy. Currently, TorchRL does not allow to step\n", + " over envs when done with `env.rollout()`. 
We need this because environments may complete at different steps.\n", + " \"\"\"\n", + "\n", + " max_steps = float(\"inf\") if max_steps is None else max_steps\n", + " actions = []\n", + " steps = 0\n", + "\n", + " while not td[\"done\"].all():\n", + " td = policy(td)\n", + " actions.append(td[\"action\"])\n", + " td = env.step(td)[\"next\"]\n", + " steps += 1\n", + " if steps > max_steps:\n", + " print(\"Max steps reached\")\n", + " break\n", + " return torch.stack(actions, dim=1)" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Cost: 17.503389358520508\n", + "Problem: OVRPLTW\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Cost: 18.86773109436035\n", + "Problem: CVRP\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Cost: 15.39835262298584\n", + "Problem: VRPB\n" + ] + } + ], + "source": [ + "# NOTE: if we don't select ovrpbltw, the below does not work and there is still some\n", + "# minor bug in either masking or variant subselection\n", + "\n", + "generator = MTVRPGenerator(num_loc=50, variant_preset=\"all\")\n", + "env.generator = generator\n", + "td_data = env.generator(3)\n", + "variant_names = env.get_variant_names(td_data)\n", + "\n", + "td = env.reset(td_data)\n", + "\n", + "actions = rollout(env, td.clone(), greedy_policy)\n", + "rewards = env.get_reward(td, actions)\n", + "\n", + "for idx in [0, 1, 2]:\n", + " env.render(td[idx], actions[idx])\n", + " print(\"Cost: \", - rewards[idx].item())\n", + " print(\"Problem: \", variant_names[idx])\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Train MVMoE on Multiple Problems" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "single_feat selected. Will not use feature combination!\n" + ] + } + ], + "source": [ + "from rl4co.utils.trainer import RL4COTrainer\n", + "from rl4co.models.zoo import MVMoE_POMO\n", + "\n", + "device_id = 0\n", + "device = torch.device(f\"cuda:{device_id}\" if torch.cuda.is_available() else \"cpu\")\n", + "generator = MTVRPGenerator(num_loc=50, variant_preset=\"single_feat\")\n", + "env = MTVRPEnv(generator, check_solution=False)" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. 
It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + "Using 16bit Automatic Mixed Precision (AMP)\n", + "GPU available: True (cuda), used: True\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n", + "/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n", + "Missing logger folder: /home/botu/Dev/rl4co/examples/other/lightning_logs\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. 
Generating dataset instead\n", + "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------------\n", + "0 | env | MTVRPEnv | 0 \n", + "1 | policy | AttentionModelPolicy | 3.7 M \n", + "2 | baseline | SharedBaseline | 0 \n", + "--------------------------------------------------\n", + "3.7 M Trainable params\n", + "0 Non-trainable params\n", + "3.7 M Total params\n", + "14.868 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "bac126d9831c49da91319e21e79150e1", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Cost: 17.188127517700195\n", + "Problem: OVRPLTW\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Cost: 14.578388214111328\n", + "Problem: CVRP\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Cost: 12.24499797821045\n", + "Problem: VRPB\n" + ] + } + ], + "source": [ + "# Greedy rollouts over trained model (same states as previous plot)\n", + "policy = model.policy.to(device)\n", + "out = policy(td.to(device).clone(), env, phase=\"test\", decode_type=\"greedy\")\n", + "actions_mvmoe = out['actions'].cpu().detach()\n", + "rewards_mvmoe = out['reward'].cpu().detach()\n", + "\n", + "for idx in [0, 1, 2]:\n", + " env.render(td[idx], actions_mvmoe[idx])\n", + " print(\"Cost: \", -rewards_mvmoe[idx].item())\n", + " print(\"Problem: \", variant_names[idx])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Getting gaps to classical solvers\n", + "\n", + "\n", + "We additionally offer an optional `solve` API to get solutions from classical solvers. We can use this to get the gaps to the optimal solutions." + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "metadata": {}, + "outputs": [], + "source": [ + "# PyVRP - HGS\n", + "pyvrp_actions, pyvrp_costs = env.solve(td, max_runtime=5, num_procs=10, solver=\"pyvrp\")\n", + "rewards_pyvrp = env.get_reward(td, pyvrp_actions)" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "tensor([-17.1881, -14.5784, -12.2450]) tensor([-17.5034, -18.8677, -15.3984]) tensor([-12.6954, -11.9107, -9.9261])\n", + "Gap to HGS (NI): 50.47%\n", + "Gap to HGS (MVMoE): 27.05%\n" + ] + } + ], + "source": [ + "def calculate_gap(cost, bks): \n", + " gaps = (cost - bks) / bks\n", + " return gaps.mean() * 100\n", + "\n", + "# Nearest insertion\n", + "actions = rollout(env, td.clone(), greedy_policy)\n", + "rewards_ni = env.get_reward(td, actions)\n", + "\n", + "print(rewards_mvmoe, rewards_ni, rewards_pyvrp) \n", + "print(f\"Gap to HGS (NI): {calculate_gap(-rewards_ni, 
-rewards_pyvrp):.2f}%\")\n", + "print(f\"Gap to HGS (MVMoE): {calculate_gap(-rewards_mvmoe, -rewards_pyvrp):.2f}%\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "With only two short epochs, we can already get better than NI!" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "rl4co", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.8" + }, + "orig_nbformat": 4 + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/other/1-mtvrp/index.html b/examples/other/1-mtvrp/index.html new file mode 100644 index 00000000..fbfec565 --- /dev/null +++ b/examples/other/1-mtvrp/index.html @@ -0,0 +1,3996 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + MTVRP: Multi-task VRP environment - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/other/2-scheduling/2-scheduling.ipynb b/examples/other/2-scheduling/2-scheduling.ipynb new file mode 100644 index 00000000..ffe6782b --- /dev/null +++ b/examples/other/2-scheduling/2-scheduling.ipynb @@ -0,0 +1,829 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Solving the Flexible Job-Shop Scheduling Problem (FJSP)\n", + "\n", + "The following notebook explains the FJSP and explains the solution construction process using an encoder-decoder architecture based on a Heterogeneous Graph Neural Network (HetGNN)\n", + "\n", + "\"Open" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: torch_geometric in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (2.5.0)\n", + "Requirement already satisfied: tqdm in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (4.66.1)\n", + "Requirement already satisfied: numpy in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (1.26.3)\n", + "Requirement already satisfied: scipy in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (1.11.4)\n", + "Requirement already satisfied: fsspec in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (2023.12.2)\n", + "Requirement already satisfied: jinja2 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (3.1.3)\n", + "Requirement already satisfied: aiohttp in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (3.9.1)\n", + "Requirement already satisfied: requests in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) 
(2.31.0)\n", + "Requirement already satisfied: pyparsing in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (3.1.1)\n", + "Requirement already satisfied: scikit-learn in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (1.4.1.post1)\n", + "Requirement already satisfied: psutil>=5.8.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (5.9.7)\n", + "Requirement already satisfied: attrs>=17.3.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (23.2.0)\n", + "Requirement already satisfied: multidict<7.0,>=4.5 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (6.0.4)\n", + "Requirement already satisfied: yarl<2.0,>=1.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (1.9.4)\n", + "Requirement already satisfied: frozenlist>=1.1.1 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (1.4.1)\n", + "Requirement already satisfied: aiosignal>=1.1.2 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (1.3.1)\n", + "Requirement already satisfied: async-timeout<5.0,>=4.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (4.0.3)\n", + "Requirement already satisfied: MarkupSafe>=2.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from jinja2->torch_geometric) (2.1.3)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) (3.3.2)\n", + "Requirement already satisfied: idna<4,>=2.5 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) 
(3.6)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) (1.26.18)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) (2023.11.17)\n", + "Requirement already satisfied: joblib>=1.2.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from scikit-learn->torch_geometric) (1.3.2)\n", + "Requirement already satisfied: threadpoolctl>=2.0.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from scikit-learn->torch_geometric) (3.3.0)\n" + ] + } + ], + "source": [ + "! pip install torch_geometric" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2\n", + "\n", + "import torch\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "import numpy as np\n", + "from IPython.display import display, clear_output\n", + "import time\n", + "import networkx as nx\n", + "import matplotlib.pyplot as plt\n", + "from rl4co.envs import FJSPEnv\n", + "from rl4co.models.zoo.l2d import L2DModel\n", + "from rl4co.models.zoo.l2d.policy import L2DPolicy\n", + "from rl4co.models.zoo.l2d.decoder import L2DDecoder\n", + "from rl4co.models.nn.graph.hgnn import HetGNNEncoder\n", + "from rl4co.utils.trainer import RL4COTrainer" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "generator_params = {\n", + " \"num_jobs\": 5, # the total number of jobs\n", + " \"num_machines\": 5, # the total number of machines that can process operations\n", + " \"min_ops_per_job\": 1, # minimum number of operatios per job\n", + " \"max_ops_per_job\": 2, # maximum number of operations per job\n", + " \"min_processing_time\": 1, # the minimum time required for a machine to 
process an operation\n", + " \"max_processing_time\": 20, # the maximum time required for a machine to process an operation\n", + " \"min_eligible_ma_per_op\": 1, # the minimum number of machines capable to process an operation\n", + " \"max_eligible_ma_per_op\": 2, # the maximum number of machines capable to process an operation\n", + "}" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "env = FJSPEnv(generator_params=generator_params)\n", + "td = env.reset(batch_size=[1])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Visualize the Problem\n", + "\n", + "Below we visualize the generated instance of the FJSP. Blue nodes correspond to machines, red nodes to operations and yellow nodes to jobs. A machine may process an operation if there exists an edge between the two. \n", + "\n", + "The thickness of the connection between a machine and an operation node specifies the processing time the respective machine needs to process the operation (thicker line := longer processing).\n", + "\n", + "Each operation belongs to exactly one job, where an edge between a job and an operation node indicates that the respective operation belongs to the job. The number above an operation-job edge specifies the precedence-order in which the operations of a job need to be processed. A job is done when all operations belonging to it are scheduled. The instance is solved when all jobs are fully scheduled.\n", + "\n", + "Also note that some operation nodes are not connected. These operation nodes are padded, so that all instances in a batch have the same number of operations (where we determine the maximum number of operations as num_jobs * max_ops_per_job). 
" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "jupyter": { + "source_hidden": true + } + }, + "outputs": [ + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAxoAAAH4CAYAAADNU5vyAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8g+/7EAAAACXBIWXMAAA9hAAAPYQGoP6dpAADk4klEQVR4nOzdeVxU97k/8M/AsO+yCSr7DuKGirLNqLjHnSxNbYwm19g2drltb5vYNr03/po2t02bpI0mJNGbxiYFUWPiBjoDgqCiuLDvi4LsyDrDLOf3B5lTRxZhFmZ73q8XL4U553u+6HA4z3d5Hg7DMAwIIYQQQgghRIPMdN0BQgghhBBCiPGhQIMQQgghhBCicRRoEEIIIYQQQjSOAg1CCCGEEEKIxlGgQQghhBBCCNE4CjQIIYQQQgghGkeBBiGEEEIIIUTjKNAghBBCCCGEaBwFGoQQQgghhBCNo0CDEGJ0jhw5Ag6Hg/r6er3rB4/HA4/Hm/a+6Oq6U9Ha2oodO3bA1dUVHA4Hf/nLX6bcxq5du2Bvb6/5zhFCCJkyCjQIIXpv06ZNsLW1RV9f37jHPP/887C0tERnZ+c09ky/lJaW4o033tB5gKWqn/zkJzh//jx+9atf4bPPPsPatWvHPG5wcBBvvPEGhELh9HbwEW+88QY4HM6YH4cOHWKP43A4+OEPf6h0bnt7O370ox8hLCwMNjY28PDwwJIlS/Bf//Vf6O/vZ4/btWuXUruOjo6YN28e/vSnP0EsFk/b90oIIari6roDhBDyJM8//zxOnz6NEydO4Hvf+96o1wcHB3Hq1CmsXbsWrq6u2LlzJ5599llYWVnpoLcTu3DhgtbaLi0txe9+9zvweDz4+flN23U15dKlS9i8eTN+9rOfTXjc4OAgfve73wGAzmdpPvjgg1EzKEuXLh33+K6uLsTExKC3txe7d+9GWFgYOjs7cefOHXzwwQfYt2+fUntWVlZITU0FAPT09OD48eP42c9+huvXr+OLL77QzjdFCCEaQoEGIUTvbdq0CQ4ODjh27NiYgcapU6cwMDCA559/HgBgbm4Oc3Pz6e7mpFhaWprUdaeira0Nzs7Ouu7GlOzYsQNubm6TPv7jjz9GY2Mj8vLysHz5cqXXent7R/0/cblcfPe732U///73v4+lS5fiyy+/xJ///Gd4e3ur9w0QQogW0dIpQojes7GxwbZt23Dx4kW0tbWNev3YsWNwcHDApk2bAIy9N6KwsBBr1qyBm5sbbGxs4O/vj927d7OvC4VCcDicUctx6uvrweFwcOTIEfZrd+7cwa5duxAQEABra2vMnDkTu3fvntSyrcf3Svj5+Y27BEfRl4aGBnz/+99HaGgobGxs4OrqipSUFKXv78iRI0hJSQEA8Pn8UW2MtUejra0Ne/bsgaenJ6ytrTFv3jwcPXp0zO//f//3f/Hhhx8iMDAQVlZWWLx4Ma5fv/7E7xcAamtrkZKSghkzZsDW1haxsbH45ptvlPrO4XDAMAz+9re/sX0fS319Pdzd3QEAv/vd79hj33jjDaXj7t+/jy1btsDe3h7u7u742c9+BplMpnSMXC7HX/7yF0RGRsLa2hqenp7Yu3cvuru7J/V9qaKmpgbm5uaIjY0d9ZqjoyOsra0nPN/MzIz9fzTUJXKEENNBMxqEEIPw/PPP4+jRo/jXv/6ltOa9q6sL58+fx3PPPQcbG5sxz21ra8Pq1avh7u6OX/7yl3B2dkZ9fT0yMjJU6ktmZiZqa2vx4osvYubMmSgpKcGHH36IkpISFBQUjPuQPJa//OUvSuvyAeCdd97BrVu34OrqCgC4fv0
6rly5gmeffRazZ89GfX09PvjgA/B4PJSWlsLW1haJiYnYv38/3n33Xbz22msIDw8HAPbPxw0NDYHH46G6uho//OEP4e/vj7S0NOzatQs9PT340Y9+pHT8sWPH0NfXh71794LD4eCPf/wjtm3bhtraWlhYWIz7/bW2tmL58uUYHBzE/v374erqiqNHj2LTpk1IT0/H1q1bkZiYiM8++ww7d+5EcnLymLNWCu7u7uwSo61bt2Lbtm0AgOjoaPYYmUyGNWvWYOnSpfjf//1fZGVl4U9/+hMCAwOxb98+9ri9e/fiyJEjePHFF7F//37U1dXh/fffR1FREfLy8ib8vhS6urqUPjc3N4eLi8u4x/v6+kImk+Gzzz7DCy+88MT2x1JTUwMA7PuDmBaZTAaJRKLrbhANsbS0hJmZ8Y77U6BBCDEIK1asgJeXF44dO6YUaKSlpUEikbDLpsZy5coVdHd348KFC4iJiWG//uabb6rUl+9///v4z//8T6WvxcbG4rnnnkNubi4SEhIm3daWLVuUPk9LS8PNmzfx3//935g7dy4AYMOGDdixY4fScU899RSWLVuG48ePY+fOnQgICEBCQgLeffddJCcnP3HvwocffoiysjL84x//YP/tXnnlFSQlJeHAgQPYvXs3HBwc2OMbGxtRVVXFPkSHhoZi8+bNOH/+PDZu3Djudd566y20trbi8uXLiI+PBwC8/PLLiI6Oxk9/+lNs3rwZAQEBCAgIwM6dOxESEqK0VOhxdnZ22LFjB/bt24fo6OgxjxWJRHjmmWfw61//mv2+Fi5ciI8//pgNNHJzc5GamorPP/8c3/nOd9hz+Xw+1q5di7S0NKWvjyc0NFTpc19f3wlnGnbv3o133nkHu3btwltvvQUej4fExESsX78eTk5OY57T0dEBAHj48CH+9a9/4eTJk4iOjh51bWLcGIbBgwcP0NPTo1Y7AwMcNDZaYniYA0tLBj4+w7CzYzTTSTJlZmZm8Pf3N4jlraqgQIMQYhDMzc3x7LPP4p133kF9fT272fnYsWPw9PTEypUrxz1Xse7/66+/xrx58yY1Uj2RR2dORCIR+vv72aUwN2/enFKg8ajS0lLs3r0bmzdvxoEDB8a8nkQiQW9vL4KCguDs7IybN29i586dU77WmTNnMHPmTDz33HPs1ywsLLB//34899xzyM7OVgognnnmGaWResX3WFtb+8TrLFmyhA0yAMDe3h7/8R//gV/96lcoLS1FVFTUlPv/JK+88orS5wkJCfjss8/Yz9PS0uDk5ITk5GT2QR4AFi1aBHt7ewgEgkkFGsePH4ejoyP7+Xizagqenp64ffs2/vu//xsnTpzAoUOHcOjQIVhaWuLAgQM4cOCA0ozYwMAAu1RMYfny5UrfCzENiiDDw8MDtra2U5o5LSvj4KOPzHH+vBnq6jhgmH+fy+Ew8PdnsGaNHC+/LEN4OAUd00Uul6O5uRktLS3w8fGZ0v+poaBAgxBiMJ5//nm88847OHbsGF577TXcu3cPly9fxv79+yfc/J2UlITt27fjd7/7Hd555x3weDxs2bIF3/nOd1TKTNXV1YXf/e53+OKLL0btGXn48OGU2wNGNgJv27YNs2bNwv/93/8p/cIZGhrC73//e3z66ae4f/8+GObfDwKqXq+hoQHBwcGjpuwVS60aGhqUvu7j46P0uSLoeNJ+hoaGhjGzMD16HU0HGtbW1qMezl1cXJT6WlVVhYcPH8LDw2PMNsbaCzSWxMTEKW0GBwAvLy988MEH+Pvf/46qqiqcP38ef/jDH/Cb3/wGXl5eeOmll5S+l9OnTwMYyUDl7++P2bNnT+l6xPDJZDI2yJjKkrm6OmDvXiAzE+ByAal09DEMw0FtLQcffWSGDz7gIjkZOHwY8PfX4DdAxuXu7o7m5mZIpVK1B8H0EQUahBCDsWjRIoSFheGf//wnXnvtNfzzn/8EwzATLpsCRmoZpKeno6CgAKdPn8b58+exe/d
u/OlPf0JBQQHs7e3HHUl6fAMxADz99NO4cuUKfv7zn2P+/Pmwt7eHXC7H2rVrIZfLVfredu3ahebmZly7dk1phBwAXn31VXz66af48Y9/jGXLlsHJyQkcDgfPPvusytebqvECuUeDHn0xmYxjcrkcHh4e+Pzzz8d8/fFARRs4HA5CQkIQEhKCDRs2IDg4GJ9//rlSoGFubo5Vq1ZpvS9Evyn2ZNja2k76nNRU4NVX/x1cjBVkPErxukAAREQA770HPPJWJFqiWDIlk8ko0CCEEF17/vnn8etf/xp37tzBsWPHEBwcjMWLF0/q3NjYWMTGxuLgwYM4duwYnn/+eXzxxRd46aWX2BH6x9c/Pz6y393djYsXL+J3v/sdfvOb37Bfr6qqUvl7euutt3Dy5ElkZGQgLCxs1Ovp6el44YUX8Kc//Yn9mkgkGtXXqUy7+/r64s6dO5DL5UqzGuXl5ezrmuDr64uKiopRX1fnOppYXhAYGIisrCzExcU9cbnTdAgICICLiwtaWlp03RWixyb73j94EHhk9eWUSKUjHy+/DLS2Aq+/rlo7ZHKMcbnUo4x3mzshxCgpZi9+85vf4NatW0+czQBGgoPHR97nz58PAGyFZV9fX5ibmyMnJ0fpuL///e9KnytGyx9v7y9/+cukv4dHZWVl4cCBA3j99ddHbQx/9JqPX++9994bNdtiZ2cHYHSwNJb169fjwYMH+PLLL9mvSaVSvPfee7C3t0dSUtLUvpEJrnPt2jXk5+ezXxsYGMCHH34IPz8/RERETLlNxaiuOptin376achkMvzP//zPqNekUqnaG27Hc/XqVQwMDIz6+rVr19DZ2UkbvInaUlNVDzIed+AA8PHHmmmLmCaa0SCEGBR/f38sX74cp06dAoBJBRpHjx7F3//+d2zduhWBgYHo6+vDRx99BEdHR6xfvx4A4OTkhJSUFLz33nvgcDgIDAzE119/PWqtvqOjIxITE/HHP/4REokEs2bNwoULF1BXV6fS9/Pcc8/B3d0dwcHB+Mc//qH0WnJyMjw9PbFx40Z89tlncHJyQkREBPLz85GVlTVqrfb8+fNhbm6OP/zhD3j48CGsrKywYsWKMfch/Md//AcOHz6MXbt24caNG/Dz80N6ejry8vLwl7/8RSnjlDp++ctf4p///CfWrVuH/fv3Y8aMGTh69Cjq6upw/PhxldI62tjYICIiAl9++SVCQkIwY8YMREVFTWmvR1JSEvbu3Yvf//73uHXrFlavXg0LCwtUVVUhLS0Nf/3rX0dl+tKEzz77DJ9//jm2bt2KRYsWwdLSEmVlZfjkk09gbW2N1157TePXJKajrm5kuZQm/fCHwIoVhrFn44033sDJkydx69atcY/h8XiYP3++yoNDZGoo0CCEGJznn38eV65cwZIlSxAUFPTE45OSknDt2jV88cUXaG1thZOTE5YsWYLPP/8c/o/89nzvvfcgkUhw6NAhWFlZ4emnn8bbb7896gH22LFjePXVV/G3v/0NDMNg9erVOHv2rEpVmhUZj8aqqSAQCODp6Ym//vWvMDc3x+effw6RSIS4uDhkZWVhzZo1SsfPnDkThw4dwu9//3vs2bMHMpkMAoFgzEDDxsYGQqEQv/zlL3H06FH09vYiNDQUn376KXbt2jXl72M8np6euHLlCv7rv/4L7733HkQiEaKjo3H69Gls2LBB5XZTU1Px6quv4ic/+QmGh4fx29/+dsqbyg8dOoRFixbh8OHDeO2118DlcuHn54fvfve7iIuLU7lvCopZqEf3jOzduxe2tra4ePEiTp06hd7eXri7u2P16tX41a9+hQULFqh9XWK69u598l6MqZJKR9q9cEG183ft2oWjR49i7969OHTokNJrP/jBD/D3v/8dL7zwglJRVG3KyMgwyr0Q+orD6ONOPkIIIcTA9fb2wsnJCQcOHBhziRYhkyUSiVBXVwd/f/9xq8eXlgKRkdrrQ2kpME79zwnt2rULly5
dQm9vL1paWtg9USKRCF5eXnB0dASfz9dIoDGZGQ19M5n/W0NGezQIIYQQLbh+/ToAqLQPhZCpOnRoJIWtNnC5wAcfqH7+woULMWfOHGRkZLBfy8jIgI+Pj9Is3rlz5xAfHw9nZ2e4urpi48aNqKmpUWrr3r17eO655zBjxgzY2dkhJiYGV69eVTrms88+g5+fH5ycnPDss8+ir6+PfY3H4+HHP/4x+7mfnx/+3//7f2yRUh8fH3z44YdK7TU1NeHpp5+Gs7MzZsyYgc2bN09YmJP8GwUahBBCiAbduXMHf/7zn/HCCy/A1dVVrSVihEzWmTOaXzalIJUCZ8+q18bu3bvx6aefsp9/8sknePHFF5WOGRgYwE9/+lMUFhbi4sWLMDMzw9atW9k03v39/UhKSsL9+/fx1Vdf4fbt2/jFL36hlOa7pqYGJ0+exNdff42vv/4a2dnZeOuttybs25/+9CfExMSgqKgI3//+97Fv3z42W55EIsGaNWvg4OCAy5cvIy8vD/b29li7di2Gh4fV+0cxAbRHgxBCCNGgjIwMvPXWW4iJicE777wzqi4KIZrW1wfU1mr3GjU1QH8/YG+v2vnf/e538atf/YpNGZ6Xl4cvvvgCQqGQPWb79u1K53zyySdwd3dHaWkpoqKicOzYMbS3t+P69euYMWMGAIzapyeXy3HkyBE2ocXOnTtx8eJFHDx4cNy+rV+/Ht///vcBAP/1X/+Fd955BwKBAKGhofjyyy8hl8uRmprKpqL99NNP4ezsDKFQiNWrV6v2D2IiKNAghBBCNOiNN97AG2+8oetuEBNSUwNoe8ctwwDV1cC3mcGnzN3dHRs2bMCRI0fAMAw2bNgANzc3pWOqqqrwm9/8BlevXkVHRwc7U9HY2IioqCjcunULCxYsYIOMsfj5+SllzfPy8hqVPfBx0dHR7N85HA5mzpzJnnP79m1UV1ePysQnEolGLesio1GgQQghhBBiwL4tB6T319m9ezd++MMfAgD+9re/jXr9qaeegq+vLz766CN4e3tDLpcjKiqKXaI0meKaj2eU4nA4SkurpnpOf38/Fi1ahM8//3zUee7u7k/sj6mjQIMQQgghxIBZWRnGdRT7Gjgczqj03J2dnaioqMBHH32EhIQEAEBubq7SMdHR0UhNTUVXV9eEsxqatHDhQnz55Zfw8PCgZZAqoM3ghBBCCCEGLCgI+Hb7gNZwOCPXUYe5uTnKyspQWlqqVF8GAFxcXODq6ooPP/wQ1dXVuHTpEn76058qHfPcc89h5syZ2LJlC/Ly8lBbW4vjx48jPz9fvY5N4Pnnn4ebmxs2b96My5cvo66uDkKhEPv378e9e/e0dl1jQYEGIYQQQogBs7cHAgK0e43AQNU3gj/K0dFxzJkBMzMzfPHFF7hx4waioqLwk5/8BG+//bbSMZaWlrhw4QI8PDywfv16zJ07F2+99daooEWTbG1tkZOTAx8fH2zbtg3h4eHYs2cPRCIRzXBMAhXsI4QQQgjRY5Mp6rZ//0itC22kuOVygX37gHff1Xzbpo4K9hFCCCGEEL32yivaraOxb5922ibGjQINQgghhBADFxEBJCdrvjo4lzvSbni4ZtslpoECDUIIIYQQI3D4sHYCjcOHNdsmMR0UaBBCCCGEGAF/f+C99yY+xg79mIdbWIKrmIdbsEP/hMe///5Iu4SogupoEEIIIYQYiZdeAlpbgQMH/v21cJTiFRzCepxBAGphhn/nAZKDg1oE4AzW4xBeQRki2NcOHgT27JnO3hNjQzMahBBCCCFG5PXXgY8+AkIt63ABq1GKSOzDBwhCjVKQAQBmYBCEGuzDByhFJC5gNUIt65CaCrz2mo6+AWI0aEaDEELI5PT3A9XVgFg8UiI4KEgzifUJIRr3ElKxm/Mq5BwpwAAWmDglleJ1PkeAUk4EzJj3ALw0DT0lxowCDUIIIeMrLQUOHQLOnAFqa4FHSy9xOCNVwtavH8mtGRExfjuEkOl
z8CBw4ADMMPWlK1xGCoilwMsvj6zBev11bfSQmAhaOkUIIWS0ujpg9WogMnKkClhNjXKQAYx8XlMz8npk5MjxdXW66S8hZERqqvIGDXUcOAB8/LFm2iImiQINQgghylJTR2YnBIKRz59UBUzxukAwcl5qqnb7RwgZW10d8Oqrmm3zhz802QGEXbt2YcuWLbruhkGjQIMQQsi/HTw4smRCJJp6mWGpdOS8l18eaYcQMr327tV8eXCpdKRdNTQ1NWH37t3w9vaGpaUlfH198aMf/QidnZ0a6qR66uvrweFwcOvWLaWv//Wvf8WRI0d00idjQYEGIYSQEbTkghDDVVoKZGZqJ9DIzATKylQ6vba2FjExMaiqqsI///lPVFdX49ChQ7h48SKWLVuGrq4uzfb3EcPDw2qd7+TkBGdnZ810xkRRoEEIIYSWXBBi6A4d0nxZcAUud2Qvlgp+8IMfwNLSEhcuXEBSUhJ8fHywbt06ZGVl4f79+3j9283mfn5++J//+R8899xzsLOzw6xZs/C3v/1Nqa2enh689NJLcHd3h6OjI1asWIHbt2+zr7/xxhuYP38+UlNT4e/vD2trawDAuXPnEB8fD2dnZ7i6umLjxo2oqalhz/P/tiLhggULwOFwwOPxAIxeOiUWi7F//354eHjA2toa8fHxuH79Ovu6UCgEh8PBxYsXERMTA1tbWyxfvhwVFRUq/dsZAwo0CCGE6O2SC0LIJJ05o/mfYQWpFDh7dsqndXV14fz58/j+978PGxsbpddmzpyJ559/Hl9++SWYbxNNvP3225g3bx6Kiorwy1/+Ej/60Y+QmZnJnpOSkoK2tjacPXsWN27cwMKFC7Fy5UqlWZHq6mocP34cGRkZ7FKogYEB/PSnP0VhYSEuXrwIMzMzbN26FXK5HABw7do1AEBWVhZaWlqQkZEx5vfzi1/8AsePH8fRo0dx8+ZNBAUFYc2aNaNmZV5//XX86U9/QmFhIbhcLnbv3j3lfzujwRBCCDFtJSUMM5JDSjsfpaW6/g4JMWhDQ0NMaWkpMzQ0NPYBvb0Mw+Fo9+eYw2GYvr4p9bugoIABwJw4cWLM1//85z8zAJjW1lbG19eXWbt2rdLrzzzzDLNu3TqGYRjm8uXLjKOjIyMSiZSOCQwMZA4fPswwDMP89re/ZSwsLJi2trYJ+9Xe3s4AYO7evcswDMPU1dUxAJiioiKl41544QVm8+bNDMMwTH9/P2NhYcF8/vnn7OvDw8OMt7c388c//pFhGIYRCAQMACYrK4s95ptvvmEAjPt/98T/WwNHMxqEEGLq9HTJBSFkksZKP61pDDNSsFOlUyfXt2XLlo36vOzbvSG3b99Gf38/XF1dYW9vz37U1dUpLYPy9fWFu7u7UjtVVVV47rnnEBAQAEdHR/j5+QEAGhsbJ/091NTUQCKRIC4ujv2ahYUFlixZwvZRITo6mv27l5cXAKCtrW3S1zImVLCPEEJMnR4uuSCETIFYrJfXCQoKAofDQVlZGbZu3Trq9bKyMri4uIwKDMbS398PLy8vCIXCUa89umHbzs5u1OtPPfUUfH198dFHH8Hb2xtyuRxRUVFqbxYfj4WFBft3DocDAOwyLVNDMxqEEGLK+vpGKn5rU00N0N+v3WsQYsqsrPTyOq6urkhOTsbf//53DA0NKb324MEDfP7553jmmWfYh/GCggKlYwoKChAeHg4AWLhwIR48eAAul4ugoCClDzc3t3H70NnZiYqKChw4cAArV65EeHg4uru7lY6xtLQEAMhksnHbCQwMhKWlJfLy8tivSSQSXL9+HREREZP41zBNFGgQQogp0/MlF4SQSQgKAr59WNcaDmfkOlP0/vvvQywWY82aNcjJyUFTUxPOnTuH5ORkzJo1CwcfqbmTl5eHP/7xj6isrMTf/vY3pKWl4Uc/+hEAYNWqVVi2bBm2bNmCCxcuoL6+HleuXMHrr7+OwsLCca/v4uICV1dXfPjhh6iursalS5f
w05/+VOkYDw8P2NjY4Ny5c2htbcXDhw9HtWNnZ4d9+/bh5z//Oc6dO4fS0lK8/PLLGBwcxJ49e6b872IqKNAghBBTpqdLLgghU2BvDwQEaPcagYEj15mi4OBgFBYWIiAgAE8//TQCAwPxH//xH+Dz+cjPz8eMGTPYY//zP/8ThYWFWLBgAd588038+c9/xpo1awCMLEE6c+YMEhMT8eKLLyIkJATPPvssGhoa4OnpOe71zczM8MUXX+DGjRuIiorCT37yE7z99ttKx3C5XLz77rs4fPgwvL29sXnz5jHbeuutt7B9+3bs3LkTCxcuRHV1Nc6fPw8XF5cp/7uYCg4z2R06hBBCjM+tW8CCBdq/TlERMH++9q9DiBESiUSoq6tTqg0xyv79I4kXtLHfissF9u0D3n1X821/y8/PDz/+8Y/x4x//WGvX0EeT+r81YDSjQQghpkyPl1wQQqbglVe0m9Rh3z7ttE2MGgUahBBiyvR4yQUhZAoiIoDkZM2nquZyR9r9dlM2IVNB6W0JIcTUrV+v3SUX69Zpvl1CyGiHD48EHJr8WeZyR9rVsvr6eq1fg0w/mtEghBBTR0suCDEO/v7Ae+9NeIjUGugLBHrDR/6UPmlbwPvvj7RLiApoRoMQQkydYsmFQKD5kVA+n5ZcEDKdXnoJaG0FDhxgvzTgCzRvAjqXAiIvKA8zywHrFsD1KuD9FWDX8MhrBw8ClLqVqIGyThFCCAHq6kYCDpFIc21aWwOlpTQaSoiaVMpMlJqKoTd/gMofDqM7BoAUEw8vf/u6SyEQ8r4lbH79dwoypgFlnSKEEGL8JrHkYspoyQUhOtO8Hrh+lIPuBd9mlXvSGpZvX+9ewMH1oxw0r6NxaKI+CjQIIYSMeOkl4M03NdMWLbkgRGcaGg6isvJlyBkxYD7FgMGcgZwRo7LyZTQ0HHzy8YRMgAINQggh//b668BHH40se5pqmkwud+S81FTgtde00z9CyISam1NRV3fgyQdOQl3dAbS0fKyRtohpokCDEEKIspdeGtlbweePfP6kgEPxOp8/ch7NZBCiE0NDdaiuflWjbVZV/RBDQ3Uqn79r1y5s2bJlUscKhUJwOBz09PSofD2iXyjrFCGEkNH8/YELF0YCh0OHgLNngZoa4NH8IRzOSDG+detGUthSdilCdKqyci/kcs2mqpbLpais3It58y6odP5f//pXUN4h00WBBiGEkPFFRADvvjvy9/5+oLoaEIsBKysgKIgqfhOiJwYGStHdnamFlqXo7s7EwEAZ7OymPpjg5OSkhT4RQ0FLpwghhEyOvT0wfz6wdOnInxRkEKI3mpsPQXvjx1w0N3+g0pmPLp0Si8XYv38/PDw8YG1tjfj4eFy/fn3UOXl5eYiOjoa1tTViY2NRXFzMvtbQ0ICnnnoKLi4usLOzQ2RkJM6cOaNS34j2UaBBCCGEEGLgOjvPYKQYhjZI0dl5Vu1WfvGLX+D48eM4evQobt68iaCgIKxZswZdXV1Kx/385z/Hn/70J1y/fh3u7u546qmnIJFIAAA/+MEPIBaLkZOTg7t37+IPf/gD7GnQQ29RoEEIIYQQYsCk0j6IRLVavYZIVAOptF/l8wcGBvDBBx/g7bffxrp16xAREYGPPvoINjY2+Phj5cxWv/3tb5GcnIy5c+fi6NGjaG1txYkTJwAAjY2NiIuLw9y5cxEQEICNGzciMTFRre+NaA8FGoQQQgghBmxoqAaAtjdcMxgaqlb57JqaGkgkEsTFxbFfs7CwwJIlS1BWVqZ07LJly9i/z5gxA6Ghoewx+/fvx5tvvom4uDj89re/xZ07d1TuE9E+CjQIIYQQQgwYw4iN6joTeemll1BbW4udO3fi7t27iImJwXvvvafrbpFxUKBBCCGEEGLAOBwrvb9OYGAgLC0tkZeXx35NIpHg+vXriIiIUDq2oKCA/Xt3dzcqKysR/kj67Dlz5uCVV15BRkYG/vM//xMfffSRyv0i2kXpbQk
hhBBCDJiNTRAADrS7fIrz7XVUY2dnh3379uHnP/85ZsyYAR8fH/zxj3/E4OAg9jxW5PO///u/4erqCk9PT7z++utwc3NjM1f9+Mc/xrp16xASEoLu7m4IBAKlIIToFwo0CCGEEEIMGJdrD2vrAIhENVq7hrV1ILhc9bI7vfXWW5DL5di5cyf6+voQExOD8+fPw8XFZdRxP/rRj1BVVYX58+fj9OnTsLS0BADIZDL84Ac/wL179+Do6Ii1a9finXfeUatfRHs4DJVrJIQQQgjRWyKRCHV1dfD394e1tfWYx1RV7cf9+x9AOyluuZg1ax+Cg9+d8pnPPfcczM3N8Y9//EML/TJ8k/m/NWS0R4MQQgghxMB5e78CbdbR8PbeN7UzpFKUlpYiPz8fkZGRWuoX0XcUaBBCCCGEGDg7uwi4uCRD86viuXBxSYad3dT2QRQXFyMmJgaRkZF45ZVXNNwnYihojwYhhBBCiBEICTmM69cjIJdrbmbDzIyLkJDDUz5v/vz5GBwc1Fg/iGGiGQ1CCCGEECNgY+OPoCDN1pQIDn4fNjb+Gm2TmA4KNAghhBBCDMBk8vd4e78Ef/83NXI9f/+D8PLa8+QDicqMPScTBRqEEEIIIXrMwsICACa9FMnX93WEhHwEMzNrTH2VPBdmZtYIDU2Fr+9rUzyXTNXw8DAAwNzcXMc90Q5Kb0sIIYQQoudaWlrQ09MDDw8P2NragsPhPPEckagedXU/xMOHFzEScEy0d2PkdSenlfD3fx/W1n6a6TgZl1wuR3NzMywsLODj4zOp/1NDQ4EGIYQQQoieYxgGDx48QE9Pz5TPlUqrMTj4JYaHL0Mma4JyBXEOzM3nwNIyAba2z4LLDdRUl8kkmJmZwd/fny1IaGwo0CCEEEIIMRAymQwSiUSN8/shEtVALhfDzMwK1taBMDdXr+I3UZ2lpSXMzIx3JwMFGoQQQianvx+orgbEYsDKCggKAuzpAYUQQsjYqI4GIYSQ8ZWWAocOAWfOALW1wKNjUxwOEBAArF8PvPIKEBGhu34SQgjROzSjQQghZLS6OmDvXiAzE+ByAekEm0gVrycnA4cPA/6Uc58QQgiltyWEEPK41NSR2QmBYOTziYKMR18XCEbOS03Vbv8IIYQYBAo0CCGE/NvBg8DLLwMi0ZMDjMdJpSPnvfzySDuEEEJMGi2dIoQQMiI1dSRI0GR7e6iqMCGEmCoKNAghhIzsyYiIGJmR0BRr65HN5LRngxBCTBItnSKEEDKy8XuqS6WeRCodaZcQQohJohkNQggxdaWlQGSkdtsPD9de+4QQQvQSzWgQQoipO3RoJEWtNnC5wAcfaKdtQggheo1mNAghxNQFBQE1Ndptv6pKe+0TQgjRSxRoEEKIKevrA5yclCt+axqHA/T2Avb22rsGIYQQvUNLpwghxJTV1Gg3yABG2q+u1u41CCGE6B0KNAghxJSJxcZ1HUIIIXqDAg1CCDFlVlbGdR1CCCF6g/ZoEEKIKevvBxwdaY8GIYQQjaMZDUIIMWX29kBAgHavERhIQQYhhJggCjQIIcTUrV+v3Toa69Zpp21CCCF6jZZOEUKIqaPK4IQQQrSAZjQIIcTURUQAycman9XgckfapSCDEEJMEs1oEEIIAerqRgIOkUhzbVpbj8xm+Ptrrk1CCCEGg2Y0CCGEjAQD772n2Tbff5+CDEIIMWEUaBBCCBnx0kvAm29qpq2DB4E9ezTTFiGEEINES6cIIYQoS00FXn0VkEpHPiaLyx35eP99CjIIIYTQjAYhhJDHvPTSyN4KPn/k8ydtEle8zuePnEdBBiGEENCMBiGEkImUlgKHDgFnzwI1NcoVxDmckWJ869YB+/ZRdilCCCFKKNAghBAyOf39QHU1IBYDVlZAUBBV/CaEEDIuCjQIIYQQQgghGkd7NAghhBBCCCEaR4EGIYQQQgghROMo0CCEEEIIIYRoHAUahBBCCCGEEI2jQIMQQgghhBCicRRoEEI
IIYQQQjSOAg1CCCGEEEKIxlGgQQghhBBCCNE4CjQIIYQQQgghGkeBBiGEEEIIIUTjKNAghBBCCCGEaBwFGoQQQgghhBCNo0CDEEIIIYQQonEUaBBCCCGEEEI0jgINQgghhBBCiMZRoEEIIYQQQgjROAo0CCGEEEIIIRrH1XUHCCGEGIj+fqC6GhCLASsrICgIsLfXda8IIYToKQo0CCGEjK+0FDh0CDhzBqitBRjm369xOEBAALB+PfDKK0BEhO76SQghRO9wGObR3xqEEEIIgLo6YO9eIDMT4HIBqXT8YxWvJycDhw8D/v7T109CCCF6i/ZoEEIIUZaaOjI7IRCMfD5RkPHo6wLByHmpqdrtHyGEEINAgQYhhJB/O3gQePllQCR6coDxOKl05LyXXx5phxBCiEmjpVOEEEJGpKaOBAmabG/PHs21RwghxKBQoEEIIWRkT0ZExMiMhKZYW49sJqc9G4QQYpJo6RQhhJCRjd9TXSr1JFLpSLuEEEJMEs1oEEKIqSstBSIjtdt+eLj22ieEEKKXaEaDEEJM3aFDIylqtYHLBT74QDttE0II0Ws0o0EIIaYuKAioqdFu+1VV2mufEEKIXqJAgxBCTFlfH+DkpFzxW9M4HKC3F7C31941CCGE6B1aOkUIIaaspka7QQYw0n51tXavQQghRO9QoEEIIaZMLDau6xBCCNEbFGgQQoiJkkgkyL1+fXouZmU1PdchhBCiN7SUZoQQQoi+YhgG169fx4kTJzDQ2oo4ABxtXpDDGdkQTgghxKRQoEEIISakuroaaWlpqK+vH/mChQXaHR3h0durvYsGBtJGcEIIMUEUaBBCiAlob29HRkYGbt68Oeq14jlzkFRaCnMtbAqXcTi4HxUFt8FB2Nraarx9Qggh+osCDUIIMWKDg4M4c+YMLl26BJlMNuYxORERWFFSopXrmzMMjlhbo+0Xv8DSpUvB5/Mxe/ZsrVyLEEKIfqE6GoQQYoRkMhlycnJw+vRpDAwMPPH4/d98g7DmZs3OanC5AJ+P3vR05ObmIjs7Gz09PQgKCgKfz8f8+fPB1VZFckIIITpHgQYhhBgRhmFw584dHD9+HK2trZM+z7W3F2+kpcFCJtPcxnBra6C0FPD3BzAS/Ny+fRsCgQCVlZVwdHREYmIiEhIS4OzsrKmrEkII0RMUaBBCiJFoampCWloaKioqVDo/rrwc38vJ0VyHUlOBPXvGfKm5uRkCgQBXr16FRCLBwoULwePxEBQUBA5HqzmwCCGETBMKNAghxMD19PTg1KlTyM/Phzq3dGdnZ/ygpwc+H36ofqcOHgRee+2Jhw0NDSE/Px9CoRCtra2YPXs2eDwelixZAiuqvUEIIQaNAg1CCDFQYrEYFy5cwIULFzA8PKxyO5aWllizZg2Sk5NHHu5TU4FXXwWk0pGPyeJyRz7ef3/cmYzxMAyDsrIyCIVC3LlzB9bW1oiLi0NSUhI8PDym+B0RQgjRBxRoEEKIgWEYBvn5+Th16hR6enpUbofD4WD58uXYtGnT6D0SdXXA3r1AZuZI8DBRwKF4PTkZOHyY3ZOhqo6ODuTk5CA3NxcDAwOIiooCj8dDVFQULasihBADQoEGIYQYkIqKCqSlpaGpqUmtdsLCwrBjxw7MmTNn4gNLS4FDh4CzZ4GaGuDRXxkczkgxvnXrgH37gPBwtfr0OIlEguvXr0MgEKCxsRFubm7g8XhYvnw57OzsNHotQgghmkeBBiGEGIDW1lYcP34ct2/fVqsdT09P7NixA3Pnzp367EB/P1BdDYjFgJUVEBQ0LRW/GYZBXV0dhEIhbty4AQ6HgyVLloDP5z85UCKEEKIzFGgQQogeGxgYwOnTp5GdnQ25XK5yO3Z2dti0aRMSEhJgbm6uwR5Or97eXuTm5iInJwfd3d0IDAwEn8/HggULqCYHIYToGQo0CCFED0mlUggEApw5cwaDg4Mqt8PlcrFixQqsW7cOtra2GuyhbsnlcrYmR0V
FBdXkIIQQPUSBBiGE6BGGYVBUVITjx4+jo6NDrbYWLVqEbdu2wc3NTUO900/Nzc3Izs5Gfn4+JBIJFixYAD6fTzU5CCFExyjQIIQQPVFfX4+0tDRUV1er1Y6fnx+efvppBAYGaqhnhmFoaAgFBQUQCARobW3FrFmzwOfzqSYHIYToCAUahBCiY11dXThx4gSuXbumVjszZszAtm3bEBMTY9Ij+QzDoLy8HAKBgK3JsXz5cvB4PKrJQQgh04gCDUII0RGRSIRz584hKysLEolE5Xasra2xbt06rFy5EhYWFhrsoeHr7OxETk4OLl++jIGBAURGRrI1OczMzHTdPUIIMWoUaBBCyDSTy+XIy8vDqVOn0NfXp3I7HA4HCQkJ2LRpExwcHDTYQ+MjkUhQWFgIgUCAhoYGuLm5ISkpCXFxcVSTgxBCtIQCDUIImUYlJSVIT09Hc3OzWu1ERkZix44d8Pb21lDPTEd9fT0EAgEKCwvZmhw8Hg8+Pj667hohhBgVCjQIIWQaNDc3Iz09HSUlJWq14+3tjR07diAyMlJDPTNdfX19yM3NRXZ2Nrq7uxEQEAA+n4+FCxdSTQ5CCNEACjQIIUSLent7cfr0aVy+fBnq3G4dHBywefNmxMXF0d4CDVPU5BAKhSgvL4ejoyPi4+ORmJgIFxcXXXePEEIMFgUahBCiBRKJBFlZWTh37hxEIpHK7VhYWGDVqlVYu3YtrK2tNdhDMpaWlhYIhUK2Jsf8+fPB5/MRHBxs0pm8CCFEFRRoEEKIBjEMg8LCQmRkZKCrq0uttpYuXYotW7ZgxowZGuodmSyRSMTW5Hjw4AG8vb3B5/OxdOlSqslBCCGTRIEGIYRoSE1NDf71r3+hvr5erXaCgoKQkpICPz8/jfSLqI5hGFRUVEAgEOD27duwsrJCXFwckpKS4OnpqevuEUKIXqNAgxBC1NTR0YGMjAzcuHFDrXbc3Nywfft2LFiwgJbp6KGuri62Jkd/fz8iIiLA5/OpJgchhIyDAg1CCFHR4OAgzp49i0uXLkEqlarcjo2NDTZu3Agej0fZjgyARCLBjRs3IBAIUF9fD1dXVyQlJSE+Pp5qchBCyCMo0CCEkCmSyWTIycnB6dOnMTAwoHI7ZmZm4PF42LhxIz2gGqjHa3IsXrwYPB4Pvr6+uu4aIYToHAUahBAySQzD4O7du0hPT0dra6tabc2bNw/bt2+ndf5Goq+vD3l5ecjOzkZXVxcCAgLA4/GwaNEimqUihJgsCjQIIWQSmpqakJ6ejvLycrXamTNnDlJSUhAaGqqhnhF9IpfLcefOHQiFQpSVlcHBwQEJCQlUk4MQYpIo0CCEkAn09PTg1KlTyM/PV6vgnrOzMzZv3ozY2FjD3Tjc3w9UVwNiMWBlBQQFAfb2uu6V3mppaUF2djby8/MxPDyM+fPng8fjISQkhDb7E0JMAgUahBAyBrFYjMzMTJw/fx7Dw8Mqt2NpaYk1a9YgOTnZMOsvlJYChw4BZ84AtbXAo78yOBwgIABYvx545RUgIkJ3/dRjipocQqEQLS0t8PLyAp/PR2xsrGG+JwghZJIo0CCEkEcwDIOCggKcPHkSPT09KrfD4XCwbNkybN68Gc7Ozhrr37SpqwP27gUyMwEuF5goq5bi9eRk4PBhwN9/+vppQBQ1OYRCIW7dugUrKyssW7YMfD6f9uoQQowSBRqEEPKtiooKpKWloampSa12QkNDkZKSgjlz5mioZ9MsNRV49dWR4GEqaXu53JGP994DXnpJe/0zAoqaHLm5uejr60N4eDj4fD7mzp1ruEvrCCHkMRRoEEJMXmtrK44fP47bt2+r1Y6npyd27NiBuXPnGu4a/IMHgQMH1G/nzTeB119Xvx0jJ5VK2ZocdXV1bE2OuLg42NP+F0KIgaNAgxBisgYGBvD1119DKBRCLper3I6dnR2eeuopJCYmwtzcXIM9nGapqcDLL2u2vT17NNeekWtoaIBQKMS1a9cAAIs
XLwafz6eaHIQQg0WBBiHE5EilUgiFQnzzzTcYHBxUuR1zc3OsXLkS69atg62trQZ7qAN1dSObuUUizbVpbT2ymZz2bExJf38/8vLyIBQK0dXVBX9/f/D5fKrJQQgxOBRoEEJMBsMwKCoqQkZGBtrb29Vqa+HChdi2bRvc3d011DsdW70aEAimtifjSbhcgM8HLlzQXJsmRC6X4+7duxAIBGxNjvj4eCQlJVFNDkKIQaBAgxBiEurr65GWlobq6mq12vHz80NKSgqCgoI01DM9UFoKREZqt/3wcO21bwIePHgAoVCI/Px8iMVitiZHaGio4e4HIoQYPQo0CCFGrbu7GydOnMDVq1fVamfGjBnYtm0bYmJijO/Bbv9+4IMPNDubocDlAvv2Ae++q/m2TZBIJMLVq1chEAjYmhw8Hg+xsbGwtrbWdfcIIUQJBRqEEKMkEolw/vx5ZGZmQiKRqNyOlZUV1q1bh1WrVsHCwkKDPdQjQUFATY1226+q0l77JohhGFRVVUEgEODWrVuwtLTEsmXLwOPxMHPmTF13jxBCAFCgQQgxMnK5HHl5efjqq6/Q29urcjscDgcJCQl46qmn4OjoqMEe6pm+PsDJSbnit6ZxOEBvL0DpWrWiu7sbOTk5uHz5Mvr6+hAWFgY+n4/o6GiqyUEI0SkKNAghRqO0tBTp6em4f/++Wu1ERkZix44d8Pb21lDP9NitW8CCBdq/TlERMH++9q9jwhQ1OYRCIWprazFjxgy2JoeDg4Ouu0cIMUEUaBBCDF5LSwvS09NRXFysVjve3t7YsWMHIrW5MVrfXL0KxMZq/zoFBcDSpdq/DgEwuiZHTEwM+Hw+/Pz8dNsxQohJoUCDEGKw+vr68NVXXyE3N1etgnsODg7YvHkz4uLiTG+pCc1oGLWBgQHk5uYiOzsbnZ2d8PPzY2tyGO2eI0KI3qBAgxBicCQSCS5evIizZ89CpEaBOS6Xi+TkZKxdu9Z0M/b09wOOjrRHw8jJ5XIUFxdDIBCgtLQU9vb2SEhIQGJiImbMmKHr7hFCjBQFGoQQg8EwDAoLC3HixAl0dnaq1daSJUuwZcsWuLq6aqh3BoyyTpmU1tZWZGdnIy8vD2KxGPPmzQOfz6eaHIQQjaNAgxBiEGpra5GWloba2lq12gkMDMTTTz9Na9UfpcU6GjIOB/Xr18Pl//6PRs71jFgsZmtyNDc3Y+bMmeDxeFi2bJnpzvARQjSKAg1CiF7r6OjAiRMnUFhYqFY7bm5u2L59OxYsWECjto/TcmXw//fd76LRzo6qWeupx2tyWFhYsDU5vLy8dN09QogBo0CDEKKXBgcHcfbsWVy6dAlSNUbabWxssGHDBvD5fHC5XA320HjIZDJ0L1kC19u3wZHJNNcwlwvw+RCfPq00ck7VrPVXd3c3Ll++jJycHLYmB4/Hw7x580wvUQIhRG0UaBBC9IpMJsPly5dx+vRp9Pf3q9yOmZkZkpKSsHHjRtjTJuRxtba2Ijc3FysDAuC8fDmgxub6UaytR2ZL/P0BjIycV1dXQyAQoKioiEbO9ZhUKsXNmzchEAhQW1sLFxcXJCUlIT4+nmpyEEImjQINQoheYBgGd+/exfHjx/HgwQO12oqOjsb27dsxc+ZMDfXO+DAMgytXrkAikSAxMXFktDo1FXj5Zc1dJDUV2LNnzJd6enrYata9vb00cq7HGhsb2ZocDMNQTQ5CyKRRoEEI0bl79+4hLS0N5eXlarUzZ84c7NixA2FhYRrqmXHq7e1FVlYWFi9ejDlz5ii/ePAgcOCA+hc5eBB47bUnHiaVSlFUVASBQICamhoaOddjAwMDyMvLQ3Z2Njo6OuDr6ws+n4+YmBiqyUEIGRMFGoQQnXn48CFOnTqFK1euQJ1bkZOTE7Zs2YLY2FgaDX+CO3fu4P79+1i1atX4D4epqcCrr45koZrK/hgud+Tj/ffHncmYSFNTEwQCAY2c6zlFTQ6hUIiSkhLY2dkhPj4eSUl
JlC6aEKKEAg1CyLQbHh5GZmYmzp8/D7FYrHI7lpaWWL16NVavXg0rKysN9tD4iMViXLhwAUFBQQgPD3/yCXV1wN69QGbmSPAwUcCheD05GTh8mN2ToarHR879/PzA4/Fo5FwPKWpyXLlyBSKRCNHR0eDz+QgLC6PMYoQQCjQIIdOHYRhcvXoVJ06cQE9Pj8rtcDgcLFu2DJs3b4azs7PG+mesamtrcefOHSQnJ8POzm5qJ5eWAocOAWfPjhT1e/RXBocDBAYC69YB+/YBkwlgpkAul6OkpAQCgYAdOVdUs6aRc/0iFotx7do1CAQC3L9/H56enuDz+VSTgxATR4EGIWRaVFZWIi0tDY2NjWq1ExoaipSUlNF7C8goMpkMAoEAjo6OWLx4sfojzP39QHU1IBYDVlYjFb+nKaNXW1sbW82aRs7111iZxWJjY8Hj8eDt7a3r7hFCphkFGoQQrWpra8Px48dx69Yttdrx9PTE9u3bER0dTQ+Wk9DW1obLly+Dx+MZ1ej/4yPnVM1af/X09LA1OXp7exEaGgo+n0+ZxQgxIRRoEEK0YmBgAN988w0EAgHkcrnK7djZ2eGpp55CYmIizM3NNdhD48QwDPLz8yEWi5GUlGS0D3SKkXOhUIibN29STQ49NlZmscTERCQkJFBmMUKMHAUahBCNkkqlEAqF+OabbzA4OKhyO+bm5lixYgXWr18PW1tbDfbQePX19SEzMxMxMTHw8fHRdXemDY2cG47HM4stWrQIPB4P/v7+NFNJiBGiQIMQohEMw+DWrVvIyMhAW1ubWm0tXLgQ27Ztg7u7u4Z6Z/zu3r2LpqYmrFq1CpaWlrrujk7QyLnhGBgYwJUrVyAUCtmaHDweD4sXLzaozGI5OTl4++23cePGDbS0tODEiRPYsmWLrrtFiN6gQIMQoraGhgakpaWhqqpKrXb8/PyQkpKCoKAgDfXM+InFYmRmZsLf3x+RkZG67o7eaGpqglAoxNWrV9mRc0VNDho51x+KzGJCoRDFxcUGV5Pj7NmzyMvLw6JFi7Bt2zYKNAh5DAUahBCVdXd348SJE7h69apa7bi4uGDr1q1YsmQJPQROQX19PYqKipCcnAz7acr+ZGiMZeTcFCgyi125cgVDQ0OIjo4Gj8dDeHi4QdwXOBwOBRqEPIYCDULIlIlEIpw/fx6ZmZmQSCQqt2NlZYV169ZNXKWajCKXyyEQCGBnZ4elS5caxEOYrjEMw9bkMMSRc1OiyCwmFApx7949eHp6spnFbGxsdN29cVGgQchoFGgQQiZNLpfjypUrOHXqFHp7e1Vuh8PhID4+Hps2bYKjo6MGe2j82tvbkZOTg6SkJLi5uem6OwZprJFzqsmhf8bKLLZ06VLw+Xy9rMlBgQYho1GgQQiZlLKyMqSlpeH+/ftqtRMREYGUlBS9fFDQZ4qq6oODg+DxeJRNSQMMdeTcFD2eWSwkJITNLKYvaa8p0CBkNAo0CCETamlpQXp6OoqLi9Vqx9vbGzt27KANyyro7+9HZmYmFi5cCF9fX113x+gwDIOamhoIBAJ25JyqWesnqVSKW7duQSAQoLq6Gs7OzkhKSkJ8fLzOZ0cp0CBkNAo0CCFj6uvrw+nTp3H58mW1Cu45ODhg06ZNiI+Pp1F4FZSUlKC+vh6rVq2ClZWVrrtj9B4+fIjLly8jOztbb0fOyYh79+5BKBSioKAAcrmczSymq5ocFGgQMhoFGoQQJRKJBJcuXcKZM2cgEolUbofL5SI5ORlr166FtbW1BntoGoaHh5GZmQlfX19ERUXpujsmRzFyLhQKUVVVpVcj50TZ4OAgrly5AoFAgI6ODvj4+IDP509LZrH+/n5UV1cDABYsWIA///nP4PP5mDFjhkkVzSRkPBRoEEIAjCwfuXHjBjIyMtDZ2alWW4sXL8bWrVspm4+KGhsbcePGDaxatYoKzemBx0fOY2JiqJq1Hno0s1hJSQlsbW0RFxen1cQJQqEQfD5/1Nd
feOEFHDlyRCvXJMSQUKBBCEFtbS3S0tJQW1urVjuBgYFISUmBv7+/hnpmWuRyObKzs2FtbY3Y2Fh6iNUzipFzoVCI9vb2aR05J1PT3t6O7Oxs5OXlYWhoCHPnzgWPx0NERAT9XBEyjSjQIMSEdXR04MSJEygsLFSrHTc3N2zfvh0LFiygX+Iq6ujoQHZ2NhISEuDh4aHr7pAJKEbOFdWsp2PknKhmeHgY165dg0AgwL179+Dh4cFmFrO1tdV19wgxehRoEGKChoaGcPbsWVy8eBFSqVTldmxsbLB+/XqsWLECXC5Xgz00HQzD4Nq1a+jr68OKFStow7yBGWvknM/nG0w1a1PBMAxqa2shEAhw48YNcLlcNrPYrFmzdN09QowWBRqEmBC5XI6cnBycPn0a/f39KrdjZmaGpKQkbNy4Efb29hrsoWkZGBhAZmYm5s2bR8vNDNzw8DCuX7+OS5cu0ci5nlNkFsvJycHDhw8RHBwMPp+P+fPnU2YxQjSMAg1CTADDMCguLsbx48fR0tKiVlvR0dHYvn07Zs6cqaHemaaysjLU1NQgOTmZ0tYaERo5NxwymQxFRUVKmcUSExORkJBAmcUI0RAKNAgxcvfu3UN6ejrKysrUamf27NlISUlBWFiYhnpmmiQSCTIzMzF79mxER0frujtT098PVFcDYjFgZQUEBQE0ozWux0fOQ0JCwOPxaORcDykyi129ehUymQwLFy4En89HQEAALYEjRA0UaBBipB4+fIhTp07hypUrUOfH3MnJCVu2bEFsbCztH1BTU1MTrl+/jlWrVhnOiGlpKXDoEHDmDFBbCzz6XuJwgIAAYP164JVXgIgI3fVTj9HIueEYHBxEfn4+hEIh2traMGfOHDazmKWlpa67R4jBoUCDECOjKPR2/vx5iMVilduxsLDAmjVrsHr1alraoybF3hhLS0ssW7bMMEZI6+qAvXuBzEyAywUmShqgeD05GTh8GKD9JuOikXPDwDAMSktLIRAIUFxcDBsbG8THx1NmMUKmiAINQowEwzC4evUqTpw4gZ6eHpXb4XA4iI2NxZYtW+Ds7Kyx/pmqzs5OCIVCxMfHw9PTU9fdmZzUVODVV0eCh6lkJeNyRz7eew946SXt9c8I0Mi54VCkns7NzcXQ0BCioqLA5/OpJgchk0CBBiFGoLKyEunp6WhoaFCrnZCQEKSkpMDHx0dDPTNdDMOgsLAQPT09WLFiheGsyT94EDhwQP123nwTeP119dsxcoqRc6FQiLt379LIuR5TZBYTCARoamqCh4cHkpKSsHz5csosRsg4KNAgxIC1tbUhIyMDRUVFarXj4eGBHTt2IDo6mkboNGBwcBAXLlzA3LlzERgYqOvuTF5qKvDyy5ptb88ezbVn5Gjk3DA8mlns5s2bMDc3x9KlS8Hj8TB79mxdd48QvUKBBiEGaGBgAN988w2EQiFkMpnK7djZ2WHjxo1ITEykgnsaUl5ejqqqKiQnJ8Pa2lrX3Zm8urqRzdwikebatLYe2UxOezamhEbODUdvby+bWaynpwfBwcHg8XhYsGCB4cxiEqJFFGgQYkCkUimys7Px9ddfY3BwUOV2zM3NwefzsWHDBnpw0RCJRIKsrCx4e3tj3rx5uu7O1K1eDQgEU9uT8SRcLsDnAxcuaK5NE6IYORcKhbhx4waNnOsxmUyGW7duQSgUorKyEk5OTmxmMScnJ113jxCdoUCDEAPAMAxu376N48ePo62tTa22FixYgG3btsHDw0NDvSP379/H1atXsXLlSsN8qCgtBSIjtdt+eLj22jcBNHJuOO7fvw+hUIiCggJIpVIsWrQIPB4PgYGBtASOmBwKNAjRcw0NDUhLS0NVVZVa7fj6+iIlJQXBwcEa6hlhGAY5OTkwNzdHXFyc4T5E7N8PfPCBZmczFLhcYN8+4N13Nd+2CZLJZLh9+zYEAgEqKyvh7OyMhIQEGjnXQ49nFps9ezb4fD6WLFlCmcWIyaBAgxA
91d3djZMnT6KgoECtdlxcXLB161YsWbLEcB+E9VB3dzcuXbqE5cuXw8vLS9fdUYlMJkNnZyecYmJg1dSkvQsFBQFqBspktLFGzqkmh/4ZK7NYXFwckpKS4O7uruvuEaJVFGgQomfEYjHOnz+PCxcuQCKRqNyOlZUV1q5di1WrVtHomYbduHEDnZ2dWLFihd5vopdIJOjo6EBbWxva29vR3t6OtrY2tLW1oaurCxYiEf565Ai0+ljK4QC9vYC9vTavYrJo5NxwKDKL5eXlYXBwEJGRkeDz+YiMjKTgkBglCjQI0RNyuRz5+fk4efIkent7VW6Hw+EgPj4emzZtgqOjowZ7SAYHB5GZmYmIiAi9WoImFouVgohHg4menh5MdJuf3dGBX2dkaL+TRUXA/Pnav44JYxgGZWVlEAgENHKu5yQSCa5fv45Lly6hqakJ7u7u4PF4lFmMGB0KNAjRA2VlZUhPT8e9e/fUaic8PBwpKSmYNWuWhnpGFCorK1FeXo7Vq1frJG3t0NCQUhDx6J8PHz5UuV2/tjb86uRJzXV0PAUFwNKl2r8OAUAj54aCYRjU1dVBKBSisLAQZmZmWLp0Kfh8PmUWI0aBAg1CdKilpQXHjx/H3bt31WrHy8sLO3bsoIcILZBKpbh48SI8PDywYMECrV2HYRgMDAyMWuKk+LO/v18r16UZDeOmGDkXCARobGykkXM91tvbi9zcXGRnZ6OnpwdBQUHg8/mYP3++3i/RJGQ8FGgQogN9fX34+uuvkZOTA7lcrnI7Dg4O2LRpE+Lj42FmZqbBHhIAaG5uRn5+PlauXAlnZ2e122MYBn19feyypseDiaGhIfU7PUWDbW04evIktPnuYTgcdNfXY4aPjxavQiYy1sh5bGws1eTQQ49nFnN0dGRrcmjiPkTIdKJAg5BpJJFIIBAI8M0330CkRgVmLpeLVatWYe3atbCxsdFgDwkw8lCWm5sLAIiPj5/SLBHDMOjp6RkzmGhvb4dYLNZWt6dEJpOhrq4Ozc3NOFdTA181Eg88SZujI3797LPw8vJCZGQkIiMjERwcDAsLC61dk4xvvJFzqsmhf5qbm9nMYhKJBAsXLgSPx0NQUBDNXhODQIEGIdOAYRjcuHEDGRkZ6OzsVKutxYsXY+vWrXB1ddVQ78ijenp6cPHiRSxbtgze3t5jHiOXy9HV1TXungmpNupRaFB/fz/Ky8sxNDQEKysrvPbgAbY+eACtLM7gciF5+WXcfeklFBcXo7S0FN3d3bCwsEBoaCgiIiIQFRUFDw8PenCaZnK5HLdu3WJHzp2cnNiaHDRyrl+GhobYzGKtra2YPXs2eDwelixZAisrK113j5BxUaBBiJbV1tYiLS0NtbW1arUTEBCAlJQUBAQEaKhn5HFFRUVoa2vDypUrAQCdnZ1KGZwUf+/o6FBrydt0Mjc3h5ubG9zd3eHm5oaGhgYUFRXBysoKVlZWMDMzg1d3N95IS9NeJx6pDM4wDFpaWlBSUoKSkhJUVVVBKpXC1dUVkZGRiIqKQmhoqE423JuysUbO+Xw+VbPWMwzDoLy8HAKBAHfu3IGNjQ2WL1+OpKQkeHh46Lp7hIxCgQYhWtLZ2YkTJ07g+vXrarXj6uqKbdu2YdGiRfQLX8MkEgna29tx7949nDt3Dra2tuByuWhvb0dnZ+eEaWH1iYWFBdzd3dkPDw8PeHh4wN3dHTNmzICZmRk6Ojrw6aeforq6esw29n/zDcKam2Guye+ZywX4fODChXEPEYvFqKqqQnFxMUpKStDW1gYzMzMEBQWxy6xmz55N7/1pQiPnhqOzsxPZ2dnIzc3FwMAAoqKiwOPxEBUVRT8vRG9QoEGIhg0NDeHs2bO4ePGiWktorK2tsWHDBvD5fFrLrgaRSMTuj3h8dqK7uxsPHz5Ed3c3Zs+erdeZXaysrNgg4vFgwtnZedwHC4ZhUFBQgC+++GLCfUGuvb14Iy0NFjKZ5or3WVuPzGb4+0/6lPb
2dpSUlKC0tBTl5eUQi8VwdHRkg47w8HDYU+E/raORc8PxeGYxNzc3NrOYnZ2drrtHTBwFGoRoiFwux+XLl/HVV1+plYrUzMwMiYmJ2LhxIxwcHDTYQ+M1ODg4ZrG69vb2cYsfyuVy3L9/H9bW1npTzMzGxkYpgHj07w4ODlMepRwYGMA//vEP3Lx5c1LHx5WX43s5Oap0fWypqcCePSqfLpVKUVNTwy6zunfvHjgcDnx9fREVFYXIyEj4+flRxjUtG2vknGpy6J9HM4vduHEDHA4HS5YsAZ/Px5w5c3TdPWKiKNAgRE0Mw6CkpATp6eloaWlRq63o6Ghs27YNXl5eGuqdcWAYBv39/eMGEwMDA1Nqb3BwEK2trfD29p725SAODg5KS5weDShsbW019uBWWlqKI0eOTLmY37qbN7GlsBAMoN7MxsGDwGuvqdPCKD09PSgtLWVnPAYHB2Fra4vw8HB2xoM2MWuPYuRcKBSioaGBRs71mCKzWE5ODrq7uxEYGMhmFtPnmVtifCjQIEQN9+/fR1paGsrKytRqZ/bs2dixYwfCv90wa4oYhsHDhw/HLFbX1tamVjrgR6/x4MEDAMDMmTO1Nhrr5OSkFEQ8+qe20xFLJBJkZGTg0qVLKp0fExOD7w0Pw+pnPwOk0pGPyeJyRz7ef1+tmYzJkMvlqK+vZ4OOuro6MAyDWbNmsUFHUFAQPVRpAcMwqK+vh0AgoJFzPSeXy9maHBUVFVSTg0w7CjQIUUFvby9OnTqFvLw8tTYMOzo6YsuWLVi2bJlJLP9gGAbd3d3jpoUdHh7W2rWHh4dx//59eHh4qD36yuFw4OLiMiqIUHzoatNsU1MTPv74Y5Vm1qytrfGd73wHS5YsGQnA6uqAvXuBzMyR4GGigEPxenIycPjwlPZkaMrAwADKyspQUlKC4uJi9Pb2wtLSEmFhYWzgoS9L5IxJX18fW5ODRs71W3NzM7Kzs5Gfnw+JRIIFCxaAz+dTTQ6iVRRoEDIFw8PDyMrKwrlz59QqvGZhYYE1a9Zg9erVRpfJRS6Xo7Ozc8xgoqOjQyc1Jjo7OzE4OIhZs2ZNOqAzMzODq6vrmLMSbm5uerVBXy6XIzMzE6dOnYJMJpvy+cHBwXjxxRfHrs1SWgocOgScPQvU1ACP/srgcIDAQGDdOmDfPjaFra4xDIP79++zezuqq6shk8ng7u7OBh2hoaFG97OnSzRybjiGhoZQUFAAgUCA1tZWzJo1C3w+nzKLEa2gQIOQSWAYBteuXcOJEyfQ3d2tVluxsbHYsmULXFxcNNS76SeVStHR0aFU8Vrxd32qMSGTyXDv3j04OTmN+bCjqDHx+AZsd3d3uLq6GkSV5M7OThw5cgSVlZVTPtfc3BybN29GcnLy5AKw/n6guhoQiwErKyAoCDCADFAikQgVFRVs4NHR0QEul6uUQtfb25tGdTXk8ZFzqmatnx7PLGZtbY3ly5eDx+NRZjGiMRRoEPIEVVVVSEtLQ0NDg1rthISEYMeOHfD19dVQz7RreHiYDSYen53o6urS+xoTvb296Orqgr+/P7y8vJSCCUVA4eLiYrBL1hTB77Fjx1Tav+Ll5YU9e/aY3Jp6hmHYFLrFxcWoqKiARCKBs7OzUgpdW1tbXXfV4IlEIuTn59PIuQHo7OxETk4OLl++jIGBAURGRrI1OQz1Hkn0AwUahIyjra0NGRkZKCoqUqsdDw8P7NixA9HR0Xo3mqeoMTFWMNHT06Pr7k2alZWV0rKmxsZGzJkzBytXrpywxoShGhwcxOeff47CwkKVzufz+di+fbteLf/SFYlEgurqana2o7m5GRwOB/7+/mylch8fH3rYUgONnBsOiUSCwsJCCAQCNrNYUlIS4uLiKLMYUQkFGoQ8ZnBwEN988w0EAoFK690VbG1tsXHjRiQlJel0U+TAwMCYG6/b2trQ19ens35Nla2t7Zj1JTw8PGBvbw8Oh4PW1lbk5uaCx+ONvd/ACJSXl+P
TTz9VKRB0cnLCCy+8gMjISM13zEh0d3ezQUdZWRmGhoZgZ2eHiIgIdsbD0dFR1900WMY2cv773/8eGRkZKC8vZ4sa/uEPf0BoaKiuu6Y2RWaxwsJCNrMYj8eDj4+PrrtGDAgFGoR8SyqVIjs7G998882U6zI8ytzcHHw+H+vXr5+WESBFjYmx6ku0tbVhcHBQ633QFAcHh1HLmxSfT/RvyTAMrly5AolEgsTERIN8YHkSiUSCkydPIisrS6XzFyxYgJ07d9Ko5BTI5XLU1dWhuLgYJSUl7PLJOXPmsEFHQEAAZVdSgUQiwY0bN3Dp0iWDHjlfu3Ytnn32WSxevBhSqRSvvfYaiouLUVpaalDfx0QezywWEBAAPp+PhQsX0nufPBEFGsTkMQyD27dv4/jx42hra1OrrQULFmDbtm0aXw6gqDExXjChTgas6ebs7DxmsTp3d3dYW1tPub3e3l5kZWVh8eLFRrvf4N69e/j444/R3Nw85XOtrKzw7LPPYtmyZUa3hGy69fX1sSl0S0pK0NfXB2tra4SGhrKVyo11Jk2bxho5N9SaHO3t7fDw8EB2djYSExN13R2NUmQWEwqFKC8vh6OjIxISEpCYmEiZxci4KNAgJq2xsRFpaWkqZex5lK+vL1JSUhAcHKxyG3K5XKnGxOMBhUQiUauP04XD4WDGjBljBhNubm6wtLTU2LXu3LmD+/fvY9WqVUa534BhGGRlZeHkyZMqpQUODAzE7t274ebmpoXemTaGYdDU1MQGHTU1NZDL5fD09GSDjpCQEKN8X2qLMdTkqK6uRnBwMO7evYuoqChdd0drWlpaIBQK2cxi8+fPB5/PR3BwMA1oECUUaBCT1N3djZMnT+Lq1atqZU9ycXHB1q1b/13k7AlkMhk6OzvHrHzd0dGh1p6Q6WRmZgY3NzelJU6KP93c3LT+UCAWi5GZmYnAwECjrabe3d2NTz/9FBUVFVM+18zMDJs2bcKaNWuMchmZPhoaGkJ5eTkbeHR1dYHL5SIkJIRdZqXNavTGRC6X486dOxAIBAY1ci6Xy7Fp0yb09PQgNzdX192ZFiKRiK3J8eDBA3h7e4PP52Pp0qWUWYwAoECDmBixWIwLFy7g/Pnzas0QWFlZYe3atVi1atWoEXqJRIKOjo4xg4muri69qTHxJFwul60x8XgwMWPGDJ3VmKitrcWdO3eQnJxsNGugH3f9+nUcO3ZMpf01np6e2LNnj8GkUTZGDMPgwYMHKC0tRUlJCSoqKiCVSjFjxgw26AgLC4ONjY2uu6r3DGnkfN++fTh79ixyc3Mxe/ZsXXdnWjEMg4qKCggEAty+fRtWVlaIi4tDUlISPD09dd09okMUaBCTIJfLkZ+fj1OnTuHhw4cqt8PhcBAXF4e1a9dCLBYrBROKv3d3d+t9jQkFCwuLMYvVubu7612NCblcjkuXLsHR0RGLFy/Wu4cMTRgcHMQ///lPXLt2TaXzeTwetm/frtHlaUR9w8PDqKqqYmt3tLa2wszMDIGBgYiMjERERAR8fHyM8j2tKfo+cv7DH/4Qp06dQk5ODvz9/XXdHZ3q6upiM4v19/cjIiICfD7fYDOLEfVQoEGMXnl5OdLS0nDv3r0pnSeVSiESiTA0NIShoSG4uLggICAAw8PDagUr083a2nrMWQl3d3c4OTkZxMNNW1sbLl++bNRpaysrK/HJJ5+oVHne0dERL7zwglGvCTcmnZ2dSil0xWIxHBwc2BS6ERERcHBw0HU39ZJi5FwoFOLWrVs6HzlnGAavvvoqTpw4AaFQqNY+PWOjyCwmEAhQX18PV1dXJCUlIT4+3mhno8loFGgQo/XgwQMcP34cd+7cGfN1hmEglUoxNDSkFFAo/q5YWmVra4uAgAC4uLjo7UO5nZ3dmPUl3N3d2RoThohhGOTn50MsFiMpKckoR8OkUilOnTqFzMxMlWbC5s2bh507d9KDqYGSSqWora1FaWkpiouL0dTUBA6HAx8fH6U
Uusb43leXPoycf//738exY8dw6tQppdoZTk5OtDTuEfX19RAKhbh+/To4HA4WL14MHo9HSzxNAAUaxOj09/fj9OnTyMnJgUwmg0QiUQoiHg0qJsrkY2FhAT8/P73ZwOno6DgqmFB8GOPoUF9fH7KysrBo0SKjLRDV3NyMjz/+eMqzbcDIPqFnnnkGy5cv14v3J9GM3t5eNugoLS3FwMAAbGxsEB4ezgYeLi4uuu6mXtHlyPl4P3uffvopdu3apdVrG6K+vj7k5eUhOzsbXV1dCAgIAI/Hw6JFiwwmsxiZGgo0iMFjGAY9PT1oaWnBuXPncOnSJTx8+JANKKaaycnMzAyzZs3CnDlzpv3G5+LiMmaxOlVrTBiq4uJiNDY2jrnZ3hgwDINLly4hIyNDpbS1AQEBePHFFzVer4XoF7lcjsbGRnaZVW1tLRiGgZeXFyIjIxEVFYWgoCBKofuIsUbO+Xy+0Q5WGCpFZjGhUIiysjI4ODiwmcUokDYuFGgQgyCXy9HV1TVmsbr29na0tLSgrq4OIpFIreu4u7vD399faw/1ihoTYxWrc3d3N/kHBrFYjKysLPj5+SEyMlLX3dGKnp4eHDlyBGVlZVM+18zMDBs2bMD69etpKY0JGhwcVCoY2NPTAwsLC4SGhrKzHR4eHjTDBRo5NyQtLS3Izs5Gfn4+hoeHMX/+fPB4PISEhNB72QhQoEH0hlQqHbPGRHt7+7g1Jvr6+lBTU4Pe3l61ru3o6IiAgAA4Ojqq1Q7w7xoTjwYQioDC1dWVfsmNo76+HkVFRUhOToa9vb2uu6MVN27cwD/+8Q+V0tZ6eHhg9+7dJp/RhoxgGAYtLS0oLi5GSUkJqqurIZVK4ebmxgYdoaGhJjUTOha5XI67d+9CIBDQyLmeU2QWEwqFaGlpgZeXF/h8PmJjY/UisxhRDQUaZFopakw8Xl+ivb0dnZ2dk94MKxKJUF9fj7a2NrX6Y21tDX9/f7i5uU1p5ITL5Y5ZrE5RY4JGmydPLpdDIBDA3t5+0oUPDc3Q0BC++OILFBQUqHR+QkICUlJS6JctGZdYLEZlZSU729HW1gZzc3MEBgaylcpnzZpllD9fkzXWyLm+1uQwZWNlFlu+fDl4PB7V5DBAFGgQjXu8vsSjwURPT49aNSZkMhkaGxtx//59tQrfcblczJkzB7NmzRo3KLC0tBwzLayHhwecnZ3pF5MGtLe3IycnB0lJSXBzc9N1d7SiqqoKn376KTo7O6d8roODA773ve8hOjpaCz0jxqytrU2pYKBYLIajoyOioqIQERGBiIgIo0wiMRmPj5x7e3uDx+PRyLkeUmQWy83NRV9fH8LDw8Hn8zF37lwa0DMQFGgQlQwODo5ZrK6trU3tZUxjUVTabWhowPDwsMrtcDgceHl5wdfXFxYWFrC2toanp+eYsxOOjo4UTGgJwzC4evUqBgYGwOfzjfIXhlQqxenTp3H+/HmVguvo6Gjs3LlTI8v5iGmTSqWorq5mZzvu378PDofD7oWKjIyEn5+fUf4cToRhGFRWVkIgENDIuZ6TSqVsZrG6ujo2s1hcXJzRLrU1FhRoTEF/P1BdDYjFgJUVEBQEGOv7m2EYDAwMjNoroQgmBgYGpq0v3d3dqKmpUWldOzCSptbGxgZBQUFYvXo1wsLC2GDCzs6Ogolp1t/fj8zMTCxYsAB+fn667o5WtLS04OOPP0ZTU9OUz7W0tERKSgoSEhL0771pSjdBI9bT08POdpSWlmJwcBC2trZKBQOdnZ113c1pRSPnhqOhoQFCoRDXrl0DADazmLZrckil/RgaqgbDiMHhWMHGJghcLt3/noQCjScoLQUOHQLOnAFqa4FH/7U4HCAgAFi/HnjlFSAiQnf9VAXDMOjt7R03mFA3g5O6BgYGUFtbO6lKyZaWlrCxsYGNjQ2sra2V/vTz88OOHTsQHh4+Db0mEykpKUF9fT1WrVpllEsUGIaBUCjE8ePH2YKPU+Hn54fdu3f
r12iqMd8ECeRyOerr69nZjvr6ejAMg9mzZ7NBR1BQkMkksaCRc8PR39+PvLw8CIVCdHV1wd/fH3w+X6OZxQYGStHcfAidnWcgEtUCePSRmQNr6wC4uq6Ht/crsLOj+99YKNAYR10dsHcvkJkJcLnARKnuFa8nJwOHDwP6lBSGYRh0d3ePWuKk+FOdZUjaMjw8jIaGBjx48EBpyYmVlZVSAPHo383NzUe14+joiC1btmDZsmU0IqVjw8PDyMrKgo+PD6KionTdHa14+PAhjh49ipKSkimfy+Fw2LS1Y72XdcJYboJkSgYGBtjZjpKSEvT29sLKyopNoRsVFWW0+6ke9/jI+ZIlS6iatR4aK7NYfHw8kpKSVM4sNjRUh8rKvejuzgTABTBRvaOR111ckhESchg2NnT/exQFGmNITQVefXXk9+ZUamlxuSMf770HvPSS9vr3OEWNibHqS7S3t6tUEEwXFDMszc3N7P6JRwOKyQYLFhYWWL16NdasWWOUo+aGprGxEYWFhUhOToaDg4Ouu6MVRUVF+Oyzz1RaUuju7o7du3cjICBACz1TkaHdBIlWMAyDe/fusZXKq6urIZfL4eHhwe7tCAkJMfr77HSMnBPNaG1thVAoxJUrVyAWi9maHKGhoZNeitrcnIrq6lchl0sxcYDxOC7MzLgICnoP3t50/1OgQOMxBw8CBw6o386bbwKvv65+OwqKGhNjBRMdHR1qZWCaTmZmZqNqS7i5uaGpqQlCoRAPHz5Uq/3Y2Fhs2bKF8qPrAblcjuzsbFhbWyM2Nlb/9htogEgkwpdffokrV66odH58fDyefvpp/XpQ09ebINE5kUiEiooKtnZHZ2cnuFwugoODERERgaioKHh5eRnlzzqgnZFzoh0ikQhXr16FQCBga3IoMotNVFumoeEg6urUv//5+78JX1+6/wEUaChJTQVeflmz7e3ZM/njh4eH2RoTjy916urqUist7HSysLBgg4nHq18/XmOiqqoK6enpqK+vV+uawcHBSElJoSltPdHZ2QmhUIiEhAR4eHjoujtaUVNTg08++QQdHR1TPtfe3h47d+7E/PnzNd8xdej6JkgMBsMwaGtrY5dYVVRUQCKRwNnZmV1iFRYWBltbW113VSvGGjnn8/lUzVrPMAyDqqoqNrOYpaUlli1bBh6Ph5kzZyod29ycispKzd3/QkNT4eVF9z8KNL5VVzeyj1GT+5+trUf2UT66XFkkEo1KB6v4e09Pj+YurmVWVlZj1pdwd3efVI2J9vZ2ZGRk4ObNm2r1w8PDA9u3b8e8efPo5q4HGIbB9evX0dvbixUrVhjl3hiZTIavv/4aZ8+eVSn4j4qKwgsvvKB/aWun6yZIjJJEIkF1dTU729HS0gIzMzP4+/uzy6x8fX2N7j6tGDkXCoVobm6e9Mg5mX7d3d3IycnB5cuX2cxiPB4P0dHREIsbcP16BORyzd3/zMyssXhxqcnv2aBA41urVwMCwdSWIz+JuTmDuXM7sH//12ww0dfXp7kLaJmNjY1SAPHonw4ODir9whgcHMQ333wDgUAAmUymct9sbW2xceNGJCUl0RpZPTEwMIDMzEzMmzcP/kb6YNna2oqPP/4YDQ0NUz7XwsICO3bsQFJSkn4+bGnjJsjlAnw+cOGC5tokBqGrq4tNn1taWgqRSAR7e3ulFLp6F2yrICcnB2+//TYKCwvx4MEDvPLKKwAw4cg50S1FZjGhUIja2lrMmDEDq1adh7n5HQCqP5eMxoWLCx/z5pn2/Y8CDYwMuEVGaq/9lJTfwsXlgfYuoAZ7e/txq1/b2tpq7IFIJpMhOzsbX3/9tVo1OMzMzMDn87FhwwaTrWqrj8rKylBTU4Pk5GT92m+gIQzDICcnB2lpaSqlrfX19cXu3bv194FD2zfB0lKA0kubLJlMhrq6OnaZlSJQnzNnDqKiohAZGYmAgAD9ybg2BWfPnkVeXh4WLVqEbdu24cSJE0hKSho1ck41OfR
TQ0MD8vI+h7e39vZTLF5cCjs7073/UaABYP9+4IMPNDuQp8DhyBARkY24uC813/gkOTk5jRlMuLu7w8bGRqvXZhgGd+7cwfHjx9Ha2qpWWwsWLMC2bduMds2/IZJIJMjKysKsWbMQHR2t6+5oRW9vL/7v//4Pd+/enfK5HA4H69atw4YNG/R75k2bN0EuF9i3D3j3Xc23TQxSX1+fUsHAvr4+WFtbIywsjF1m5erqqutuThmHw8GJEyewZcsWAGOPnCtqchhrBj5DVFW1H/fv/x2anc1Q4GLWrH0IDjbd+x8FGhgpbltTo732HR3b8Oyzv9Za+xwOBy4uLmzw8Ggg4e7urrMR5sbGRqSlpaGyslKtdnx8fJCSkoKQkBAN9Yxowr1793Dt2jWsWrXKKJZAjOX27dv47LPPVFry6Obmht27dyMwMFALPdMwbd8Eg4KAqirttU8MFsMwaGxsZIOOmpoayOVyzJw5UymFroWFha67+kSPBxqPerwmR0xMDPh8Pvz8/Ka3k2SUgoIgiETau/9ZWwchNtZ0738mH2j09QFOTsrFbjWPwYsv/ggWFmKVWzAzM8OMGTPG3DPh5uamVzfhnp4enDx5EgUFBWplynJ2dsbWrVuxdOlS/VzTbqLkcjlycnJgYWGB5cuXG+X/jVgsRlpaGi5fvqzS+cuXL8czzzxjGJtBp+MmyOEAvb0AVVYmTzA0NITy8nKUlJSguLgY3d3dsLCwQEhICBt4eHp66uV9Z6JAQ2FgYAC5ubnIzs5GZ2cn/Pz82Joc+vR73FRIpX3IzXWCcsVvTeMgPr4XXK5p3v9MPtC4dQtYsED719m27X/g5nZvwmPMzc3h5uY2ZjDh6uqq9+tXxWIxLly4gAsXLqhVcdzKygpr167FqlWrYGlpqcEeEnV1dXVBIBAgPj4enp6euu6OVtTW1uLTTz9FW1vblM+1s7PDd7/7XSxcuFALPdOS6boJFhUB+pbOl+g1hmHw4MEDdm9HZWUlpFIpXF1d2U3l4eHhehPQTybQUJDL5SguLoZAIEBpaSns7e2RkJCAxMREzJgxQ/udJQCAvr5buHFD+/e/RYuK4OAwX+vX0Ud6vGh4eohVn2SYErl85J9aUWNirD0TLi4uBrlRTC6Xo6CgACdPnlSr4B6Hw8Hy5cuxefNmODk5abCHRBMKCwvR3d2NLVu26H3Qqwq5XI5vvvkGZ86cUakAZkREBF544QU4OztrvnPaNF03wem6DjEaHA4HXl5e8PLywqpVqzA8PIzKyko28Lh8+TLMzMwQGBjI1u6YPXu2Xs52PM7MzAzR0dGIjo5Ga2srsrOzIRAIcO7cOZWqWRPVMMz03Jem6zr6iGY0bk3PYN7Jkw1ISnKCk5OTUd04ysvLkZ6ejqamJrXaCQsLQ0pKCmbPnq2hnhFNGRwcRGZmJqKiogxjv4EK2tra8Mknn6Curm7K51pYWGD79u3g8XiG+bNNMxrEQHV0dKC0tBTFxcUoLy+HWCyGg4MDu8QqPDx8WjddT2VGYyxisZitZk01OaYHzWhon8kHGv39gKMjLU+eqtbWVqSnp+POnTtqtTNz5kzs2LEDUVFRhvmQZuQqKipQWVmJ5ORko/xFxzAMcnNz8a9//Uul5X5z5szBnj174OXlpYXeTZNpuAkyAJpKSjAnPJx+zolWSKVS1NbWsrMdTU1N4HA48PX1RUREBKKiouDv76/xVQP9/f2orq4GMJIZ8c9//jP4fD5mzJgBHx8fldp8vJq1hYUFW5PDoO81ekgq7UduriNoj4b2mHygAWg/4cqsWYNoarIxil+w/f39+Prrr5Gdna3S8hIFe3t7PPXUU0hISDDKZTiGTiqVIisrCzNnzsR8Ix2F7uvrw2effYbbt29P+VwOh4PVq1dj06ZN+p22drK0fBNsd3LCgWeegYODg1LBNkrxSbTl4cOHSil0BwYGYGNjg/DwcERFRSEiIgIuLi5qX0coFILP54/6+gsvvIAjR46
o3X53dzcuX76MnJwc9PX1ISwsDDweD/PmzTPIpdb6iLJOaRcFGtBuCnlACheXL5CYmI6XX34Zq1atMsiCZlKpFJcuXcKZM2cwNDSkcjtcLhcrV67EunXrtF7Dg6jm/v37uHr1KlauXGm0e2Xu3r2Lo0ePqpS2dsaMGdi9ezeCg4O10DMd2b8fzN//Do5MC3nkuVzI9+5F9f797DIXxWizj48Pu8wlICCAHpyIVsjlcjQ2NqK4uBglJSWoq6sDwzDw9vZm339BQUF6nfVJKpXi5s2bEAqFqKmpgYuLC5KSkhAfH08Bu5pG6mh8AEAbD4FUR4MCDWi/KG509LMYHr4Nc3NzBAQEICUlBatXrzaIrD0Mw6CoqAjHjx9HR0eHWm3FxMRg69atcHNz01DviCYxDMNuroyLizOKGbjHicVipKenIycnR6XzY2Nj8eyzzxpVkCwWi3HzH//Aspde0t5FHqsM3tvbywYdj482Kx78NDHaTMhYBgYG2BS6JSUl6OnpgaWlJUJDQ9n3n7u7u97eAxsbG9maHAzDUE0ONQ0MlOL6de09BFJlcAo0AACrVwMCgWZnNTgcGby9y7Fhw7vo7+9HS0sL2traYG5uDn9/fyQlJWHFihWYO3euXo7k1dXVIS0tDTVqLqlQBFcBAQEa6hnRtO7ubly6dAnLly832jXA9fX1+OSTT1SqUG9ra4vnn38eMTExWuiZbjAMg6tXr6KzsxMJCQlw3LFD8zdBLhfg84ELF8Y9RDHarHjoq62tBcMw8PLyYjMJ6ftoMzFcDMOgubmZff9VVVVBJpPBzc0NUVFRiIyMRGhoqF6uRBgYGEBeXh6ys7PR0dFBNTnUcPv2anR3C6DZWQ0uXFz4mDdv/PufKaBA41t1dUBEBCASaapFBubmEqSkvAFHx072q1KpFA8ePEBLSws7wxEYGIikpCTExcXBXg92jHd2duLEiRO4fv26Wu24urpi27ZtWLRokd6ODBHg5s2b6OjowIoVK4xjv8Fj5HI5zp07h9OnT6u0rygsLAy7du0yqhH2iooKlJWVYcmSJfD29h75ouZvgoC19chshr//pE8ZHBxEWVmZ0mizhYWF0mizh4cH3VOIVojFYlRUVLAFAzs6OmBubo6goCD2/Tdr1iy9ev8panIIhUKUlJTA3t4e8fHxSExMhKurq667ZxCGhupw/XoE5HLN3f/MzKyxeHEpbGwmf/8zRhRoPCI1FXj5Zc2197e/ieHmdgoCgWDUAw7DMOju7kZzczPMzMzg7+8PBwcHLF68GHw+H76+vprryCSJRCKcO3cOmZmZkKoxqmltbY3169djxYoVNKqix4aGhnDhwgVEREQY136DR7S3t+OTTz5BbW3tlM/lcrnYunUrVq5cqVcPFepobW1Ffn4+goODETnWelFN3wRTU4E9e1Q+nWEYtLS0sGvrq6urIZVK4ebmxj70hYaGGmVGNKIf2tra2A3l5eXlGB4ehpOTk1IKXTs7O113k9XW1gahUIgrV65AJBIhOjoafD4fYWFhRnMf05bm5lRUVmru/hcamgovL9Xvf8aCAo3HHDwIHDigmXZee23k762trcjIyMCtW7fGPFYkEuHBgwcwNzfHzJkzYWFhAX9/f3YKVNujzHK5HLm5ufjqq69U2hyrYGZmhoSEBDz11FO0OU3PVVZWory8HMnJyUa130CBYRhcuXIFX375JcQqFIqbNWsW9uzZg1mzZmmhd9NvYGAA2dnZcHZ2Rmxs7MRLNbVxE9QQsVisVLBNsRQ1MDCQXeaib6PNxHhIpVJUV1ezsx3Nzc3gcDjw9/dnAw9fX1+9WAotFotx7do1CAQC3L9/HzNnzgSPx8OyZcsoMJ9AQ8NB1NWpf//z9z8IX1/N3v8MFQUaY0hNBV59dWSp8lQG9rnckY/33x97EK+yshJpaWlobGwc83yZTIbe3l7Y2trCwsICZmZmcHBwQHx8PJKSkrSydKOkpATp6elobm5Wq52oqCj
s2LHDaNf3GwupVIqLFy/C3d0dCxcu1HV3tKK/vx+fffbZuIH9RDgcDpKTk7F582ajWEYmlUqRm5uL4eFhJCYmTv4BQ1s3QQ1ra2tjU5hWVFRALBbD0dGRTV8aERGhV6PNxLh0d3ez77+ysjIMDg7Czs5OKamBrjP3MQyD6upqCAQCFBUVUU2OSWhuTkV19auQy6WY2p4NLszMuAgOfp9mMh5BgcY46uqAvXuBzMyR35sT/a5VvJ6cDBw+PPFyZMUGzBMnTqCnp2fcY7hcLlxdXdHe3g6GYcDhcDB//nzweDyEhoaqPWLX3NyM9PR0lJSUqNXOrFmzkJKSgvBw082oYCiam5uRn5+PlStXwtnZWdfd0Yri4mIcPXoUvb29Uz7XxcUFL774IkJDQ7XQs+nFMAxu3bqFe/fuYfny5aqt09bWTVBLHh1tLikpwf3798HhcODn58c+9Pn5+enFaDMxPnK5HHV1dez7r6GhAQzDYPbs2ez7LzAwUKcDGD09PWxNjt7eXoSGhoLP51NNjjEMDdWhsnIvurszAXAxccAx8rqLSzJCQg6b/J6Mx1Gg8QSlpcChQ8DZsyP1rB791+JwgMBAYN06YN8+peyNTzQ8PIzMzEycO3duworEs2bNwuzZs1FRUcEGJl5eXuDxeIiNjZ3yFGhvby+++uor5ObmQp3/ekdHR2zevBnLly+nG5SeU6StBYCEhASjXFYyPDyM48ePQygUqnT+4sWL8Z3vfAe2traa7ZgO1NfXo6ioCAsWLNBMuktt3QS1rKenR6lg2+DgIGxtbZUKBhprwE10r7+/H2VlZWwK597eXlhZWSEsLIwNPHSV6l0qlaKoqAgCgYCtyZGYmIiEhARa9vyYgYFSNDcfQmfn2W+L+j363MSBtXUgXF3Xwdt7n0mnsJ0IBRpT0N8PVFcDYjFgZTVSTFfdJFE9PT346quvcOXKlQkf/GNiYhAYGIiioiJUVlYCGNl0rZgCnTlz5oTXkUgkyMrKwtmzZ1Vas65gYWGB5ORkrFmzhtZ5GoCenh5cvHgRy5Yt+3d2ISPT2NiIjz/+GA8ePJjyuTY2NvjOd76DJUuWaKFn06urqwu5ubmYPXs2FixYoJ2AUhs3wWkgl8tRX1/PjjbX19crjTZHREQgKCjIKJbLEf3DMAzu3bvHvv+qq6shl8vh4eHBpnAOCQmBpaXltPetqakJAoGArcmxaNEitiaHMQ5KqUMq7cfQUDUYRgwOxwo2NkHgcvX//qdrFGjoiaamJqSnp6O8vHzcYywsLLBq1SrMnTsXBQUFKCgoYGdDwsLCwOfzER0drTTDwDAMrl+/jhMnTqCrq0utPsbGxmLLli1GlebTmBUVFaGtrQ0rV640ygcouVyO8+fP46uvvlIpbW1ISAhefPFFzJgxQwu9mz4ikQg5OTmwtLREfHy8Uf5fa9rAwAA721FSUsKONitS6EZFRVFhUaI1IpFIqWBgZ2cnuFwumw0uMjISXl5e0/qgPzAwgCtXrkAoFKKjowO+vr7g8XhYvHgxZY8kaqFAQ48wDIPi4mKkp6dPODrr4OCAzZs3Y8GCBbh69SqEQiHa2toAADNmzGBrcrS2tiItLQ319fVq9Ss4OBgpKSk6SblLpk4kEuHChQsICwtDSEiIrrujFR0dHfj0009RXV095XPNzc2xZcsWJCcnG/SInVwuR0FBAXp6epCYmKgXNXgMkWK0WVGp/PHR5sjISISEhOhlwTZi+BiGQVtbG5vCubKyEhKJBC4uLuz7LywsbNqWdcrlcpSUlEAoFKK4uBh2dnZsQhqqyUFUQYGGHpLJZLh8+TK++uorDAwMjHuct7c3duzYgYiICJSWlkIoFOLu3bsYHBxkM1t5e3urvObS3d0d27dvx/z58w36gcyUKDbDJicnG8V+g8cxDIOCggJ88cUXEKlQWM7b2xt79uzB7NmztdC76aOoYBwbG/vEZZNkakQiESoqKtgHP30YbSamQyKRoKqqip3
taGlpYWttKVI4+/j4TMv7r62tDdnZ2bhy5QqGhoaoJgdRCQUaemxwcBBnz57FpUuXJiygFxkZiR07dsDZ2RlffPEFvvzyS7S0tEAikQAYmQHx9vaGu7v7pDZu29raYuPGjUhKSqJlGAZCkbbW1dUVMTExuu6OVgwMDOAf//gHbt68qdL5K1euxNatWw16GUBzczOuXbuGsLAwhIWF6bo7Rk8x2qx46KuoqIBEIoGzszO7xGo6R5uJ6ens7FRKoSsSiWBvb8/uLYqIiICjo6NW+6CoySEUCnHv3j14enqyNTmMsQ4T0SwKNAxAR0cHTpw4gcLCwjFfZxgGDx48gEQiwcyZM2FpaQm5XI62tjY0Nzejv78fwMgeDy8vL8ycOXPMjdxmZmbg8/nYsGED5Z43IC0tLbhy5QpWrFhhtPtnSktLceTIETx8+HDK5zo7O2PXrl0GnYK5t7cXly9fhqurK5YsWUKZ3nREIpGgurqane14dLT50YJtNNpLtEEmk6G2tpYNfBUrF3x8fNj3X0BAAMzNzbVyfUVNDqFQiJs3b8LCwgKxsbHg8XhGm2yEqI8CDQNSU1ODtLQ01NXVARj5oe/q6kJdXR0GBwcBAFwuF7Nnz8bs2bNhZmYGhmHQ19eH5uZmdHR0QC6Xg8PhwNXVFd7e3nBycmJrdGzbtg2enp66/BbJFDAMg7y8PMhkMiQmJhrlw41EIkFGRgYuXbqk0vmLFi3C888/b7CBs0QiQW5uLmQyGRISEmifgJ7p6upiH/oeHW1+NIWutkebienq7e1FWVkZ+x7s7++HtbU1WzAwIiJCa/sqHq/JERISAj6fj/nz59NACFFCgYaBYRgGhYWFOHLkCG7evDlu0T9ra2v4+fnB3d2dfQAdHh7GgwcP0NLSwqa49fLywq5du/D0009TuloD8vDhQ2RlZWHp0qUGv99gPE1NTfj444/R0tIy5XOtra3x3HPPYenSpQYZgDEMgxs3bqClpQUJCQlU78EAyGSyUQXbAGDOnDns2nptjjYT08YwDBobG1FSUoLi4mLU1dVBLpfDy8uLne0IDg7W+NJRqVSKW7duQSAQoLq6mq3JER8fT0E2AUCBhsHp6enBqVOnkJubi/v376OpqWnC/RsODg4IDAxU+oGXy+UYHh6Gk5MTRCIROBwOrKys2JocXl5e0/GtEBXdvn0bzc3NWLVqlUHvNxiPXC5HZmYmTp06BZlMNuXzg4OD8eKLLxpshpSamhrcvn0bMTEx8PHx0XV3iIr6+vqUCgb29fXB2tpaqWCbob5Hif4bHBxUSqHb3d0NCwsLhISEsPuLPDw8NDoQc+/ePQiFQhQUFEAulyMmJgY8Hg/+/v4GOeBDNIMCDQMhFotx4cIFXLhwQamS+PDwMBoaGvDgwYMJC/65ubkhICAAjo6OWLt2LZKTk2FpaYnm5mYIBAJcvXqVneUICwsDj8fDvHnzaApUj4hEImRmZiI4ONhoNwJ3dnbiyJEjbFHKqTA3N8emTZuwevVqg3zfdnR0IC8vD35+foiOjqZfzEbk0dHm0tJS1NTUQC6XY+bMmUopdI1x4IDoHsMwaGlpYVM4V1VVQSqVwtXVVSmFrqZWNQwODuLKlSsQCATo6OiAj48P+Hw+1eQwURRo6DmGYZCfn49Tp06Nu0wKGMnIU1dXN25RPg6HA29vb+zcuRMpKSmjsqQMDQ0hPz8fQqEQra2tAAAXFxckJSUhPj5e5RS5RDNqampw9+5dJCcnG+x+g4kwDINr167h2LFjKqWt9fLywu7duw1yBmBwcBA5OTmws7PD8uXLaWmNCRgaGmJHm4uLi0eNNkdGRsLT05OCTaIVYrEYVVVVKC4uRmlpKVpbW2FmZoagoCD2/Td79my1338Mw6CkpAQCgQAlJSWwtbVFXFwckpKSqCCmCaFAQ49VVFQgLS0NTU1Nkz5HsTn80fobzs7OCAwMZB9Q7ezs8NRTTyExMXHUQw3DMCgrK4NQKMSdO3f
AMAy4XC5iYmLA5/Ph5+enke+NTI5MJsOlS5fg4uKCRYsWGeWDx+DgID7//PNxs6o9CZ/Px/bt2w1upEwmk+HKlSvo7+9HUlISpUg1UYqsgYolLpWVlexos2JTeXh4OO2hI1rT0dHBvv/Ky8shFovh6OiIiIgIREVFITw8XO2CoI/X5Jg7dy74fD7Cw8ON8vca+TcKNPRQa2srjh8/jtu3b6t0vuIXV3t7O2bPng0XF5cxf5A9PT2xY8cOzJ07d8zXOzo6kJOTg9zcXDZw8fX1BZ/PR0xMjME92Bma1tZW5ObmgsfjGe1a7vLychw5cgTd3d1TPtfR0RG7du1CZGSkFnqmPQzD4O7du6irq8Py5cvh7u6u6y4RPTI8PIzKykr2wU8x2hwYGMiurdfEaDMhY5FKpaipqWHff/fu3QOHw4Gvry872+Hv76/y8tTh4WFcu3YNAoEA9+7dg4eHB3g8HpYvX041OYwUBRp6ZGBgAKdPn0Z2djbkcrnK7djZ2WHTpk1YvHgxsrKykJmZyRbvG0toaChSUlIwZ86cMV+XSCS4fv06BAIBm7fbzs4O8fHxSEpKMtqHYF1RLJcbHh5GYmKiQe43eBKJRIKTJ08iKytLpfMXLFiA7373u2qPsk23pqYmFBYWIioqCsHBwbruDjEAHR0d7Np6xWizg4MD+9AXHh5OS1uJ1vT09CgVDBwYGICtrS2bQjcyMlKlrHgMw6C2thYCgQA3btyAhYUFli5dCh6Ph1mzZmn+GyE6Q4GGHpBKpRAIBDhz5gxbD0MVXC4XK1aswLp165SWYXR1deHkyZO4evXquOdyOBwsW7YMmzdvHvemwTAM6urqIBQKUVhYCJlMBg6Hg+joaPD5fISFhdEom5p6e3uRlZWFxYsXjxv4Gbr79+/j448/xv3796d8rpWVFZ599lksW7bMoN5ripzzM2fORExMjEH1negPqVSqVLCtqamJHW1WLHNRZ7SZkInI5XI0NDSw77+6ujowDANvb282hXNQUBC4XO6U2n348CFbk+Phw4dsTY558+bRnjUjQIGGDjEMg6KiIhw/fhwdHR1qtRUTE4OtW7dOuMGqvr4eaWlpqK6uHvcYS0tLrFmzBsnJyRMWB+vt7UVubi5ycnLYZS+enp7g8/lYtmwZrSdWwZ07d3D//n2jTVvLMAwuXryIEydOTJiSeTyBgYHYvXu3QW0iFIvFuHz5MjgcDhITE43y/5XozsOHD5VS6A4MDMDGxgbh4eGIiopCREQEXFxcdN1NYqQGBgaUCgY+fPgQlpaWCA0NZWc7PDw8Jt2eTCZDUVERhEIhqqqq4OzsjMTERCQkJFBNDgNGgYaO1NfX41//+hdqamrUasff3x8pKSkIDAyc1PEMw+DWrVs4fvw42tvbxz3O2dkZmzdvfuLIsVwux+3btyEQCFBRUQFgZNQ5NjYWPB4P3t7eU/uGTJBYLEZmZiYCAwMRHh6u6+5oRXd3N44cOYLy8vIpn2tmZoannnoKa9euNZiRWkUWrfb2diQmJtIvSaJ1crkcjY2NKC4uHjXarHjoCwoKomCXaAXDMLh//z4bdFRXV0Mmk8Hd3Z19/4WGhk44gPkoRU2Oq1evQiaTYeHCheDz+QgICKAZYQNDgcY06+rqwokTJ3Dt2jW12nF1dcXWrVtVXoYhlUohFArxzTffTLhca86cOUhJSUFoaOgT22xubmaL9ShqcoSGhrJToIbykDid6urqcPv2baNNWwsA169fx7Fjx1RaFujp6Yk9e/bA19dXCz3TjsrKSpSWlmLJkiUUaBOdUYw2K2Y8enp6Ro02u7u700Mb0QqxWIyKigo2hXNHRwfMzc0RHBzMvv+8vb2f+P4bHBxkU++3tbVhzpw54PP5WLJkCQXNBoICjWkiEolw7tw5ZGVlTbgx+0msra2xfv16rFixQiM/ZAMDA/j6668hFAon3IA+b948bN++HZ6enk9sc2hoCAUFBRAIBEo1ORRToLRxcWT
08dKlS3B0dMTixYuN8pf94OAgvvjiiwn3Bk0kKSkJ27dvn/QImK61trYiPz+f/UVKiL5gGAbNzc3saHNVVRVkMhnc3NzYtfVTGW0mZCoYhkF7e7tSCl2JRAJnZ2dERkYiIiIC4eHhEw62MQyD0tJSCAQCFBcXw8bGhk1IY0jLaU0RBRpT0N8PVFcDYjFgZQUEBQFPSnojl8uRl5eHU6dOoa+vT+VrczgcJCQkYNOmTVp5UJ9MSl0zMzPweDxs3LhxUqPvDMOgvLwcAoFAqSbHokWLwOPx4O/vb5QP2E/S1taGy5cvG/UNsrKyEp988olKaWsdHBzwwgsvYO7cuVromeYNDAwgOzsbTk5OWLZsmXHP3KlyEyR6Z7zR5kcLts2aNcsk789E+yQSCaqrq9nAo7m5GRwOB/7+/mwKZx8fn3HvpR0dHcjOzkZubi6GhoYQFRUFPp+PiIgIrb5npdJ+DA1Vg2HE4HCsYGMTBC6X7n9PQoHGE5SWAocOAWfOALW1wKP/WhwOEBAArF8PvPIKEBGhfG5JSQnS09PR3NysVh+ioqKwffv2aVmGUVlZiX/9618TFgm0tbXF+vXrwefzJ51dorOzEzk5Obh8+bJSTQ4ej4fFixebxBQowzAoKCiASCRCUlKSUT6QSqVSfPXVV7hw4QJUubXMmzcPO3fuNIhZL6lUiry8PIjFYiQmJhpvAgR1boLEILS1tbEbysvLyzE8PAwnJyelFLrGurST6F53dzebwrmsrAxDQ0Ows7NjC1ZGRkaOuc9teHiYTb3f1NTE1uRYtmyZxgqgDgyUorn5EDo7z0AkqgXw6O81DqytA+Dquh7e3q/Azo7uf2OhQGMcdXXA3r1AZibA5QITJclRvJ6cDBw+DFhZNSM9PR0lJSVq9cHb2xspKSmImOZf3ooH4pMnT6Knp2fc49zc3LB9+3YsWLBg0qMIEokEhYWFEAgEaGhoAGAaNTn6+vqQlZWFhQsXGtR+g6lobm7Gxx9/jHv37k35XCsrKzz99NOIi4vT+1FURUKFpqYmxMXFGe17Vq2boL//9PWTaJRUKmVHm4uLi0eNNkdGRsLX19coB0qI7snlctTV1aG4uBilpaVoaGgAwzCYM2cO+/4LCAhQGuR8vCYHl8tla3LMnj1bpX4MDdWhsnIvurszAXABTJQpceR1F5dkhIQcho0N3f8eRYHGGFJTgVdfHfm9OZUsnObmDMzMZFi27J8IC8tV+fqOjo7YtGkT4uLidHozV2RDOn/+PIaHh8c9LigoCCkpKfDz85tS+/X19RAIBCgsLIRUKmVrcvB4PISHh+v9A+dkFRcXo7GxEatWrYKlpaWuu6NxDMPg0qVLyMjIUCltbUBAAF588cUppUHUlfr6ehQVFWH+/PnwN+aHaVVvglzuyMd77wEvvaS9/pFpoxhtVhRsGxwchJ2dnVLBNicnJ113kxipvr4+pRS6fX19sLKyQlhYGJvC+dElyL29vWxNjp6eHgQHB4PH42HBggWTrsnR3JyK6upXIZdLMXGA8TguzMy4CAp6D97edP9ToEDjMQcPAgcOqNMCA4CDmJiTWLjw7JTOtLCwQHJyMtasWaNXyzB6enpw6tQp5OfnT7gcZunSpdiyZQtmzJgxpfb7+vqQm5uL7OxspZociilQGxsbtfqvK8PDw8jMzISfn5/Rbg7u6enBkSNHUFZWNuVzzczMsGHDBqxfv17vR0e7u7uRm5uLWbNmTWkGzyCpfxMc8eabwOuvq98O0RuK0WbFQ59itHn27Nls0BEYGDjlgm2ETAbDMGhqamLffzU1NZDL5fD09GTffyEhIbC0tIRMJsOtW7cgFApRWVkJZ2dnJCQkICEhYcLAuKHhIOrq1L//+fu/CV9fuv8BFGgoSU0FXn5Zc+0lJv4fwsLyJnWsqg/p06mpqQnp6ekT1kKwsLDAqlWrsHbt2ikHS4qaHEKhkL2GlZUVli5dCj6fb1CpQhsaGnDz5k0kJyfD3kg
3y968eROfffaZSmlrPTw8sHv3br2fFRCJRMjJyYGlpSXi4+ON/wFK0zfB1FRgzx7NtUf0Sn9/P8rKythlLr29vexos+LBz1gTXhDdGxoaQnl5Obu/o6urC1wuFyEhIez7b+bMmUqp96VSKRYtWjRmTY7m5lRUVmru/hcamgovL7r/UaDxrbq6kX2MIpGmWmRgbi5BSsobcHTsHPeo4OBg7NixY8rLjnSFYRjcvXsX6enpbOrasTg4OGDz5s0qL/9qaWmBUChEfn4+W5MjJCSErckx2SnQ6SaXyyEUCmFra4ulS5ca5ci3SCTCP//5TxQUFKh0fkJCAlJSUvQ6laZcLkdBQQF6enqQmJhotMGiEs3fBAFr65HN5HoeUBL1MQyDe/fuKRVsk8vl8PDwYDMJKUabCdE0hmHQ2trKvv8qKyshkUjg4uLCpnD28fFhZzkUNTl4PB6WLFkCmew+rl+PgFyuufufmZk1Fi8uNfk9GxRofGv1akAgmNpy5CfhcGTw9i7Hhg3vjnrN3d0d27dvx/z58w3yYVQmkyEnJwenT59ms0iNRd0N7SKRiC3W8+DBAwAjVcuTkpIQHx+vVxWXFSn3EhMT4e7uruvuaEVVVRU+/fRTdHaOHzyPx8HBAd/73vcQHR2thZ5pTmlpKSorKxEbG4uZM2fqujvTRxs3QS4X4POBCxc01yYxCCKRCOXl5eyDX2dnJ7hcrlLBNi8vL4P8/feo3//+98jIyEB5eTlsbGywfPly/OEPf5hUkVuiPRKJBJWVlez778GDBzAzM0NAQAAiIiJgaWmJiooKtibHunWXYGlZAkCmwV5w4eLCx7x5pn3/o0ADIwNu2lxCn5LyW7i4jDwk29raYsOGDeDxeEaxDGNwcBBnz57FpUuXJtwIHBkZiR07dqi8/IlhGFRUVEAgEOD27dtgGAbm5ubsFKgua3IwDINr166hv78ffD5f7/cbqEIqleLrr7/GuXPnVEpbGx0djZ07d+pVYPi4lpYWXL16FWFhYQgLC9N1d6aXtm+CpaVAeLj22id6jWEYtLW1obi4eNRosyLoCAsL01hK0um0du1aPPvss1i8eDGkUilee+01dikZpQTWH52dnWwK57KyMohEIjg4OGDOnDlgmDrMn/9XrV178eJS2NmZ7v2PAg0A+/cDH3yg2YE8BQ5HhoiIbCQkpE2p2J2h6ejoQEZGBm7cuDHuMYqig0899ZRaD5xdXV1sTY7+/n4AgI+PD/h8/rTX5Ojv70dWVhbmz59vMMvfpqqlpQWffPIJGhsbp3yupaUlUlJSkJCQoLcjl319fcjJyYGrqyuWLFlilIHiE2nzJsjlAvv2Ae+Ontklpkkx2qzIZtXS0gIzMzP4+/srLXPR13vGRNrb2+Hh4cHObhP9I5PJUFtby6Zwdnf/AsHBpTAz08bjMBezZu1DcLDp3v8o0MBIcduaGu217+7eg7t3xfD09NTeRfRETU0N/vWvf6G+vn7cY6ytrbFu3TqsXLlSraBAIpHgxo0bEAgE7PXs7OwQFxc3LVW3S0pKUFdXh+TkZL3eb6AqhmGQnZ2N9PR0SCSSKZ/v5+eH3bt36+37XiKRIDc3FzKZDAkJCUb5fzhp2r4JBgUBVVXaa58YtM7OTqUUuiKRCPb29oiMjERERAQiIiL0ejb0UdXV1QgODsbdu3cRFRWl6+6QSbhyJQDDw3Vaa9/aOgixsaZ7/zP5QKOvD3ByUi52q2kcDtDbC5jCflJg5AG1sLAQGRkZ6OrqGvc4V1dXbN26FTExMWqPXI1Vk2Pu3Lng8XiIiIjQ6MiYRCJBZmYm5syZg7lz52qsXX3y8OFDHD16VKWikxwOh01bq4+b9hmGwY0bN9DS0oL4+Hi4uLjouku6RTdBokceHW0uKSlhZ1J9fHyUCrbp471FLpdj06ZN6OnpQW6u6rW0yPSRSvuQm+sE5YrfmsZBfHwvuFzTvP+ZfKBx6xawYIH2r1NUBMyfr/3r6BOJRIK
LFy/i7NmzEE2Qycbf3x8pKSkIDAxU+5p9fX3Iy8tDdnY2G+R4eHiwNTnUXQPc2NiIwsJCJCcnw8HBQe3+6qOioiJ89tlnE27yH4+bmxv27NmDgIAALfRMfbW1tbhz5w4WLlwIHx8fXXdHP9BNkOix3t5epYJt/f39sLa2ZgsGRkREwNXVVdfdBADs27cPZ8+eRW5ursoVqcn06uu7hRs3tH//W7SoCA4O87V+HX1k8oHG1atAbKz2r/PMM+/Ay2vqa9yNgVgsRl1dHe7fvz/hRmJPT08EBQVppEAfwzBob2/HvXv32IDD3NwcXl5emD179pTTlSpSN3K5XMycOdMg1w4/iVQqRWVlJZqbm1U639vbGyEhIXqZ5GBoaAjNzc1wdHSEm5ubUf7//f/27jyorTPdE/9XQoDYEQJhsA0GsxnjeMU2GDCyjRPbiVfoSnfSiWN3Tzq32j2/mZqaP7r73pmq6dTUVNf0H7dT08kt7Did3m7Aa7zFxBarN7ybzRiDsY0wWhCbkITEOb8/iM5FIGEE2vV8qlzgcM7RC8GPznPe932euUrq7cV/+fd/d/rr9Jw4gajt2xEWFkY/fzInLMvi+fPn3Nr6rq4uMAyDhIQEbrYjPT3dpfv0zH75y1/izJkzqK2t9fj+QOQ/DA3dxN27zr8JXLPmBiIjNzj9dTyR3yca9DDPdeRyOSorK2dcjiMQCLBlyxbs2LHDYRVIent7UVNTg2vXrnE9OdLT0yGVSrFq1arXTsGr1WpUV1ejsLAQEonEIWPyNE+fPsWxY8egUqnsPjcsLAwffPABVnngL/jo6Chqa2sRGhqK/Px8j0yC3M5FQfB/7d+Pl7GxCAkJQVxcHCQSybSPkZGRlISQWRsdHbUooavRaBAYGMg1bMvJyYFEInHq7xTLsjhy5AhOnTqF6upqpKenO+21iOPRjIbz+X2iMTICREbS8mRXam5uRmVl5YxPzsPCwvDOO++gqKjIYWtx9Xo9bty4gerqavT29gKY6MlRWFiIoqKiaZsNzXtNBgcHIZVKPXJN8HyNj4/j3LlzuHjx4pzK1i5fvhwffvghoqKinDC6uRsfH8e1a9cwMjKCoqIin6z05jAuCIIsjwd5ayv6tFoolUooFAruo0aj4Y4LCgqaloCYPxeJRJSEEJtYlkVvby/XJfrJkycwmUwQi8UWJXSFQqFDX/ef/umf8Le//Q1nzpyx6J0RFRXlkNl54lwm0wjq6yNBezScx+8TDYAKrrgDwzBoaGjAmTNnMDw8bPO4+Ph4lJaWYsWKFQ67yTD35Kiursb9+/e5nhxr1qyBVCpFamoqRkdHUVVVhTfeeMNj9xvMV19fH44ePYru7m67zw0MDERpaSk2b97sUTd/LMuiqakJnZ2dyMvL89kZKIdzYxA0Go1QqVQWyYf5c7VazSXAAoHAIvEwf5RIJIiJifHPssTEJoPBgCdPnnA9Lfr6+sDn85GWlsYlHosWLZp3/LJ1/pdffomDBw/O69rENW7cSINe77z4R1WnKNGgEvJupNfrcenSJVRVVc3Y8C8rKwulpaVYvHixQ1/fWk8OoVCIhQsX4pNPPvHJDd8sy6K2thYVFRVzKlublJSEw4cPe1zX7JcvX6KxsRE5OTm0fMFeHhoETSYT1Go1lErltCREpVJhfHyiiy+fz0dsbKzVJEQsFtOSOQKVSsUtsWpra4PBYEBkZCSys7ORk5ODZcuW2b13j/iGJ09+hZ6ePwFwQvyjPhqUaADUFNcT9Pf34/Tp07h586bNY3g8HvLy8rBnzx5ER0c79PWNRiNu3ryJo0ePYnh4GGKxGKGhoSgoKHBJTw5XGRoawp///Gc8evTI7nN5PB7eeustvP322x514zY4OIi6ujrEx8c7pFSyX/LCIMgwDPr7+6clIOY/5iSax+MhJibG6p6Q2NhYBAUFOXRcxPOZTCY8ffqUSzxevnwJHo+H5ORkbrYjJSWFZsn8hFbbgsZG58U/6gxOiQY
AYPt2QCZz7AM9gQCQSoHLlx13TV/37NkzfPPNN3g6wzKOoKAgvPnmmw5tlPfy5UvcunUL27ZtQ39/P6qrq9HY2Mj15MjJyYFUKnV4Tw5XevDgAb7++usZl6rZIhaLcejQIaSlpTlhZHMzNjaGuro6AEBhYSHdMM6XDwVBlmUxMDAwLQkxfzQXhQAm9mlNnQUxL9Fy9Hp+4pkGBgYsGgZqtVqEhoZyJXSXL1/u8IdbxLM8eLAdGo0Mjp3VEEAkkmLlSv++CaRE4wddXUB2NjBDuwe7CYUTD/Ko0p19WJbFvXv3cOLEiRmrIEVHR2Pv3r3YuHHjnG/+zd2vAwMDkZ+fb3GdkZERNDQ0oLq62qInx+bNm5Gfn++wqljOZjAYUFFRwd2U2ysvLw/vvvuux9x0sSyLW7duQalUWt3ET+bIT4Igy7IYHh62moQoFArodDru2MjISIt9IZMTEm/590/swzAMuru7udmOrq4usCyLxMRE5OTkYPny5UhLS/OoWV0yfzpdFxobs8Ewjot/fL4QubktCAnxnPjnDpRoTFJeDvz854693uHDjruevzGZTJDJZDh//rzFm/9USUlJKCsrQ0ZGhl3X7+/vh0wmQ0FBAeLj420exzAMHj16BJlMhtbWVgATsyobNmxAcXGxRzdm6uzsxJdffgmFQmH3uWFhYXj//fexZs0aJ4xsbtrb29HS0oLc3FwsXLjQ3cPxPX4eBFmWxejoqNVZEKVSaTEbGBYWZnUWRCKRIDw83GtnPoklrVZr0TBwcHAQQUFByMzM5GY7qOiEb5DLy9He7rj4l5lZjoQE74l/zkKJxhSffgr89reOuc6vfz3/65CJmYVz586hpqYGDMPYPG7lypU4cODAjEmD2e3bt6HRaLBlyxa7yta+evUK1dXVuH79OtftPD09HcXFxVi9erXHlMBlGAbnz5/HhQsXZvyZ2bJs2TIcPHjQY5YLKBQKXLt2jasYQzdxTkRB0CadTjetPK/54+DgIHecUCi0OgsSFxeHqKgo+v31UizLoqenh0s6Ojo6MD4+jri4OC7pyMzMdNiSXuJ63d2foqtr/vEvJeVTJCf7VvybK0o0rCgvB44cmViqbM9yZYFg4s9nn3nVQzyv0dfXhxMnTuDBgwc2j+Hz+SguLsbbb79ttXfC6OgoLl++jBUrVmDp0qVzHoter8fNmzchk8m4nhxRUVEoKipCYWGhW/tKKBQKHDt2DF1dXXafKxAIcODAAUilUo+4GdJqtaitrUVkZCTy8vJoc6arUBC0m8FgmFamd3KvEPNbbWBgoM0kRCQS0e+4FzEYDHj8+DHXqVylUiEgIADp6elc4pGYmOgRsZTMnlxejo6OI2AYE+zbsyEAny9AevpnNJMxCSUaNnR1AR9/DFRVTbxvzvRea/56SQnwxRcetRzZJz1+/BgVFRV48eKFzWNCQ0Oxa9cuFBcXc2tpHz9+jPb2dpSUlDhsvwHLsnjy5AlkMhnu378PhmHA5/Oxdu1aFBcXY+nSpS57k2FZFvX19fjmm28wNjZm9/mLFy/GoUOHkJiY6ITR2cdkMqGhoQF6vR5FRUXU+ModKAg6jLlXyNSlWAqFAmq1mpt1FAgEiI2Ntdq0UCwWe8yMKZmOZVkolUqLErpGoxHR0dFYvnw5srOzsWzZMmoe6iV0ui60t38MjaYKgAAzJxwTXxeJSpCR8YXf78mYihKN12hpAT7/HLh4caKf1eSfFo8HLF0K7NgxUSaeSti6DsMwuHHjBk6fPm2xZGGquLg47N69GyqVComJiVi1apXTxqTRaLieHOa13IsWLYJUKsX69eudWhVpeHgYX3/99YyzPbbweDxs374du3fvdvsGR5Zlcf/+fbx48QKbNm2CWCx263gIKAg62fj4ONcrZOrG9Km9QsRisc0yve7+t0ssGY1GdHR0cImHXC4Hj8dDSkoKli9fjpycHCQlJdEMlofTalsgl38OtfriD039Jt8y8yAULoVYvAO
JiZ/4dQnbmVCiYYeREaCjAzAYgODgiWa31N/HvQwGAy5fvozLly9bfYqv1WqhUChQUFCADz74AEuWLHH6mEwmE+7cuYPq6mp0dnYCmJhhyc/PR3FxMeLi4hz6eo8ePcJXX301p7K1MTEx+Oijj+zeSO8M3d3duHv3LlauXOmz3di9HgVBl2IYBhqNxmoSYq1XiLXO6XFxcVT62QNoNBq0tLSgqakJra2t0Ol0CAsLQ3Z2NrfMiiroeTaTaQQ6XQdY1gAeLxghIWkQCCj+vQ4lGsQnDAwM4MyZM7h+/TpYlgXLsnj16hUAYMGCBdzypQ0bNmDfvn0QiUQuGVd3dzeqq6tx69YtrifH8uXLIZVK572p2WAwoLKyErW1tXM6f8OGDfjxj3/s9mVJGo0G9fX1WLhwIVavXk3rmQmZBZZlMTg4aHVPiEKhmNYrZOpSLPMeEU8pW+1PGIZBV1cXmpqa0NLSgu7ubrAsi8WLF3NJR2pqKs1SEZ9AiQbxKS9evMBXX32F2tpaxMfHW611HxgYiJKSErz55psue5M19+SoqamBWq0GMLGsq7i4eE49OZ49e4Zjx46hr6/P7rGEhobivffew7p16+w+15H0ej1qa2sRGBiIgoICBAYGunU8hPgKlmUxMjJidRZEoVBgdHSUOzYiImLaLIj5c9pP4BrDw8MWJXSHh4cRHByMrKws5OTkIDs7G7Gxse4eJiFzQokG8Sl37tyBUqlEXFwczpw5M+ONeGRkJHbv3o1Nmza5bJ0swzBoamqCTCZDS0sLgInEZ8OGDZBKpa/tycEwDC5duoRvv/12TmVrs7KycPDgQZfN6Fhj3l8zMDCAwsJCREREuG0shPgjrVZrsSF9chIyeQlmaGiozSQkIiKCZh8B1NbW4ve//z3u3LmD3t5enDp1Cnv37p3z9ViWxYsXL7ik4+nTp2AYBvHx8dxsR0ZGBi2HI16DEg3iE3Q6HS5fvozs7Gykp6cDmNhkWVtbi2+//RZardbmuQsXLkRpaSmys7NdNVwAE+V6a2pquOpKAJCWlgapVIpVq1ZNmzZXKpU4duwYt+/DHgKBAPv27cPWrVvdenPQ2tqKx48fY8OGDUhISHDbOAgh1un1+mkJiPnvAwMD3HHBwcFWE5C4uDhER0f7TRJy8eJFNDQ0YO3atdi/f/+8E42pdDod2trauP0d/f39EAgEyMjI4BKPycuDCfE0lGgQr9fe3o7W1lZs377d6n6D0dFRXLhwAVevXuUquFiTk5OD0tJSl98AGwwGrieHXC4HMDHbMrknx7Vr1/Dv//7vFuuuZ2vhwoU4fPiwWztp9/b24ubNm8jMzMQyqkxEiFcaGxvjeoVM3RvS398/rVeItX4hvtwrhMfjOTzRmIxlWfT19XGzHe3t7TAajRCJRMjJycHy5cuRlZXl9n13hExGiQbxWiaTCVeuXEFcXBzWrFnz2uOVSiVOnjyJu3fv2jyGz+ejoKAAu3fvdvmSHms9OcbHx6HX62EymRAZGWn3U6uSkhLs2bPHbfsfhoeHUVdXh5iYGKxfv95nbzAI8Xcmk2larxDzR5VKxS31DAgIQGxsrNUkxNt7hTg70ZjKaDSivb2dSzxevXoFPp+P1NRUbrYjKSmJZjuIW1GiQbySXC7H9evXsXXrVkRHR9t1bkdHByoqKvDs2TObxwiFQuzYsQNbt251y026RqPBX/7yF/z5z3/GyMgIACA8PBwJCQmQSCSvfTMWiUQ4ePAgsrKyXDHcaYxGI+rr62EymVBUVITg4GC3jIMQ4n7j4+Po7++fthTL/Lnph2aQfD4fMTEx05ZimXuFeHrBCFcnGlOp1Wo0NzejpaUFra2t0Ov1iIiI4EroZmdn05444nKUaBCvYu5+zbIsCgsL5/ykhmVZNDY24uTJk9BoNDaPE4vF2LdvH9atW+eyp0JjY2M4efIkZDIZGIaBSqWCXC7H0NAQgIn9FgsWLEBCQoLVKfLc3Fz85Cc/sbuSlSO
wLMttiiwoKHDrpnNCiOdjGAYDAwM2y/RO7hUSHR09bRbEnIx4wsMMdycak42Pj6OzsxPNzc1oamrCixcvAADJyckWJXRplpk4GyUaxGsMDAzgypUryMvLQ2JiokOuaTQa8f333+PixYsz7n9ITU1FWVmZ0xvJPX/+HEePHuV6gEw2MjICuVwOhULBLUOIiYlBYmIiRCIRQkND8ZOf/ATr16936hht6ezsxIMHD7BmzRokJye7ZQyEEN/BsiyGhoZsJiHmIhoAEBUVZbVZoUQicdmeBU9KNKYaGhpCS0sLt8xKq9UiJCQEWVlZXOIRExPj7mESH0SJBvEK9+7dQ19fH7Zt2+aUJkZDQ0M4e/YsN1tiy7p167Bv3z6H1zRnGAbfffcdzp49+9qytUajEX19fZDL5dwb7cKFC/HJJ5/grbfecnnte5VKhYaGBiQnJ2PlypW0HpgQ4nTmXiHW9oQoFAqLSoPh4eFWZ0EkEgnCwsIcFrM8OdGYjGEYPH/+nEs6Ojs7wbIsEhISuKQjPT3d45eqEe9AiQbxaHq9HpcvX0ZmZiYyMzOd/npyuRyVlZVobm62eYxAIMCWLVuwY8cOhyxPUqvVOHbsGDo6Ouw6z9wZWCwWc13HAwMDsX79ekilUixevHjeY5uJTqdDbW0tQkJCkJ+fT11sCSEeY3R01OosiFKp5JahAkBISIjVWRCJRDKrXiEjIyNc7F69ejX+8Ic/QCqVIiYmBklJSU79Hh1ldHQUbW1taGpqQnNzMwYGBhAYGIjMzEwu8ZBIJPQQicwJJRrEY3V0dKC5uRklJSUu32/Q3NyMyspKrtysNeHh4XjnnXdQWFg4p0opLMvi5s2b+Pvf/26xBGC2EhMTcejQISxevJjryXHt2jXodDoAwNKlSyGVSrF69WqHJgEMw+DatWsYHh5GUVERdQ8mhHgVc68Qa00LJ+/ZCw4Otpj9mJyEmHuFVFdXQyqVTnuNDz/8EMePH3fhd+UYLMuit7eXm+148uQJTCYTYmNjkZ2djZycHGRmZkIoFLp7qMRLUKJBPI7JZMLVq1cRExODdevWuW0cDMOgvr4eZ8+eteiWO9WCBQtw4MABrFixYtZPfLRaLf7617/izp07cxrb1q1bsW/fvmlT2+aeHNXV1ejp6QFg2ZPD3gpdk7Esi6amJnR2diIvLw8SiWTO1yKEEE9kNBqnVcYyf1Sr1dzSWoFAYHNPSExMjM9ssjYYDBYldBUKBfh8PtLS0pCTk4Ps7GwsWrSIZjuITZRoEI/y6tUrNDQ0YMuWLR5TsUiv1+PSpUuoqqriyjBak5WVhbKyMixatGjG67W2tuL48eMWXXZnKzo6GgcPHnxt0zuWZdHR0QGZTIZ79+6BYRjw+XysXr0aUqkUaWlpdr0xvHz5Eo2NjcjJyeE6rxNCiD8xmUxQq9XTZkEUCoVFrxA+n4/Y2FirndPFYrFXLzNVKpVc0vH48WMYDAZERkZyS6yys7NplptYoESDeASWZdHQ0IDx8XEUFRV55NMRtVqN06dP49atWzaP4fF4yM/Px549exAVFWXxNaPRiFOnTuHKlStzev01a9bg/ffftzuIDwwMoK6uDrW1tdza5IULF0IqlWL9+vUzloUcHBxEXV0dJBIJcnNzPfL/CyGEuBvDMOjv77eahEzuFcLj8SAWi612To+Li/OqDdgmkwkdHR1cNauXL1+Cx+MhOTmZ61S+ZMkSn5ndIXNDiQZxu6GhIXz//fdYv379a2cDPEFXVxcqKirw9OlTm8cEBwfjzTffRElJCYKCgvDy5UscPXp0xj0ftgiFQvz4xz/Ghg0b5nWjbzKZcO/ePchkMm7s5o3cxcXFFkuhxsbGUFdXBwAoLCxEUFDQnF+XEEL8GcuyXK+QqQmIUqm0KK0uEomsJiBxcXEevy9iYGCASzpaWlowOjqK0NBQi4aB81m+S7wTJRrErR48eAC5XI5t27Z51ZMclmVx7949nDhxAiqVyuZxUVF
RWLhwIdra2l5bttaatLQ0HDp0CGKxeD7DnebFixeQyWS4desW1xBr+fLl2Lx5M0ZHR6FWq1FYWDhtVoYQQojjsCyL4eFhq0mIQqHginsAE/vtpiYh5o/uaNA6E4Zh8OzZM26Z1bNnz8CyLBYuXMgts0pLS/PqZWRkdijRsMPICNDRARgMQHAwkJYGhIe7e1TeSa/Xo6qqCunp6cjKynL3cObMvHH9woULFm8IwMQmusePH2NgYADh4eFITU2d9dMcPp+PPXv2YPv27U6ddtZqtbh27Rqqq6vx9OlT9Pf3IzMzE++88w42bdpEa22JJQqChLgMy7IYHR21mYSMjIxwx4aFhdlMQsLDw92+7FWr1aK1tZXrVD40NITg4GCLErpxcXFuHePrmEwj0Ok6wLIG8HjBCAlJg0BA8e91KNF4jZYW4PPPgQsXgM5OYPJPi8cDUlOBnTuBX/wCyM523zi9SWdnJx4+fIiSkhKfuZEdGRnBuXPnUFNTA4ZhoFAo0NHRMW3zeGxsLFJSUmbsVLtgwQIcPnzYZTXYFQoFGhoawLIsXr58yfUQMffkKC4u9pp68MQJKAgS4pHMvUKmLsVSKBQYHBzkjhMKhVYTkLi4OERFRbk8CWFZFj09PVzS8fTpU4yPj0MikXBJR0ZGxoz7B11Fq22BXP451OoL0Os7AUy+ZeZBKEyFWLwTiYm/QFgYxT9rKNGwoasL+PhjoKoKEAiAGYoNcV8vKQG++AJISXHdOL3J+Pg4ZDIZoqKisG7dOrc/YXGGzs5O/PM//zPu3r1r8xgej4fExEQkJSVNWy4mlUqxf/9+l+yJ0Gq1qK2tRWRkJPLy8riZE4VCgZqaGjQ0NHCzNKmpqZBKpVizZg1NdfsLCoKEeC2DwWC1TK9CobDoFRIUFGSzTK9IJHLJ+7Rer8fjx4+5xEOtVkMgECAtLQ3Lly9HTk4OEhISXHrPoNN1ob39Y2g0VQAEAGaIfz98XSQqQUbGFwgJofg3GSUaVpSXA0eOTLxvzvTeOpVAMPHnj38EfvYz543PG/X19aG+vh7FxcUO32/gKdra2nD8+HFoNBoMDAygs7PTYmp7KoFAgKSkJCQmJnJla5cvX+70cZpMJjQ0NECv16OoqMjm7IrBYMCtW7dQXV2Nly9fAphYI1xQUICioiKPKT9MnICCICE+y2g0QqVSWU1CrPUKsda0UCwWO2VZL8uyUCgUFiV0jUYjoqOjudmOZcuWOXVPilxejo6OI2AYE2ZOMKYSgM8XIC3tj0hMpPhnRonGFJ9+Cvz2t/O/zu9+B/zmN/O/jrdjWRbXr1/H2NgYioqKfLLMnclkwunTp1FVVWXx31mWRV9fH549e4axsTGb56ekpOA3v/kN8vPznfrEhmVZPHjwAM+fP0d+fj5iY2NnfV5HRweqq6tx9+5drifHqlWrIJVKkZ6e7pOzU36LgiAhfstkMqG/v9/qnhCVSoXx8XEA/9ErxNpsSGxsrMNmvo1GIzo6OtDU1ITm5mb09vaCx+MhNTWVSzySk5Md9h7U3f0purrmH/9SUn6H5GSKfwAlGhbKy4Gf/9yx1zt82HHX8zbmsrW5ublYvHixu4fjFD09PTh69CjXhdua8fFxvHz5Ei9evLCoPBUQEIC0tDRIJBLweDykp6ejrKwMycnJDh9nd3c37t69i5UrVyI1NXXO17HWkyMxMRFSqRQbNmzwiDW1ZB4oCBJCbGAYBhqNZtosiHmJlrmCIY/HQ0xMzLQkRCKRIDY2dl5LgzUaDTfb0dLSAr1ej7CwMGRnZ3OdyiMjI+d0bbm8HO3tjot/mZnlSEig+EeJxg+6uib2Mer1jrumUDixj9Iflys/fPgQPT09Xle2drZYlsWVK1dw6tSpGbuFT2YwGPDs2TMoFApEREQgKyvLal30DRs2YN++fQ5ZmqTRaFBfX4/ExESsWbPGYU99zD05qqur0dHRAWBiw6G5J0d8fLxDXoe4EAVBQsgcsSyLwcFBq0m
IQqGw6BUSHR1tNQmxt1fI+Pg4urq6uMSju7sbALB48WJutmPp0qUICAh47bV0ui40NmaDYRwX//h8IXJzW/x+zwYlGj/Yvh2Qyexbjvw6AgEglQKXLzvump7OYDCgqqoKqampyPbRCjQajQbHjx9HW1ub3efy+Xxs2LABKpUKT548sXlcYGAgSkpK8Oabb86pSZPBYEBtbS0EAgEKCgqcmuy9ePEC1dXVuHnzJvdEKzs7G1KpFDk5OT65XM4nURAkhDiBuVeItVkQhUKB0dFR7tiIiAirCUhcXNxrq1QODw9bNAwcHh6GUChEVlYWl3jY2iP64MF2aDQy2Lcn43UEEImkWLnSv+MfJRqYeODmzD24LS3AsmXOu76nePbsGe7fv+9TZWunun37Nv76179aBMbZio+Px+HDh5GcnAyWZfHw4UNUVlZCoVDYPCcyMhJ79uxBfn7+rG7YGYbBzZs3odFoUFhYiIiICLvHOVejo6O4du0aZDIZ18RQLBZj8+bNKCgo8NnfCZ9AQZAQ4iZardbqLIhSqcTw8DB3XGhoqNUkRCKRTOsVwrIsXrx4wc12PH36FAzDID4+Hjk5OVwJ3cDAQGi1LWhsdF78y81tQViY/8Y/SjQA/OpXwJ/+5NgHeWYCAfDJJ8C//qvjr+0pGIaBTCZDeHg41q9f75Mbg0dHR/GPf/wDN2/enNP5mzdvxoEDB6btYTCZTKitrcW5c+eg1Wptnr9w4UKUlZVh2Qw3a62trXj8+DE2bNiAhISEOY3TEViWRXNzM2QyGZqbm8GyLAIDA5Gbm4vi4mKn7EEh80RBkBDigfR6vc0kZGBggDtOKBRaVMeanIRERUVBr9ejra2NK6Gr0WgQGBiIjIwM5OTIwOd/C2DcCd+BAAsXfoL0dP+Nf5RoYKK57dOnzr3+DKtkvJpCoUBdXR02b9486ypG3qa9vR3Hjh2zqD0+WxEREfjwww+xYsWKGY8bHR3F+fPnIZPJuKoe1uTk5KC0tNQikejt7cXNmzeRmZk5YyLiDuaeHNeuXeNmgVJTU1FcXIy1a9dSTw5PQUGQEOJlDAYDVCrVtKVYSqUS/f39XJnewMDAaRvSeTweVCoVnj9/jrS0/4Hw8CGnjVMoTMPGjf4b//w+0RgeBqKiLJvdOhqPx6Krqx/hPtSpnmVZ3LlzBzqdDps2bfLJdfgmkwmXLl2CTCbDXP6ZLF++HD/60Y/sWr6kVCpx/vx5PHz40OYxfD4fGzduxKZNm/Do0SNER0dj3bp1Hv3/YGxsDHfv3kV9fT3kcjkAIDw8HBs3bkR+fj6io6PdO0B/NjyMmNRU8JwbBIGhIfhUECSEeCyTyWSRhEz+qFaruQqQQiGDvXvL4dyFGDwUFAxBIPDP+Of3icb9+8Dq1c5/nf37/xdiY186/4VcwGg04uXLl4iNjXXpHgBX0mq1ePz48YwN92wJCAjA0qVLER8fP+dlZIODg+js7LRYnzrZ6Ogo+Hw+MjMzsXjxYo9OMiYzbwqUy+VQKpVgWRY8Hg9isRiJiYmIioryyaV3nmyRSoV/PnnS+S907x6wapXzX4cQQmYwPj4+qVfIdQAOLOltw9q19xARscrpr+OJ/H7dwqSKa07FML7xo+7v78fIyAiSkpJmVTLO27AsC7lcjq6uLoueF7MVGRmJzMxMm922ZysqKgqrVq2CUqlEV1cXVxpQr9fDZDIhNDQUfD4f3d3d6Ovrw5IlSxAXF+fxN+k8Hg+RkZGIjIxEamoqent70dvbC5VKBZVKhdDQUCQmJkIikdCyKhcRzOH3fE5cFWwJIWQGAQEB3H6OoaER3L3r/NdkWf+Nf37/Tu6q/mJ8vhM2WbrQ+Pg4enp6EB4ejqSkJHcPxykMBgPa29vntBeDx+MhKSkJSUlJDrvZ5/F4kEgkEIvFePLkCbq6uhAUFDSt3K15k5tcLkdqauqcmxW5WlBQEJKTk7F48WKo1WrI5XIMDg6io6MDz549g0QiQWJiIkJ
DQ909VJ9mctFsWHt3NyKSkhAbG+uTvXUIId6Hx3PNTaCrXscT+f3SqZERIDKS9mjM5MWLF3j48CGKiop8dqnUgwcP8M0330Cn09l9bmxsLN577z2nVFPq7+/HzZs3sWjRIiQnJ+PSpUu4efPmjHtGVq1ahV27dtmsF+7J5HI56uvrcffuXYyNjQEAMjIyUFBQgOzsbK9ZIuZVRkYQk5Li1D0aLID//NFHMAQGgsfjITo6elplGPMTRuouTwhxFZNpBPX1kZiIUs5CezT8OtEAqOCKLQzDoLq6GqGhodiwYYPHL8uZC71ej7///e+4cePGnM4vLCxEWVmZw2+OdDodamtrERISgvz8fItlRD09PaioqEBra6vN8wUCAbZu3YodO3bMexmXO5h7ctTU1HB9Rsw9OTZt2oRwb83aPZWTgyCblobBxsZpmzLNH/WTupFHRUVZTUAkEolX/i4TQjzbjRtp0OudF/+o6hQlGlRC3gqVSoWamhoUFRUhLi7O3cNxiidPnuDLL7+EWq22+9yIiAj89Kc/xcqVKx06JoZhcP36dQwNDaGoqMhmkztzr4rKykr09vbavF54eDjeeecdFBUVeeVsAMuyaGlpgUwmQ1NTE1iWhUAgQG5uLqRSKfXkcBQ3BkGWZTEyMjIt+TB/Prm/THh4+LQkxDwzEhoa6pMPQwghzvXkya/Q0/MnOLYruBn10aBEA9QUdzKWZXHr1i2MjIxAKpV65c3p65hMJpw7dw6XLl2aU9naFStW4IMPPnDoXghz4tDR0YG8vDzEx8fP6jyGYVBfX4+zZ8/arFAFAAkJCThw4ABycnK89mbMnPzW19dzPTlSUlIglUqpJ8d8eXAQHB0dtZmEDA39R+370NBQi9mPyUlIRESE1/7eE0KcizqDOxclGj/Yvh2QyRz7QE8gAKRS4PJlx13TmbRaLaqqqrBq1SosWbLE3cNxit7eXhw7dgzPnz+3+9zAwED86Ec/QmFhoUNvWnp6etDY2Ijs7GxkZGTM6Rp6vR4XL17E999/D9MMv8TLli1DaWkpFi1aNNfhut3Y2BgaGxshk8nw4sULABMzTAUFBdi8eTNEIpGbR+ilvDAImrsGT01AlEqlRVGH4ODgaQmI+WN0dDQlIYT4uQcPtkOjkcGxsxoCiERSrFzpJTeBTkKJxg+6uoDsbGDSUuF5EwonHuSlpDjums7S0tKCzs5OlJSU+ORmTJZlUVNTg8rKShiNRrvPT05OxuHDh2c90zAbQ0NDqK2thUQiQW5urkNudtRqNU6dOoXGxkabx/B4POTn52PPnj2Iioqa92u6C8uy6OzshEwmw507d8AwDHg8HlatWoXi4mJkZmbSDaQ9fCwIGo1Gq0mIQqGw6BosEAiszoLExcUhJibGJ2d1CSGWdLouNDZmg2EcF//4fCFyc1sQEuIFN4FORInGJOXlwM8d2LelvBw4fNhx13MGo9GIqqoqLF68GCtWrHD3cJxicHAQX331FZqbm+0+l8fjYefOndi1a5fD+oaMjY2hrq4OwMRm8qCgIIdcd7LOzk5UVFSgs7PT5jHBwcF48803UVJS4pQxuNLg4CDq6upQV1eHgYEBABPLxYqLi7Fx48ZpJYGJDX4SBE0mE9RqtdUkRKVScT10AgICEBsba7Eky5yEiMViWq5HiA+Ry8vR3u64+JeZWY6EBM+Lf65GicYUn34K/Pa3jrnOr389/+s404sXL9DY2Iht27Z5Te8Fe927dw9ff/21xYbS2YqNjcWhQ4ewdOlSh4yFZVk0NjZCoVCgsLDQ6bMJLMvizp07OHXqFFQqlc3joqOjsW/fPp+oLDY+Po779+9DJpPhyQ+l3oRCIfLy8lBcXIwFCxa4eYRewJ+CoBUMw3Bdg6dWyFIqldzSRHNH+6kJiEQioV4hhHip7u5P0dU1//iXkvIpkpO9L/45AyUaVpSXA0eOTCxVtme5skAw8eezzzzyIR6HYRjU1NQgODgYeXl5Xn9zaY1
er8c333yDhoaGOZ2/adMm/OhHP3LYk/AnT56gubkZ69atc/n+CJPJhKtXr+L8+fMWZUSnSk5ORmlp6Zz3iXianp4eVFdX48aNG1xPjqysLEilUrzxxhu0JGYmvh4E54hlWQwMDFhNQhQKBfd7BgAikchqEkK9QgjxbHJ5OTo6joBhTLBvz4YAfL4A6emf0UzGJJRo2NDVBXz8MVBVNfG+OdN7rfnrJSXAF1949p4MtVqN6upqFBQUOHS/gSd5+vQpjh07NuNTfFvCwsLw05/+FKtXr3bIWBQKBa5fv47U1FS3V3waHh7GuXPnUFtbyy0NsWbVqlU4cOAAJBKJC0fnPKOjo7h+/Tqqq6u5nhwxMTFcTw5fbUI5b74aBJ2EZVkMDQ1ZzH6YP+/r67NI8iMjIy0SkMlJSGhoqBu/C0IIMLFno739Y2g0VQAEmDnhmPi6SFSCjIwv/H5PxlSUaLxGSwvw+efAxYsT/awm/7R4PGDpUmDHjoky8Z5cwpZlWdy+fRuDg4OQSqUO22/gScbHx3H+/HlcuHBhTmVrly9fjg8//NAhS5pGR0dRU1ODiIgI5OXledTPu7e3FydPnsTDhw9tHsPn8yGVSrFr1y6bvTy8jbknR3V1NR49esT15Fi3bh2kUqnPVlqbN18Jgm7Esiy0Wq3VWRClUomRkRHu2LCwMKuzIBKJBGFhYT45A02Ip9JqWyCXfw61+uIPTf0m31vwIBQuhVi8A4mJn/h1CduZUKJhh5ERoKMDMBiA4OCJZrre0KDYXLb2jTfeQGpqqruH4xR9fX04duwYnj17Zve5gYGBKC0txebNm+f9Jm4ymXDt2jXodDoUFhZ69NPJtrY2VFRU4OXLlzaPCQ0Nxdtvv43Nmzf71MZXaz05lixZwvXkoPX1NnhrEPRw5l4h1vqFTO4VIhQKbSYhkZGRlIQQ4kQm0wh0ug6wrAE8XjBCQtIgEFD8ex1KNHxca2srOjo6sH37dp9cF8yyLOrq6lBRUWGxPnq2kpKScOjQISQkJMx7HA8fPkR3dzfy8/MRGxs7r+u5irkT+enTpy1uaKaSSCTYv38/Vq1a5VM3M9Z6coSHh6OwsBBFRUWIiYlx8wiJvzMYDNM2pJuTkMm9QoKCgqYlIObPRSKRT/27JYR4D0o0fJTRaMT333+PxMRErFy50t3DcYqhoSH8+c9/xqNHj+w+l8fj4a233sLbb7897yf1z58/x507d/DGG284rEKVqxkMBly+fBnffffdjH1G0tPTUVZWhuTkZBeOzvlYlkVXVxfXk2N8fBw8Hg8rV66EVCqlnhzEIxmNRqhUKqtd09Vq9bReIdb6hVCvEEKIM1Gi4YNevnyJW7du+XTZ2gcPHuDrr7/G8PCw3eeKxWJ89NFHSE9Pn9cYNBoN6uvrkZCQgLVr1/rEjahGo8Hp06dx48aNGY/buHEj9u7d65NduIeGhlBfX4+amhquJ8eCBQtQXFyMvLw86slBvILJZOLK9E5NQlQqFcbHxwFM7Mcy9wqZmoRQrxBCyHxRouFDzN2vAwMDkZ+f7xM3vlMZDAZUVFRwDe/slZeXh3fffXdeN4sGgwG1tbUQCAQoKCjwyfX83d3dqKysRHt7u81jAgMDUVJSgrfeessnl+WNj4/jwYMHkMlk3M/BXBK6uLh43svtCHEXc6+QqQmI+Y95VpPH4yEmJsbqnpDY2Fivb/TpCLW1tfj973+PO3fuoLe3F6dOncLevXvdPSxCPAYlGj6iv78fMpkMmzZt8tmmZF1dXTh27BhXotQeoaGh+OlPf4o1a9bM+fUZhsGtW7fQ39+PwsJCny+Lat53UllZOePPPDIyEnv37kVeXp7PLsGQy+WQyWS4efMmDAYDgImeHMXFxVi5cqXPft/E/5h7hVjrmq5UKrnff2Ci2efUWRDzEi1/mfm7ePEiGhoasHbtWuzfv58SDUKmoETDB9y+fRv9/f3YsmWLT05zMwyDCxcu4Pz58zP2f7Bl2bJ
lOHjwIKKjo+c8hra2NrS1tWH9+vVITEyc83W8kclkQk1NDc6dO8dVaLJm0aJFKC0txTIfLnGq0+lw/fp1yGQyLvkSiUTYvHkzCgoKfD75JP6NZVkMDw9bTUIUCgV0Oh13bGRkpMW+kMkJiSdX45sPHo9HiQYhU1Ci4cVGR0dRVVWFnJwcr92E/DoKhQLHjh1DV1eX3ecKBALs378fW7ZsmfMyslevXuHGjRvIyMhAdnb2nK7hK7RaLS5cuACZTMat77YmJycHpaWlPr20iGVZtLa2QiaTUU8OQjDxb2J0dNTqLIhSqbTYTxcWFmaza3p4eLjXLvulRIOQ6SjR8FKPHz9Ge3s7SkpKfHKKmmVZNDQ04JtvvrGYqp+tRYsW4fDhw3OefRgZGUFtbS2io6OxceNGWhoziUKhwMmTJ3Hv3j2bx/D5fBQVFeHtt9/2+af8KpUKtbW1qK+vh1arBQAkJydDKpVi3bp1PrmHhxB76XQ6q80KFQoFBgcHueOEQqHNJCQqKsqjkxBKNAiZjhINL2MymfD9998jPj4eq1evdvdwnGJ4eBhff/01Hjx4YPe5PB4P27dvx+7du+e0jMxkMqG+vh5jY2MoKiryySTOUZ48eYKKigp0d3fbPEYoFGLnzp3YsmWLz99wG41GrifH8+fPAUw8uS0oKMDmzZshFovdPEJCPJO5V4i1poUajYYr0xsYGDhtL4j5c5FI5PYHQpRoEDIdJRpepKenBzdu3MDWrVvntd/AkzU1NeGrr76asXmcLTExMfjoo4+QkZFh97ksy+LevXvo6elBQUGBT5ZtdQaWZXHr1i2cOnXKonnYVGKxGPv37/eZMsAzMffkqK6uxu3bt7meHG+88QakUimysrJ8/mdAiKOYe4VYmw1Rq9Xcvj2BQIDY2FirFbJiYmIQEBDg9LFSokHIdJRoeAFz92sej4eCggKfvEkZGxtDZWUlampq5nT+hg0b8O67785pk2FXVxfu37+P1atX09r6ORobG8P333+PS5cuzbjULTU1FWVlZUhNTXXh6NzHWk+O+Ph4SKVS6slByDyNj49DrVZPS0IUCsW0XiFisdhmmV5HFVGhRIOQ6SjR8HAajQZXr15Ffn6+z26u7e7uxtGjR9HX12f3uaGhofjJT36C3Nxcu89Vq9VoaGjA4sWLsWrVKp9M4FxtaGgIZ86cQUNDA2YKLevWrcP+/fv9ZjkRwzC4f/8+qqur8fjxYwATPTk2btyI4uJiv6tkRoizMQwDjUZjsSF98kb1qb1CJicgkz9/Xa+QkZERdHR0AABWr16NP/zhD5BKpYiJiUFSUpLTv09CPB0lGh7s7t27UCqV2Lp1q8+Wrb106RK+/fbbOZWtzcrKwsGDB+1e5qTX61FTUwOhUIhNmzb55M/W3V6+fInKykq0trbaPEYgEGDr1q3YsWMHQkJCXDg695LL5aiursaNGze42Z/MzExIpVLqyUGIC7Asi8HBQatd0xUKxbReIda6ppt7hVRXV0MqlU57jQ8//BDHjx934XdFiGeiRMMD6XQ6XL58GdnZ2UhPT3f3cJxCpVLh2LFjePr0qd3nCgQC7Nu3D1u3brVrFoJhGFy/fh1DQ0MoKipCWFiY3a9NZo9lWTQ3N6OyshK9vb02jwsPD8c777yDoqIiv7rJ1ul0uHHjBmQyGTebJxKJUFRU5BcNIQnxRCzLYmRkxGYSMrmXUEREhM0khN5fCJlAiYaHefLkCVpbW1FSUuKTT3lZlsX169fxj3/8Y05laxcuXIhDhw5h0aJFdp3X3NyMjo4ObNy4EfHx8Xa/Lpk7hmFQV1eHb7/91qKW/lQJCQkoLS3F8uXL/WoZG8uyaGtrg0wmw8OHD7meHGvXrkVxcTFSUlL86udBiCfTarXTEhDz3yfHt9DQUKt7QuLi4hAREUH/ponfoETDQ5hMJly5cgVxcXFYs2aNu4fjFCMjI/jLX/4yY/+FmWzbtg179+61q0xqT08PGhsbkZ2
dPadqVMRxdDodLl68iCtXrsBkMtk8btmyZSgtLbU7mfQFarUaNTU103pyFBcXIzc31+dLBBPizfR6vdVZEKVSyRWDACb2Z1mbBZFIJB7fK4QQe1Gi4QF6e3tx7do1ny5b29zcjOPHj8+pbG10dDQ++ugjZGVlzfqcoaEh1NbWIi4uDuvXr6fA7UFUKhVOnTqF27dv2zyGx+Nh06ZN2LNnDyIjI104Os9gNBpx+/ZtyGQyrk8J9eQgxHuNjY1BpVJZTUL6+/steoVM3pA+OQnxhF4hhNiLEg03YlkW9fX1YFkWhYWFPnkzbDQaceLECchksjmdv27dOrz33nuzLltrNBpRW1vL/UyDg4Pn9LrE+To7O1FRUYHOzk6bxwQHB+Ott97Ctm3bXlv9xVc9e/YMMpkMt2/fhslk4npyFBcXY9myZT4ZNwjxJyaTiUtCJicgSqUSKpWKK5YSEBDA9QqZWiFLLBa7pFcIIfaiRMMOIyNARwdgMADBwUBaGhAePrdrDQwM4OrVq9i4caPPlrZ8/vw5jh07NuNGYFuEQiF+8pOfzHo2gmVZ3L59G319fSgoKPDZmSFfw7Is7ty5g5MnT0KtVts8TiQSYe/evdiwYYPf3lgPDw9zPTnMzRHj4+NRXFyMvLw81+zpcmQQJIS81vj4OPr7+6clIeZeIeZlqHw+HzExMdNmQeLi4hAbG0vLLh3AZBqBTtcBljWAxwtGSEgaBAKKf69DicZrtLQAn38OXLgAdHYCk39aPB6Qmgrs3An84hdAdvbsrnnv3j0oFAqfLlt7+fJlnD17lmuYZI+MjAwcPHhw1stDnjx5gqamJqxbtw6LFy+2+/WI+xmNRly9ehUXLlyAXq+3eVxycjLKysp8thrbbDAMgwcPHqC6uhptbW0AJmZ+NmzYAKlU6vgHF84IgoSQeTP3Cpm8IX3yHpHJvUJEIpHVPiFxcXE08z8DrbYFcvnnUKsvQK/vBDD5lpkHoTAVYvFOJCb+AmFhFP+soUTDhq4u4OOPgaoqQCAAZti7yn29pAT44gsgJcX6cXq9HlVVVcjIyEBmZqZzBu5marUaX375JZ48eWL3uQEBAdizZw9KSkpmtQ5VqVTi2rVrSElJwYoVK/z2SbcvGR4exrlz51BbWztjb5XVq1dj//79kEgkLhyd5+nt7UV1dTWuX7/OVXHLyMjgenLMaymFM4IgIcQlzL1Cpi7FMichkx/oREVF2ayQ5YvVL2dDp+tCe/vH0GiqAAgAzBD/fvi6SFSCjIwvEBJC8W8ySjSsKC8HjhyZeN+c6b11KoFg4s8f/wj87GeWX+vo6EBzczNKSkpmvd/Am7Asi5s3b+Lvf//7jE+kbUlISMDhw4dnNSMxOjqKmpoahIeHIz8/n9al+qDe3l6cOHECjx49snlMQEAAiouLsWvXLr+vWa/X63H9+nWLnhzR0dHYvHkzCgoK7N9Q74wgSAjxCOZeIdZmQZRKJVfxDpjoc2QtCZFIJAgNDfXJB3xyeTk6Oo6AYUyYOcGYSgA+X4C0tD8iMZHinxklGlN8+inw29/O/zq/+x3wm99MbPK6evUqYmJisG7duvlf2ANptVr89a9/xZ07d+Z0/tatW7Fv377XriEdHx9HQ0MDdDodCgsLfTJhI5ZaW1tRWVmJly9f2jwmNDQUb7/9NjZv3uyTSxHtwbIsHj9+DJlMhgcPHoBlWQQEBGDt2rWQSqWz68nh6CBICPEqo6OjNpOQyZUjQ0NDpy3DMich3torpLv7U3R1zT/+paT8DsnJFP8ASjQslJcDP/+54673f//vIJKTv4dUKkVMTIzjLuxBWltbcfz4cYsa4bMVHR2NgwcPYtmyZTMex7IsHj58iGfPnmHTpk2IjY2d42iJNzJ3dD99+vSM5ZElEgkOHDiAlStXeuUbnKP19/ejtrYWdXV1GBkZAQAkJSWhuLgY69evt57YOzoIlpcDhw877nqEELcy9wqx1rTQXKQCmNg3ZqtrenR
0tEfGaLm8HO3tjot/mZnlSEig+EeJxg+6uib2Mc5h1Y8NLIKCGLS28pGa6nn/oObLaDTi1KlTuHLlypzOX7NmDd5///3XLnl5/vw57ty5gzfeeANLly6d02sR32AwGPDdd9/h8uXL3CZHazIyMlBaWork5GQXjs5zGY1G3LlzBzKZDM+ePQMw0ZNj06ZN2Lx5838k7o4PgoBQOLGZnPZsEOLzjEaj1SREoVBM6xViLtM7NQmJiYlxS68Qna4LjY3ZYBjHxT8+X4jc3Ba/37NBicYPtm8HZDL7liO/jkAASKXA5cuOu6YnePnyJY4ePQq5XG73uUKhED/+8Y9fW6Z0YGAAdXV1SEhIwNq1az3y6QdxD41Gg9OnT+PGjRszHrdx40bs3bsXIpHIRSPzfNZ6cqxYsQLFxcXI/i//BTwKgoQQJzCZTFCr1VaTEGu9QqxtTBeLxU5bHvvgwXZoNDLYtyfjdQQQiaRYudK/4x8lGph44LZ8uXOv/5rVQV6BYRh8//33OH369JzK1qalpeHQoUMzlq01GAyoq6tDQEAACgoKqPY3sam7uxsVFRUzVjgLDAzE9u3b8eabb1IJx0mGh4fR0NCA6upqaDQaJGg0+J8VFc57QV8JgoQQh2MYhusVYq1poblXCI/Hg1gstto1fT69QrTaFjQ2Ou8mMDe3BWFh/hv/KNEA8KtfAX/6k2Mf5JkJBMAnnwD/+q+Ov7Yr9ff348svv0R7e7vd5/L5fOzZswfbt2+3OSXKMAxu3boFtVqNoqIiREREzHfIxA+wLIsHDx7gxIkTUCgUNo+LjIzE3r17kZeX55ZpeU/FMAwePnwI9sgRvNHQgABnvB34ShAkhLgcy7IYGBiwmoQoFAqMjY0BmEhCoqOjrSYhr+sV8uTJr9DT8yc4djbDTICFCz9Berr/xj9KNDDR3PbpU+defw5tJTzGrVu38Le//Q06nc7ucxcsWIDDhw8jKSnJ5jFtbW1oa2vD+vXrfbZLOnEuk8mEmpoanDt3DqOjozaPW7RoEUpLS19bgMDvUBAkhHgZlmUxNDQ0rU+IUqlEX1+fRan9yMhIiwRkchLy8OEb0OudF/+EwjRs3Oi/8c/vE43hYSAqyrLZraPxeMDQEBDuZZ3qR0dH8be//Q2NjY1zOl8qlWL//v0ICgqy+vW+vj5cv34d6enpWO7MtWvEb2i1Wpw/fx4ymWzGhn8rVqzAgQMHkJCQ4MLReSgKgoQQH8OyLLRardVZEKVSyVXiEwjGUFp6HM7dBspDQcEQBAL/jH9+n2jcvw+sXu3817l3D1i1yvmv4yhtbW04fvy4Rbm62YqMjMTBgwdtJg8jIyOora1FdHQ0Nm7cSEtZiMMpFAqcPHkS9+7ds3kMn89HUVER3n77bf9eqkdBkBDiZ8y9Ql69qodO977TX2/t2nuIiFjl9NfxRP7d3QqAweBbrzNfJpMJp0+fRlVV1ZzOX716Nd5//32EW3lyaTKZUF9fj7GxMWzZsgVCoXC+wyXEKolEgl/84hdob29HRUUFnj9/Pu0YhmFQXV2NGzduYNeuXZBKpf5ZfICCICHEz4SGhiI5ORki0Svcvev812NZ/41/fp9ouKoQjTcUvOnp6cHRo0fR09Nj97nBwcF49913kZeXN60ULcuyuHfvHnp6erBp0yafbV5IPE9GRgZ+/etf4+bNmzh16pTVxpJ6vR4nTpxAdXU19u/f73/llF0UnO63tiIsJgZxcXGIioryr58xIcQj8XiuiX+ueh1P5PdLp0ZGgMhI/16ezLIsrly5glOnTnFl5OyxdOlSHDp0yGrH7mfPnuHevXtYvXo1lixZ4oDREjI3Y2Nj+P7773Hp0iUYZni6npqairKyMqSmprpwdG7kgiDIAvjPH30Eww8zRkFBQVbr5EskEohEIkpCCCEuYTKNoL4+EhNRylloj4ZfJxqAfxdc0Wg0OH78ONra2uw+l8/n45133sFbb701bZ+FWq1GQ0MDFi9ejFW
rVtGNA/EYg4ODOHPmDK5du4aZwl9ubi727ds3Y98Xn+GCIGhsaYFKpZpWIUahUECtVnP/LwQCAVcVZmoSIhaLaU8XIcShbtxIo6pTTuT3S6cAYOdO5/bR2LHD8dd1hNu3b+Ovf/3rjOVAbYmPj8ehQ4emzVLo9XrU1NQgODgYO3fudFoXT0LmKioqCh988AG2bNmCyspKtLa2Wj2usbER9+7dw9atW7Fjxw6EhIS4eKQu5IIgGBgYiISEBKuVvkwmE9ewa3IC0tTUBJVKxTUI5fP5VrsGm5MQijeEEHuJxTud2kdDLPbQm0AXoRkN+F9ncJ1Oh7///e+4efPmnM4vKipCaWmpRQMchmFw/fp1DA0NoaioCGFhYY4aLiFOw7IsmpubUVFRgVevXtk8LiIiArt370ZBQYFvPlH34CDIMAw0Gs20JMQ8K2I0GgFMNOyK+WEPyNQkJDY21maZbUKIf6PO4M5FicYPtm8HZDLHPtATCACpFLh82XHXnK/29nZ8+eWX6O/vt/vciIgIfPjhh1ixYoXFf29ubkZHRwc2btyI+Ph4Rw2VEJcZHx9HXV0dvv32W66+ujUJCQkoLS3F8uXLfW85oBcGQXPXYGt18hUKhcVenOjo6GnNusx/pwp4hPi3Bw+2Q6ORwbGzGgKIRFKsXOlBN4FuQInGD7q6gOxsYFIjyXkTCice5KWkOO6ac2UymXD27Flcvnx5xnXptqxcuRI//elPLfoNyOVy3Lp1C8uWLUNmZqYjh0uIW+h0Oly8eBFXrlyZsTDCsmXLUFZWhoULF7pwdE7mY0GQZVkMDw9PmwUxf5y8ZDQiImLaLIg5IaHZWUJ8n07XhcbGbDCM4+Ifny9Ebm4LQkI84CbQjSjRmKS8HPj5zx17vcOHHXe9uZLL5Th27BhevHhh97lBQUH40Y9+hIKCAu4J7tDQEGpraxEXF4fc3FzfXEpC/JpKpcKpU6dw+/Ztm8fweDwUFBRg9+7diIyMdOHonMhXg6AVWq3WZhIyPDzMHRcaGmo1CZFIJAgPD/e9mS1C/JRcXo72dsfFv8zMciQkeGb8cyVKNKb49FPgt791zHV+/ev5X2c+WJaFTCbDiRMn5lS2NiUlBYcOHYJEIgEAGI1G1NXVgWEYFBYWWuzRIMQXdXZ2oqKiAp2dnTaPCQ4OxltvvYWSkhLfaPjnS0FwjnQ6nUXiMfnzyb1YhEKhzTK91CuEEO/T3f0purrmH/9SUj5FcrJ3xj9Ho0TDivJy4MiRiaXK9tyfCwQTfz77zP0P8QYGBnD8+HGbFXVmwufzsWvXLuzcuRN8Ph8sy+L27dvo6+tDQUEBoqOjHT9gQjwUy7K4c+cOTp48CbVabfM4kUiEffv2Yf369d5/g+kLQdBJDAaDRZneyR81Gg23NDUwMNDqLEhcXBxEIhHNBBPioeTycnR0HAHDmGDfng0B+HwB0tM/o5mMSSjRsKGrC/j4Y6CqauJ9c6b3WvPXS0qAL75w/56Mu3fv4i9/+Qu0Wq3d50okEhw6dAgpP3wTHR0dePToEdatW4fFixc7eqiEeA2j0YirV6/iwoUL0M+wjyE5ORllZWVIT0934eicwJuDoJsYjUao1WqrSYharQbDMAAmeoWIxWKrSYhYLEZAQICbvxNC/JtO14X29o+h0VRhohPETAnHxNdFohJkZHzh93sypqJE4zVaWoDPPwcuXpzoZzX5p8XjAUuXTvTJ+OQT95ew1ev1+Mc//oHr16/P6fzCwkKUlZUhODgYSqUS165dQ0pKClasWOH9T2gJcZDh4WF8++233DJCW1avXo39+/dzSw+9ljcFQQ82Pj4OtVptdUmWSqXilrfy+XwuCZnatDA2NtY3lucR4iW02hbI5Z9Drb74Q1O/ybfMPAiFSyEW70Bi4id+XcJ2JpRo2GFkBOjoAAwGIDh4opluuId0lO/o6MCxY8dmXNphS3h4OD744AOsXLkSo6OjqK2tRVhYGPLz8+nJGiE29Pb
2orKyEk1NTTaPCQgIgFQqxa5duxAaGurC0TmJJwdBL2buFTJ1FsT8+eReISKRyOqekNjYWNo3R4gTmUwj0Ok6wLIG8HjBCAlJg0BA8e91KNHwciaTCefOncOlS5fmVLY2JycHH374IcLCwnDt2jWMjo6isLDQN26KCHGB1tZWVFRUoKenx+YxYWFh2LVrFzZv3kzdq4ldWJbF4OCgzSRk8jK+qKgoq0lIXFycb3e2J4R4LEo0vNirV69w9OhRPH/+3O5zAwMDubK1TU1N6OrqQn5+PuLi4pwwUkJ8G8MwuHbtGs6cOYOhoSGbx0kkEpSWluKNN96g5Yhk3liWxcjIyLSlWOa/T96nFxERYZF4TN6oHhoaSr+PhBCnoETDC7Esi5qaGlRWVnJT6vZITk7G4cOHMTY2htu3b2PFihVIS0tzwkgJ8S96vR7fffcdqqqqZvy3mZGRgbKyMiQlJblwdMTfmHuFWOsXMrVXyNRZEPPnERERlIQQQuaMEg0vMzQ0hK+++mrGdeG28Hg87NixAwUFBbh+/ToWLFiAtWvX0psIIQ6m0Whw+vRp3Lhxw+YxPB4PGzduxN69e6lkNHE5vV5vMwmZ3CskODjYZhISHR3t9+8f//t//2+cPHkSbW1tCAkJQX5+Pv7P//k/yMzMdPfQCPEIlGh4kXv37uHrr7+eU9na2NhYvPfee5DL5eDz+SgsLKTqJYQ4WXd3NyoqKvDkyRObxwQGBuLNN9/E9u3baTMv8QhjY2Ncr5Cpy7L6+/un9QqxtickJibGL3qFvPXWW3j33XeRm5sLk8mEX//612hqakJLSwvCwsLcPTxC3I4SDS+g1+vxzTffoKGhYU7n5+XlISUlBSMjIygsLERkZKSDR0gIsYVlWdy/fx8nTpyAUqm0eVxUVBT27NmDvLw8v7hBI97JZDJxvUKm9gtRqVRcyeeAgADExsZabVoYExPjs0URlEolJBIJampqUFRU5O7hEOJ2lGh4uM7OThw9ehQqlcruc8PCwlBYWAgej4f169cjMTHRCSMkhMyGyWRCTU0Nzp07h9HRUZvHLVq0CGVlZcjKynLh6AiZP4Zh0N/fbzUJUSqVXK8QHo8HsVhsNQnx9l4hHR0dSE9Px6NHj5CTk+Pu4RDidpRoeKjx8XGcP38eFy5cmFPZ2qSkJCxZsgSrVq3C8uXLnTBCQshcaLVanD9/HjKZbMaGf2+88QYOHDiABQsWuHB0hDgHwzAYGBiYthTL/HFsbAzARBISHR1tkYBMXpLlycsLGYbB7t27MTAwgPr6encPhxCPQImGB+rr68OxY8fw7NmzOZ2/ZMkSFBUV0RIMQjxYX18fTp48ifv379s8hs/no6ioCO+88w7CqTEe8VEsy2JoaGjaLIh5ZmRyr5DIyMhpsyDmZMTd/Z8++eQTXLx4EfX19Vi0aJFbx0KIp6BEw4OwLIu6ujpUVFRwT3dmi2EYMAyDbdu2Yd++fRAKhU4aJSHEkdrb21FRUTFjP5yQkBDs3LkTW7Zs8dm17YRYw7IstFqtzSRkcnGUsLAwq0mIRCJBWFiYUytk/fKXv8SZM2dQW1uLlJQUp70OId6GEg0PMTQ0hK+//hoPHz606zyWZdHf34/MzEz86le/Qnx8vJNGSAhxFpZlcfPmTZw6dcqitOhUsbGx2L9/P9asWeP3ZUUJAYDR0dFpe0HMScjk5pkhISFWl2JJJBJERkbO+d8Ty7I4cuQITp06herqaqSnpzvqWyPEJ1Ci4QEePnyIP//5zxYNlGZjeHgYBoMBv/zlLyGVSp00OkKIq4yNjaGqqgqXLl2acVZz6dKlKCsroyenhMzAYDBYnQVRKpXQaDTccUFBQVZnQSQSyWt7hfzTP/0T/va3v+HMmTMWvTOioqIQEhLi1O+PEG9AiYYbGQwGVFRUoK6uzu7zXr16hY0bN+K///f/7vZ1qYQQxxoYGMDZs2dx7dq1GYtB5ObmYt++fRCLxS4cHSHez2g0cr1
CpiYharWa+3cnEAiszoKYy/QGBARYvf6XX36JgwcPuvA7IsQzUaLhJs+ePcPRo0ehUChmfc74+Dh6e3sRGhqK//bf/hs2bNjgxBESQtzt5cuXqKioQFtbm81jBAIBtm3bhh07dtDeLEIcwNwrZOpsiHlplrlaHJ/PR2xs7LQlWRKJBGKxmPZTEQJKNFyOYRhcuHAB58+fn7G05WQsy0KhUMBgMKC4uBgff/wxoqOjnTtQQohHYFkWTU1NqKysxKtXr2weFxERgd27d6OgoICqzRHiJOZeIVNnQcwfJ/cKiYmJmTYLYk5IvLlXCCH2oETDhRQKBY4dO4aurq5Zn6PRaDA4OIjExES8//772LJlC20CJcQPjY+Po66uDmfPnrWotDNVQkICysrKqH8OIS7GsiwGBgZsJiEGg4E71twrxFoSQjOTxJdQouECLMuioaEB33zzjUWgmYlWq4VSqUR0dDRycnJw+PBh6uxNCMHo6CguXryIq1evck9PrcnOzkZpaSkWLlzowtERQqxhWRbDw8M2y/TqdDru2MjIyGl7QswfaU8m8TaUaDjZ8PAwvv76azx48GBWx4+NjeHVq1cIDg5GfHw8tm/fjj179tBaT0KIBZVKhVOnTuH27ds2j+HxeCgoKMDu3bsRGRnpwtERQmaLZVmMjo5anQVRKBQYGRnhjg0LC5s2C2L+GB4eTiseiMehRMMOIyNARwdgMADBwUBaGjBTs96mpiZ89dVXFrW8bWEYBr29vQCABQsWIDY2FocOHUJGRoajhk8I8UFPnz5FRUXFjEsyg4ODsWPHDmzbtm1+a8PtDYKEkHnT6XRWN6YrFAoMDg5yxwmFQptJSFRUFCUh82QyjUCn6wDLGsDjBSMkJA0CAcW/16FE4zVaWoDPPwcuXAA6O4HJPy0eD0hNBXbuBH7xCyA7e+K/j42NobKyEjU1Na+9PsuyUKlUGB0dxYIFCxAcHIz169fjxz/+MU2REkJmhWVZ3L59GydPnkR/f7/N40QiEfbt24f169fP/qZjLkGQEOIS5l4h1poWajQarkxvUFCQReIx+XORSEQFJGzQalsgl38OtfoC9PpOAJNvmXkQClMhFu9EYuIvEBZG8c8aSjRs6OoCPv4YqKoCBAJghqXQ3NdLSoB/+ZceXL78Bfr6+l77GkNDQ1Cr1dyUZ0hICN577z3k5uY68DshhPgLo9GIK1eu4OLFi9Dr9TaPW7JkCUpLS2fuYjzXIPjFFwA1EiTE7cy9QqztCenv7+cqXwoEAosyvZM/isViv0xCdLoutLd/DI2mCoAAwAzx74evi0QlyMj4AiEhFP8mo0TDivJy4MiRiffNmd5bp+LzGfB4Jmza9A9kZTXYPE6v1+PVq1eIiIhATEwMeDweMjMz8dFHH0EkEjngOyCE+LPh4WGcPXsWdXV1Mzb8W7NmDfbv34+4uDjLL8w1CAoEE3/++EfgZz+b4+gJIc42Pj5utVeIQqGASqXC+Pg4gIleIWKx2GoSEhsb65P7R+XycnR0HAHDmDBzgjGVAHy+AGlpf0RiIsU/M0o0pvj0U+C3v53PFVgAPKxbdxpr1ly0+IrJZEJvby8EAgEWLFgAHo8HgUCAvXv3Ytu2bbR+khDiUHK5HCdOnEBTU5PNYwICAiCVSrFr166J5ZrzD4ITfvc74De/mf91CCEuxTAMNBrNtKVY5r8bjUYA/9ErxNaSrKCgIDd/J/br7v4UXV3zj38pKb9DcjLFP4ASDQvl5cDPf+646xUV/RlZWQ1gWRavXr2CyWRCQkIC9wQgMTERhw8fxqJFixz3ooQQMkVLSwsqKiogl8ttHhMWFoaf83hY9oc/OO6Fy8uBw4cddz1CiFuxLIvBwcFpsyDmz6f2Cpk6C2L+3BN7hcjl5Whvd9xNYGZmORISKP5RovGDrq6JfYwzLGu2E4uAACNKSv4/MMxTxMfHIyQkhPvqtm3bsHfvXuoOSghxCYZh0NDQgLNnz1qthCceGsL
/rKhA4Pg4HDa3KhRObCanPRuE+DyWZTEyMmIzCRkdHeWOjYiIsJmEhIWFuXzsOl0XGhuzwTAOuwkEny9Ebm6L3+/ZoETjB9u3AzKZfcuRX4fHM0EiacaePf+P+2/R0dH46KOPkJWV5bgXIoSQWdLr9fjuu+9QVVXFLYEAgF+dP48suRwBjnxLEAgAqRS4fNlx1ySEeCVzI2JrZXqHh4e540JDQ63uCYmLi0NERIRTlpk/eLAdGo0M9u3JeB0BRCIpVq707/hHiQYmHrgtX+6865eV/Q+IRK+wbt06vPfee1S2lhDidv39/Th9+jRu3ryJBI0G/7Oiwnkv1tICLFvmvOsT4ia1tbX4/e9/jzt37qC3txenTp3C3r173T0sr6PX663OgiiVSgwMDHDHBQcHW50FkUgkc+4VotW2oLHReTeBubktCAvz3/jne+UC5uDzz19fvXGueLxxtLdvwRdfCO2rXU8IIU4UExODQ4cOYcuWLVC//z7GeTzHzmaYCQTAn/4E/Ou/Ov7ahLiZVqvFypUrcejQIezfv9/dw/FaQqEQixcvxuLFi6d9bWxsDCqValoS0tjYiP7+fq6yXmBgoMWG9MlJyEy9QuTyz/H6ErZzJYBc/iekp/tv/KMZDUw0t3361HnXT0kZR2dngPNegBBC5oFNSwPPmUEwLQ148sR51yfEA/B4PJrRcDGTycQlIVMbF6pUKq5XSEBAANcrZGqFrM7OvB+a8TmHUJiGjRv9N/75/YzG8PBEs1tnevYsACMjQDh1qieEeJrhYfCcHQSfPgUFQUKIo5nbBSxYsGDa18bHx9Hf3z9tKVZzczNUKhVMJhMEgjGUlnbCmYtN9PqnMJlGIBD4Z/zz+0Tj6VPA2XM6LAt0dACrVjn3dQghxG4uCoK9dXUwOnMzHCEeQKlU4vnz5+4eBpkkIiICERERSE1N5f4bwzAYGhqCSnUDPN5xJ4+AhU7XgYiIVU5+Hc/k94nGpJLPPvE6hBBiFxcFp+P/9m94JpG45LUIcZfKykrcvn3b3cMgsyQWK7B9u/Nfh2X99ybQ7xON4GDfeh1CCLGLi4LTwf/0n2hGg/i0f/u3f0NpaSnefPNNdw+FzJLB0IyentNOfx0ez39vAv0+0UhLA3g8564c4PEmXocQQjyOi4JgQmEh7dEgPi8uLg5JSUnuHgaZJZMpBj09PADOXD7KQ0iI/94EWq/15UfCw4FJy/acYulSen8lhHgoCoKEzNnIyAju37+P+/fvAwC6urpw//592qfhJQSCcAiFzo1/QuFSv90IDlCiAQDYuXOi1LszCATAjh3OuTYhhDgEBUFC5uT27dtYvXo1Vq9eDQD4r//1v2L16tX4l3/5FzePjMyWWLwTzlvgI4BY7N/xj/powPmdwakpLiHEo1EQJIT4KeoM7lw0owEgOxsoKXH8Az2BYOK69P5KCPFoFAQJIX4qLCwbIlEJHD+rIYBIVOLXSQZAMxqcrq6J91q93nHXFAonHuSlpDjumoQQ4hQUBAkhfkqn60JjYzYYxnHxj88XIje3BSEh/h3/aEbjBykpwB//6NhrfvYZvb8SQrwEBUFCiJ8KCUlBWppj4196+md+n2QAlGhY+NnPgN/9zjHX+vRT4PBhx1yLEEJcgoIgIcRPJSb+DCkpjol/KSmfIiGB4h9AS6esKi8HjhwBTKaJP7MlEEz8+ewzen8lhHgxCoKEED8ll5ejo+MIGMYEwI74BwH4fAHS0z+jJGMSSjRs6OoCPv4YqKqaeN+c6b3W/PWSEuCLL2ilACHEB1AQJIT4KZ2uC+3tH0OjqcLEJvGZEo6Jr4tEJcjI+IKWS01BicZrtLQAn38OXLwIPH1q2TyXx5voQ7VjB/DJJ1RYhRDigygIEkL8lFbbArn8c6jVF6HXP4VlB3EehMKlEIt3IDHxE7+vLmULJRp2GBkBOjoAgwEIDgbS0qjZLSHEj1AQJIT4KZNpBDpdB1jWAB4vGCEhaX7d8Xu2KNE
ghBBCCCGEOBxVnSKEEEIIIYQ4HCUahBBCCCGEEIejRIMQQgghhBDicJRoEEIIIYQQQhyOEg1CCCGEEEKIw1GiQQghhBBCCHE4SjQIIYQQQgghDkeJBiGEEEIIIcThKNEghBBCCCGEOBwlGoQQQgghhBCHo0SDEEIIIYQQ4nCUaBBCCCGEEEIcjhINQgghhBBCiMNRokEIIYQQQghxOEo0CCGEEEIIIQ5HiQYhhBBCCCHE4SjRIIQQQgghhDgcJRqEEEIIIYQQh6NEgxBCCCGEEOJwlGgQQgghhBBCHI4SDUIIIYQQQojDUaJBCCGEEEIIcThKNAghhBBCCCEOR4kGIYQQQgghxOEo0SCEEEIIIYQ4HCUahBBCCCGEEIejRIMQQgghhBDicJRoEEIIIYQQQhyOEg1CCCGEEEKIw1GiQQghhBBCCHE4SjQIIYQQQgghDkeJBiGEEEIIIcTh/n8xIBfNp6uZCwAAAABJRU5ErkJggg==", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Create a bipartite graph from the adjacency matrix\n", + "G = nx.Graph()\n", + "proc_times = td[\"proc_times\"].squeeze(0)\n", + "job_ops_adj = td[\"job_ops_adj\"].squeeze(0)\n", + "order = td[\"ops_sequence_order\"].squeeze(0) + 1\n", + "\n", + "num_machines, num_operations = proc_times.shape\n", + "num_jobs = job_ops_adj.size(0)\n", + "\n", + "jobs = [f\"j{i+1}\" for i in range(num_jobs)]\n", + "machines = [f\"m{i+1}\" for i in range(num_machines)]\n", + "operations = [f\"o{i+1}\" for i in range(num_operations)]\n", + "\n", + "# Add nodes from each set\n", + "G.add_nodes_from(machines, bipartite=0)\n", + "G.add_nodes_from(operations, bipartite=1)\n", + "G.add_nodes_from(jobs, bipartite=2)\n", + "\n", + "# Add edges based on the adjacency matrix\n", + "for i in range(num_machines):\n", + " for j in range(num_operations):\n", + " edge_weigth = proc_times[i][j]\n", + " if edge_weigth != 0:\n", + " G.add_edge(f\"m{i+1}\", f\"o{j+1}\", weight=edge_weigth)\n", + "\n", + "\n", + "# Add edges based on the adjacency matrix\n", + "for i in range(num_jobs):\n", + " for j in range(num_operations):\n", + " edge_weigth = job_ops_adj[i][j]\n", + " if edge_weigth != 0:\n", + " G.add_edge(f\"j{i+1}\", f\"o{j+1}\", weight=3, label=order[j])\n", + "\n", + "\n", + "widths = [x / 3 for x in nx.get_edge_attributes(G, 'weight').values()]\n", + "\n", + "plt.figure(figsize=(10,6))\n", + "# Plot the graph\n", + "\n", + "machines = [n for n, d in G.nodes(data=True) if d['bipartite'] == 0]\n", + "operations = [n for n, d in G.nodes(data=True) if d['bipartite'] == 1]\n", + "jobs = [n for n, d in G.nodes(data=True) if d['bipartite'] == 2]\n", + "\n", + "pos = {}\n", + "pos.update((node, (1, index)) for index, node in enumerate(machines))\n", + "pos.update((node, (2, index)) for index, node in enumerate(operations))\n", + "pos.update((node, (3, index)) for index, node in enumerate(jobs))\n", + "\n", + 
"edge_labels = {(u, v): d['label'].item() for u, v, d in G.edges(data=True) if d.get(\"label\") is not None}\n", + "nx.draw_networkx_edge_labels(G, {k: (v[0]+.12, v[1]) for k,v in pos.items()}, edge_labels=edge_labels, rotate=False)\n", + "\n", + "nx.draw_networkx_nodes(G, pos, nodelist=machines, node_color='b', label=\"Machine\")\n", + "nx.draw_networkx_nodes(G, pos, nodelist=operations, node_color='r', label=\"Operation\")\n", + "nx.draw_networkx_nodes(G, pos, nodelist=jobs, node_color='y', label=\"jobs\")\n", + "nx.draw_networkx_edges(G, pos, width=widths, alpha=0.6)\n", + "\n", + "plt.title('Visualization of the FJSP')\n", + "plt.legend(bbox_to_anchor=(.95, 1.05))\n", + "plt.axis('off')\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Build a Model to Solve the FJSP\n", + "\n", + "In the FJSP we typically encode Operations and Machines separately, since they represent different node types in a k-partite Graph. Therefore, the encoder for the FJSP returns two hidden representations, the first containing machine embeddings and the second containing operation embeddings:" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "# Let's generate a more complex instance\n", + "\n", + "generator_params = {\n", + " \"num_jobs\": 10, # the total number of jobs\n", + " \"num_machines\": 5, # the total number of machines that can process operations\n", + " \"min_ops_per_job\": 4, # minimum number of operations per job\n", + " \"max_ops_per_job\": 6, # maximum number of operations per job\n", + " \"min_processing_time\": 1, # the minimum time required for a machine to process an operation\n", + " \"max_processing_time\": 20, # the maximum time required for a machine to process an operation\n", + " \"min_eligible_ma_per_op\": 1, # the minimum number of machines capable to process an operation\n", + " \"max_eligible_ma_per_op\": 5, # the maximum number of machines capable to 
process an operation\n", + "}\n", + "\n", + "env = FJSPEnv(generator_params=generator_params)\n", + "td = env.reset(batch_size=[1])" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "torch.Size([1, 60, 32])\n", + "torch.Size([1, 5, 32])\n" + ] + } + ], + "source": [ + "encoder = HetGNNEncoder(embed_dim=32, num_layers=2)\n", + "(ma_emb, op_emb), init = encoder(td)\n", + "print(ma_emb.shape)\n", + "print(op_emb.shape)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The decoder returns logits over a composite action-space of size (1 + num_jobs * num_machines), where each entry corresponds to a machine-job combination plus one **waiting** operation. The selected action specifies which job is processed next by which machine. To be more precise, the next operation of the selected job is processed. This operation can be retrieved from __td[\"next_op\"]__:" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "tensor([[ 0, 4, 10, 15, 21, 27, 33, 39, 45, 49]])" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# next operation per job\n", + "td[\"next_op\"]" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "torch.Size([1, 51])\n" + ] + } + ], + "source": [ + "decoder = L2DDecoder(env_name=env.name, embed_dim=32)\n", + "logits, mask = decoder(td, (ma_emb, op_emb), num_starts=0)\n", + "# (1 + num_jobs * num_machines)\n", + "print(logits.shape)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "def make_step(td):\n", + " logits, mask = decoder(td, (ma_emb, op_emb), num_starts=0)\n", + " action = logits.masked_fill(~mask, 
-torch.inf).argmax(1)\n", + " td[\"action\"] = action\n", + " td = env.step(td)[\"next\"]\n", + " return td" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Visualize solution construction\n", + "\n", + "Starting at $t=0$, the decoder uses the machine-operation embeddings of the encoder to decide which machine-**job**-combination to schedule next. Note that, due to the precedence relationship, the operations to be scheduled next are fixed per job. Therefore, it is sufficient to determine the next job to be scheduled, which significantly reduces the action space. \n", + "\n", + "After some operations have been scheduled, either all the machines are busy or all the jobs have been scheduled with their currently active operation. In this case, the environment transitions to a new time step $t$. The new $t$ will be equal to the first time step where a machine finishes an operation in the partial schedule. When an operation is finished, the machine that has processed it is immediately ready to process the next operation. Also, the next operation of the respective job can then be scheduled.\n", + "\n", + "The start time of an operation is always equal to the time step in which it is scheduled. The finish time of an operation is equal to its start time plus the processing time required by the machine on which it is being processed.\n", + "\n", + "The figure below visualises this process. " + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "env.render(td, 0)\n", + "# Update plot within a for loop\n", + "while not td[\"done\"].all():\n", + " # Clear the previous output for the next iteration\n", + " clear_output(wait=True)\n", + "\n", + " td = make_step(td)\n", + " env.render(td, 0)\n", + " # Display updated plot\n", + " display(plt.gcf())\n", + " \n", + " # Pause for a moment to see the changes\n", + " time.sleep(.4)" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "if torch.cuda.is_available():\n", + " accelerator = \"gpu\"\n", + " batch_size = 256\n", + " train_data_size = 2_000\n", + " embed_dim = 128\n", + " num_encoder_layers = 4\n", + "else:\n", + " accelerator = \"cpu\"\n", + " batch_size = 32\n", + " train_data_size = 1_000\n", + " embed_dim = 64\n", + " num_encoder_layers = 2" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n", + "/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n", + "/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/trainer/connectors/accelerator_connector.py:551: You passed `Trainer(accelerator='cpu', precision='16-mixed')` but AMP with fp16 is not supported on CPU. 
Using `precision='bf16-mixed'` instead.\n", + "Using bfloat16 Automatic Mixed Precision (AMP)\n", + "GPU available: False, used: False\n", + "TPU available: False, using: 0 TPU cores\n", + "IPU available: False, using: 0 IPUs\n", + "HPU available: False, using: 0 HPUs\n", + "/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:67: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n", + "val_file not set. Generating dataset instead\n", + "test_file not set. Generating dataset instead\n", + "\n", + " | Name | Type | Params\n", + "--------------------------------------------\n", + "0 | env | FJSPEnv | 0 \n", + "1 | policy | L2DPolicy | 81.2 K\n", + "2 | baseline | WarmupBaseline | 81.2 K\n", + "--------------------------------------------\n", + "162 K Trainable params\n", + "0 Non-trainable params\n", + "162 K Total params\n", + "0.649 Total estimated model params size (MB)\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "812cd22f33dd469cb501b27936cc1105", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Sanity Checking: | | 0/? [00:00 + + + + + + + + + + + + + + + + + + + + + + + + + Solving the Flexible Job-Shop Scheduling Problem (FJSP) - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/other/3-data-generator-distributions/3-data-generator-distributions.ipynb b/examples/other/3-data-generator-distributions/3-data-generator-distributions.ipynb new file mode 100644 index 00000000..82e1e221 --- /dev/null +++ b/examples/other/3-data-generator-distributions/3-data-generator-distributions.ipynb @@ -0,0 +1,372 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Generating data in RL4CO\n", + "\n", + "RL4CO allows for easily generating data from different distributions for CO problems\n", + "\n", + "\"Open\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Generating different distributions for TSP" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/home/botu/anaconda3/envs/rl4co/lib/python3.11/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", + " from .autonotebook import tqdm as notebook_tqdm\n" + ] + }, + { + "data": { + "text/plain": [ + "Text(0.5, 0.98, 'TSP with 100 locations, uniform distribution')" + ] + }, + "execution_count": 1, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "from rl4co.envs.routing import TSPEnv, TSPGenerator\n", + "from rl4co.envs.common.distribution_utils import Cluster, Mix_Distribution, Mix_Multi_Distributions, Gaussian_Mixture, Mixed\n", + "\n", + "# Instantiate the environment and generator\n", + "generator = TSPGenerator(num_loc=100)\n", + "env = TSPEnv(generator=generator)\n", + "\n", + "# Simple plot\n", + "fig, axs = plt.subplots(1, 3, figsize=(10, 3))\n", + "td = env.generator(3) # generate 3 instances\n", + "for i in range(3):\n", + " axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n", + " axs[i].set_xticks([]); axs[i].set_yticks([])\n", + "fig.suptitle(\"TSP with 100 locations, uniform distribution\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Generating data with different sizes" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Text(0.5, 0.98, 'TSP with 1000 locations, uniform distribution')" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAxoAAAEZCAYAAAAQS1PVAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8pXeV/AAAACXBIWXMAAA9hAAAPYQGoP6dpAAEAAElEQVR4nOydeXgUVdbG3+6kl6SzdgJ0A5IECEIIWxAEIzjGoCwK4jaAOoqOK8woow6K8onDuI8jzgRRUXFcAFeEAcxIBAUiiAIBQlCSkASBBMwesidd3x+d21RX13Jr6U4g9XueeUY63dXVVXXvPefcc95jYBiGgY6Ojo6Ojo6Ojo6OjoYYO/sEdHR0dHR0dHR0dHQuPHRHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0fnAufOO+9EfHw89XvDwsL8e0JdlPfeew8GgwHFxcWdfSqCxMfH48477+zs0+hUvv32WxgMBnz77bder3/wwQcYPHgwTCYToqKiOuXc1MI3Vg0GA5YsWeL37+a7rr/73e+QnJzs9+8GgOLiYhgMBrz33nsB+T4dHZ3AoDsaOjo8GAwGqv+RRfm3337DQw89hMGDByMkJAQ9e/bE2LFjsXDhQpw9e9Zz3DvvvNPr8xERERgxYgReeeUVNDc3B+S3NTQ0YMmSJT6Gmhbs2bMHDz74IEaPHg2TyQSDwSD6/nfeeQdDhgyB1WpFYmIi/v3vf/O+7+TJk7jlllsQFRWFiIgIzJgxA8eOHVN1zK7K999/jyVLlqC6urqzT+W84eeff8add96JAQMGYOXKlXjrrbc6+5Q6ldWrV2PZsmWdfRq8dOVz09HR0Z7gzj4BHZ2uyAcffOD17/fffx9btmzxeX3IkCGorKzEJZdcgtraWtx1110YPHgwKioqcPDgQaxYsQIPPPCA1y6BxWLB22+/DQCorq7G559/jkcffRQ//vgj1q5dq/lvWblyJVwul+ffDQ0NeOaZZwC4I5ZasnnzZrz99tsYPnw4+vfvj6NHjwq+980338T999+PG2+8EX/5y1+wY8cO/PnPf0ZDQwMWLlzoed/Zs2dx5ZVXoqamBosWLYLJZMKrr76KK664Ajk5OYiJiZF9zK7M999/j2eeeQZ33nmnT2T+l19+gdHYveNDEydORGNjI8xms+e1b7/9Fi6XC6+99hoGDhzYiWenPY2NjQgOlrdUr169Grm5uXj44YepP8N3Xf2B0LnFxcWhsbERJpPJr9+vo6MTWHRHQ0eHh9tuu83r37t378aWLVt8XgeAl19+GcePH0d2djYuu+wyr7/V1tb6LNzBwcFex3nwwQdx6aWX4uOPP8Y///lP9O7dW8NfgoAu3A888AAWLlyIkJAQzJ8/X9DRaGxsxJNPPolp06bhs88+AwDcc889cLlcWLp0Ke69915ER0cDAF5//XXk5+djz549GDNmDABgypQpSE5OxiuvvILnnntO9jHPVywWS2efQqdjNBphtVq9Xjtz5gwAaJoy1dDQgNDQUM2OpxTub9WapqYmmM1m3usaSAwGQ6d+v46Ojn/o3qExHR0NKCwsRFBQEMaNG+fzt4iICMnF02g0enYWhOoDqqurERQUhH/961+e18rLy2E0GhETEwOGYTyvP/DAA3A4HJ5/s/O+i4uL0aNHDwDAM88840nh4uaAnzx5Etdffz3CwsLQo0cPPProo2hvbxf9HQDQq1cvhISESL5v27ZtqKiowIMPPuj1+rx581BfX49NmzZ5Xvvss88wZswYj5MBAIMHD8ZVV12FTz75RNEx5fD6669j6NChsFgs6N27N+bNm8eb1vTDDz9g6tSpiI6Ohs1mw/Dhw/Haa695/n7w4EHceeed6N+/P6x
WKxwOB+666y5UVFR43rNkyRI89thjAICEhATP/SHPBV+NxrFjx3DzzTfDbrcjNDQU48aN8/mtJP/+k08+wbPPPou+ffvCarXiqquuQkFBgdd78/PzceONN8LhcMBqtaJv376YNWsWampqZF+7JUuW8KbP8dXDxMfH49prr8XOnTsxduxYWK1W9O/fH++//z7vbyGpf/Hx8Xj66acBAD169PB5nmnuH6lF2Lt3LyZOnIjQ0FAsWrTIUzfwj3/8A8uXL0f//v0RGhqKq6++Gr/++isYhsHSpUvRt29fhISEYMaMGaisrKS6Nl9++SWSk5NhtVqRnJyMdevW8b6P+3vq6urw8MMPIz4+HhaLBT179sSkSZOwb98+z2/ZtGkTSkpKPM8PGf/k2q1duxZPPfUU+vTpg9DQUNTW1grWvgDA3r17cdlllyEkJAQJCQl44403vP4uVN/EPabYuQnVaGzduhUTJkyAzWZDVFQUZsyYgSNHjni9hzxnBQUFnp3AyMhIzJ07Fw0NDcI3QUdHx+/oOxo6OiqJi4tDe3s7PvjgA9xxxx2KjlFYWAgAXmlAbKKiopCcnIzt27fjz3/+MwBg586dMBgMqKysRF5eHoYOHQoA2LFjByZMmMB7nB49enjSuWbOnIkbbrgBADB8+HDPe9rb23HNNdfg0ksvxT/+8Q9kZWXhlVdewYABA/DAAw8o+n1c9u/fDwC45JJLvF4fPXo0jEYj9u/fj9tuuw0ulwsHDx7EXXfd5XOMsWPH4uuvv0ZdXR3Cw8OpjymHJUuW4JlnnkF6ejoeeOAB/PLLL1ixYgV+/PFHZGdne3aLtmzZgmuvvRZOpxMPPfQQHA4Hjhw5go0bN+Khhx7yvOfYsWOYO3cuHA4HDh8+jLfeeguHDx/G7t27YTAYcMMNN+Do0aNYs2YNXn31VcTGxgKAxznkcvr0aVx22WVoaGjAn//8Z8TExOA///kPpk+fjs8++wwzZ870ev8LL7wAo9GIRx99FDU1NXjppZdw66234ocffgAAtLS04JprrkFzczP+9Kc/weFw4OTJk9i4cSOqq6sRGRkp6/rJpaCgADfddBPuvvtu3HHHHXj33Xdx5513YvTo0Z7nm8uyZcvw/vvvY926dVixYgXCwsI8zzPt/QOAiooKTJkyBbNmzcJtt92GXr16ef720UcfoaWlBX/6059QWVmJl156CbfccgvS0tLw7bffYuHChSgoKMC///1vPProo3j33XdFf+fXX3+NG2+8EUlJSXj++edRUVGBuXPnom/fvpLX6P7778dnn32G+fPnIykpCRUVFdi5cyeOHDmClJQUPPnkk6ipqcGJEyfw6quvAoCPwMPSpUthNpvx6KOPorm5WTRdqqqqClOnTsUtt9yC2bNn45NPPsEDDzwAs9nMOy7FoDk3NllZWZgyZQr69++PJUuWoLGxEf/+97+RmpqKffv2+RTO33LLLUhISMDzzz+Pffv24e2330bPnj3x4osvyjpPHR0dDWF0dHQkmTdvHiM0XMrKypgePXowAJjBgwcz999/P7N69Wqmurra57133HEHY7PZmN9++4357bffmIKCAua5555jDAYDM3z4cMlz6NWrl+fff/nLX5iJEycyPXv2ZFasWMEwDMNUVFQwBoOBee2117y+My4uzvPv3377jQHAPP3007znB4D529/+5vX6qFGjmNGjR4ueH9/5Cl2zefPmMUFBQbx/69GjBzNr1iyvc+WeD8MwzPLlyxkAzM8//yzrmEKsWrWKAcAUFRUxDMMwZ86cYcxmM3P11Vcz7e3tnvdlZGQwAJh3332XYRiGaWtrYxISEpi4uDimqqrK65gul8vz3w0NDT7fuWbNGgYAs337ds9rL7/8std5sImLi2PuuOMOz78ffvhhBgCzY8cOz2t1dXVMQkICEx8f7znvbdu2MQCYIUOGMM3NzZ73vvbaawwA5tChQwzDMMz+/fsZAMynn34qeq1oefrpp3mfAe6
1Jr+Ney3OnDnDWCwW5pFHHvG8Rn7Ltm3bfL7nt99+8/oszf1jGIa54oorGADMG2+84XWeRUVFDACmR48eXuP5iSeeYAAwI0aMYFpbWz2vz549mzGbzUxTU5PodRk5ciTjdDq9jvn1118zALzGKsMwPmM1MjKSmTdvnujxp02b5nMchjl37fr37+/zPPJdV3JdXnnlFc9rzc3NzMiRI5mePXsyLS0tDMPw30+hYwqdG7nWq1at8rxGvqeiosLz2oEDBxij0cj84Q9/8LxG7v9dd93ldcyZM2cyMTExPt+lo6MTOPTUKR0dlfTq1QsHDhzA/fffj6qqKrzxxhuYM2cOevbsiaVLl3qlNQFAfX09evTogR49emDgwIFYtGgRxo8fL5g6QZgwYQJOnz6NX375BYB752LixImYMGECduzYAcC9y8EwjOCOBi3333+/z3cLqTwpQazo1Gq1orGx0fM+gL82gaSksd9Lc0xasrKy0NLSgocfftirAPuee+5BRESEJz1p//79KCoqwsMPP+xTI8BOG2KnlDU1NaG8vNyTbkfSXuSyefNmjB07FpdffrnntbCwMNx7770oLi5GXl6e1/vnzp3rdY3Ic0LuLdmx+N///tcpKSdJSUlez26PHj1w8cUXK3r2aO8fwWKxYO7cubzHuvnmm712cy699FIA7loudqH2pZdeipaWFpw8eVLwvEpLS5GTk4M77rjD65iTJk1CUlKS5O+KiorCDz/8gFOnTkm+V4g77riDKsURcNeU3XfffZ5/m81m3HfffThz5gz27t2r+BykINfpzjvvhN1u97w+fPhwTJo0CZs3b/b5DN+8VVFRgdraWr+dp46Ojji6o6GjowFOpxMrVqxAaWkpfvnlF/zrX/9Cjx498H//93945513vN5rtVqxZcsWbNmyBdu3b8evv/6K7Oxs9O/fX/Q7iAG2Y8cO1NfXY//+/ZgwYQImTpzocTR27NjhkcxVitVq9UnViY6ORlVVleJjcgkJCUFLSwvv35qamjxGEPl/PunfpqYmr/fQHpOWkpISAMDFF1/s9brZbEb//v09fydpb1L9BiorK/HQQw956lh69OiBhIQEAFBU/0DOkXt+gFsNjf0bCP369fP6NymOJ/c2ISEBf/nLX/D2228jNjYW11xzDZYvX674/OTCPT9yjkqePdr7R+jTp4+go8o9L+IgXHTRRbyvi50v+d7ExESfv/HdSy4vvfQScnNzcdFFF2Hs2LFYsmSJbEeMPHc09O7dGzabzeu1QYMGARCuKdMCofsHuJ/v8vJy1NfXe70u9Xzr6OgEHt3R0NHREIPBgEGDBuFPf/oTtm/fDqPRiI8++sjrPUFBQUhPT0d6ejomTJhAlZcNuBf8hIQEbN++Hbt27QLDMBg/fjwmTJiAX3/9FSUlJdixYwcuu+wyVRKoQUFBij9Li9PpRHt7u0ctiNDS0oKKigqP8pbdbofFYkFpaanPMchr5L20x+wsbrnlFqxcuRL3338/vvjiC3z99dfIzMwEAC/5YX8idG/Zu26vvPIKDh48iEWLFqGxsRF//vOfMXToUJw4cUL29wn1URESFqA5P38h5ogKnVdnnO8tt9yCY8eO4d///jd69+6Nl19+GUOHDsVXX31FfQy5TrcUcu+zv+jM50dHR4cf3dHQ0fET/fv3R3R0NK+RrBSSJrVjxw6MHDkS4eHhGDFiBCIjI5GZmYl9+/Zh4sSJoseQaqIXCEaOHAkA+Omnn7xe/+mnn+ByuTx/NxqNGDZsmM/7ALfKU//+/REeHi7rmLTExcUBgCdVjdDS0oKioiLP3wcMGAAAyM3NFTxWVVUVvvnmGzz++ON45plnMHPmTEyaNIl3F0vO/YmLi/M5P8DdwI79G+QybNgwPPXUU9i+fTt27NiBkydP+igN0UAiylyVJ+5ugj+gvX+Bhnxvfn6+z9/47iUfTqcTDz74IL788ksUFRUhJiYGzz77rOfvWo7xU6dO+ewcENl
qUowt5z7TnpvQ/QPcz3dsbKzPTouOjk7XQ3c0dHRU8sMPP/gsxIC7S3ZFRQVVOgQtEyZMQHFxMT7++GNPKpXRaMRll12Gf/7zn2htbZWszyC9ATqz83RaWhrsdjtWrFjh9fqKFSsQGhqKadOmeV676aab8OOPP3o5EL/88gu2bt2Km2++WdExaUhPT4fZbMa//vUvr4joO++8g5qaGs/xUlJSkJCQgGXLlvlcU/I5EmnlRlb5OiQT44nm/kydOhV79uzBrl27PK/V19fjrbfeQnx8PFXOP5va2lq0tbV5vTZs2DAYjUZFneuJE7Z9+3av8/vPf/4j+1hyob1/gcbpdGLkyJH4z3/+45WStmXLFp+aGi7t7e0+aWw9e/ZE7969ve6PzWbTLN2tra0Nb775puffLS0tePPNN9GjRw+MHj0aAP99bm9v5+3QTntu7OvEHgu5ubn4+uuvMXXqVKU/SUdHJ4Do8rY6Oir54IMP8NFHH2HmzJkYPXo0zGYzjhw5gnfffRdWqxWLFi3S7LuIE/HLL794GtUB7q6+X331FSwWi1e/CT5CQkKQlJSEjz/+GIMGDYLdbkdycrJkjQENJSUlnu7pxDH4+9//DsAdobz99ts957B06VLMmzcPN998M6655hrs2LEDH374IZ599lmv4s8HH3wQK1euxLRp0/Doo4/CZDLhn//8J3r16oVHHnnE63fRHpOGHj164IknnsAzzzyDyZMnY/r06fjll1/w+uuvY8yYMR6pXKPRiBUrVuC6667DyJEjMXfuXDidTvz88884fPgw/ve//yEiIgITJ07ESy+9hNbWVvTp0wdff/01ioqKfL6XGG9PPvkkZs2aBZPJhOuuu443evv4449jzZo1mDJlCv785z/DbrfjP//5D4qKivD555/LTqHbunUr5s+fj5tvvhmDBg1CW1sbPvjgAwQFBeHGG2/0vI/Ixm7btk20u/zVV1+Nfv364e6778Zjjz2GoKAgvPvuu+jRoweOHz8u69zkQnv/OoPnn38e06ZNw+WXX4677roLlZWV+Pe//42hQ4fi7Nmzgp+rq6tD3759cdNNN2HEiBEICwtDVlYWfvzxR7zyyiue940ePRoff/wx/vKXv2DMmDEICwvDddddp+hce/fujRdffBHFxcUYNGgQPv74Y+Tk5OCtt97yyAMPHToU48aNwxNPPIHKykrY7XasXbvWx2mVe24vv/wypkyZgvHjx+Puu+/2yNtGRkb69P7R0dHponSS2pWOznmFmFTrwYMHmccee4xJSUlh7HY7ExwczDidTubmm29m9u3b5/VeIm+rhp49ezIAmNOnT3te27lzJwOAmTBhgs/7ufK2DMMw33//PTN69GjGbDZ7yWcKnZ+QTCkXImfJ978rrrjC5/1vvfUWc/HFFzNms5kZMGAA8+qrr3pJwhJ+/fVX5qabbmIiIiKYsLAw5tprr2Xy8/N5z4H2mFyEJDozMjKYwYMHMyaTienVqxfzwAMP+MjYMoz7HkyaNIkJDw9nbDYbM3z4cObf//635+8nTpxgZs6cyURFRTGRkZHMzTffzJw6dYpXanjp0qVMnz59GKPR6HVOXHlbhmGYwsJC5qabbmKioqIYq9XKjB07ltm4caPXe8h94crWciVFjx07xtx1113MgAEDGKvVytjtdubKK69ksrKyvD73yCOPMAaDgTly5Ij4RWUYZu/evcyll17KmM1mpl+/fsw///lPQXnbadOm+Xz+iiuu8Hp2aOVtCTT374orrmCGDh3q81lyfV5++WWv14WuJ/ldP/74o8gVcfP5558zQ4YMYSwWC5OUlMR88cUXvGOV/Xw0Nzczjz32GDNixAjPczZixAjm9ddf9/rM2bNnmTlz5jBRUVFekrlC583+G1fedujQocxPP/3EjB8/nrFarUxcXByTkZHh8/nCwkImPT2dsVgsTK9evZhFixYxW7Zs8Tmm0LnxydsyDMNkZWUxqampTEhICBMREcF
cd911TF5entd7hO6/0JjW0dEJHAaG0aukdHR0dHToGTt2LOLi4vDpp5929qno6Ojo6HRhdEdDR0dHR4ea2tpa9OjRAzk5OR4ZXR0dHR0dHT50R0NHR0dHR0dHR0dHR3N01SkdHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc3RHQ0dHR0dHR0dHR0dHc0JpnmTy+XCqVOnEB4eDoPB4O9z0tHREYFhGNTV1aF3794wGs+fWIE+j+jodA30OURHR0cttPMIlaNx6tQpXHTRRZqdnI6Ojnp+/fVX9O3bt7NPgxp9HtHR6Vroc4iOjo5apOYRKkcjPDzcc7CIiAhtzkxHR0cRtbW1uOiiizzj8nxBn0d0dLoG+hyio6OjFtp5hMrRIFuUERER+uDW0ekinG+pA/o8oqPTtdDnEB0dHbVIzSPnT3Kmjo6Ojo6Ojo6Ojs55g+5o6Ojo6Ojo6Ojo6OhoDlXqlI6Ojo7O+U+7i8GeokqcqWtCz3ArxibYEWQ8v9JndHR0dHTOH3RHw490hUW93cVg97EK7CqsAMBgfP9YjBsQoxsXfqAr3G8d/3I+3+PM3FI88988lNY0eV5zRlrx9HVJmJzs7MQz69rIueeBfD7O52fxfES/3urprGuo9ntb2lz4YFcxSiobEGcPxe3j42EOvjASggJxT3RHw090hUU9M7cUj39xCNUNrZ7XMrYVIirUhBduGKYbFxpCc7/1her8pjPGtJpnhv3Z4vJ6vJqV7/OespomPPDhPqy4LSXg88H5MB7k3PNAPh9832W3mTBzZB+kJzm65LU8n+kK6/n5TmddQ/6xYsb1I3tjEsVYeX5zHlbuKIKLOffas5uP4J4JCXhiapKic+oqc1+g7omBYRhG6k21tbWIjIxETU2NKqWHrnJxxdDiHDNzS/HAh/vAvbDkKIFY1DNzS3H/h/tE3/NGJxgXbM6H54EGoftNWJCeiMSeYVi66YgmA1qr8Rhozqfz5j6bVfXNmLd6v+A99sdYUrMI8H1WCAMAR6QVOxemBWz8Sf22rjA3yJnHAznnS803gPRzcj6NRTadcd7+vrf+ftbPt7GkFL7fuSWvTNVYeX5zHt7cXiT42fsmync2uorTqsU9oR2PfnM0+BZqrQwtf7H5YCmeWp+LyvoWz2tyz7HdxeDyF7cKLvCBWNTbXQxSX9iKslpxI6NXuBn//P0olJ9tDvgEpLWh0ZlbsmL3Wwylk6xuJPgXvmfTaIBXRItLVKgJe5+apNkzp2YRoDFE+VhzzziMHxAj91R5ERuPUr/t3okJ2HCgtFPXCpp53G4z46lpQ9AzwopHPslBWW2z4HvJnA9A8LrQzGG0843Uc3K+jEUugT5vf6/nao1O7jMzOi4ae0uqupTdFQibiO86OiIsaGpzeWV0CGGA71hpaXNh8OKvROd9owH4eekU6jSqrhCEBrS7J7Tj0S+pU7TRtM7ctuci5LmWyjzHPUWVor+b6TjmnqJKzRZ1vnOQcjIA4HRdC259+wfPvwM1AQkNNvI8yDU0MnNLsWTDYa+F3hFhwZLpQ/3+W6TutxgM3AP6mf/mYVKS47zczTmfoDHkhJ5NscUGAKobWpGxtQAPpSdqcp7P/DeP11GQembEPivFmbomzXZ0hYynSUkO0d8GgHceVrJWqPktNPN4RX0LFnxyQPJYZM5f+NlBZB05jerGc4YPuS4AqAxO2vlGn1u0wZ/rudQ6KPWsKwmIyDm+Vsi9hnLHreB1FHD8heCOlQ92FUteSxfjft/dE/pLHl/JvO6vAGqg7VTNHQ050TRycZdsOIxwq0kysu6vi7754Cn
R7TEG9BM2jYEPuBd1f6H02IGYgKQGGyDP0BBKESurbcb9H+6jTmkRerb4XgfORSXzT5+l+t1CBMLx1KGvoVFqpAPAyh2FeOB3A2QVCfI9X2oWATWOb3F5vU+US27wQcp4ejg9UdH50ThYWu6g+2N+/mzfCZ/XymqaBFNc+eY8Oeelzy3qob3eQu9rdzHYXViBXcfKARgwfkAMxvV33wulwQRAeUCE9vhaIuca8s3TUSEmzE2Nx/y0RE0DK2z4xkpJZQPVZ2nfRzuvv5ddhNhwC4rL67Fmz3Evh0mrYLDa51oumjkaRN3o8c8PybrpDNxGoVRkffPBUx1pTb7RILX5kU+tz5V8H82EnZlbiqUbD1N9b89wK9W5KXGsaI7Nhz8mIK5aw6Ce4ZoZGu0uBo9/cUj0c49/cUjytwhNbpcnxuKn4iov5zEq1AQAVNuxctiSV6YbAyJIOXxi40NoUS7tMPJen5OCqcOdqox0ADjb3I5xz2fhuZl0QgtCzs+UZAfV9/EFNZQsDAYANkuw6mJxmojdquxi2efHPgbfPOyPHXSlc6hcxNZKvjlPyXn5M6h1oUN7vfnexy/GUoCoUBPmXhavOJighXFN64RqEdylvYbF5fVYlpXv87uqG1vxalY+Vn1f7CNio3bO5sJeh+PsoVSfoX0f7ThcuumI4N/ImqW2JlDNc60ETRwNOYWHNHAXBK3SmvjYU1Tp5byIwX5Q5BaLEkjuGzGUhFCTuzk2wQ5HhJV6d4WNllEwPrUGNa4L99x2F1ZIGvzVDa3YXViB1MRY3r8LGaHVja3YeLCU93j+4N3sYoxNsHd6CmFXhG8shFmCwDBAfUu75zW+8UGzKM9fsw8ZGIVWmnCgBJX1rdRpD0KR/3cpjfGlGw8jxGT0+h4lCwMD4Gxzm+DfaIMPNBE7dtqQUtjzsJIddJrfomYO1RLunDc2wQ5npBVlNU3UhmagnKbzFTFjemyCHVGhJsF5X2g9FxNjqW5o5XXq+eAzTrU0rsWMX62KlqWeWXIN1+w5LvpMVzf4zq1aO9Hsdfj28fF4dvMRyRqN28fHUx1by3FIE0AVg2YeMRqAqnp56WdCqBYCJhO9ll4l+eHP/DcPG3Po0praFRoJch5U8qBk5pYi9YWtmL1yNx5am4PZK3dj/ho6JwMAnr4uiSrnkHtNiQOWmetrALMJMhqwZLoy2TWC2gFMnEPubVFvyp07N/d2tDRC79Nq21Ur1DzHFyLtLgavZR3F/Txj4Wxzu5eTAfCPD5pF2cUAD67ej+Lyes3OXexe0kT+adYP4tSwf+/YBDvsNrOicxaCbeyKQTtnRIWYVAUcyDzc7mKwZIO88Sv1W9pdDHYVVuC5TXmoa/ZPUEEJ5NoGGQ2emg4anBRBre5MZm4pLn/Rey2//MWtnjG1Ja9MNLjEwHc9dz+XdJkNUrCf9V2FFVifcxLZBXTrnpzjc1Frg7BhP7PccU/+PWtMP6qaCq69F2uzUJ8HDSQQ0e5iYA424p4JCaLvv2dCAnWqLDHutUhUIzWBSqGZR1wMMG/1fln3WghVjoY/DTWyIDzxpXhqDEC3CApB62XG2MwYm2D3RCq4kS4a+9BuM0tGOmlqGJ5cl4t1+05gV2GFoDEzOdmJN25L8aT6yEWN993S5sLKHcLOoVpibRbsKqzAUer6CP6hrfW2q1pKa5qw+1hFZ59Gl4A487SRP8A7QEHGhRyHec2e43BEqF8IpIxZmsi/HH+T/XuDjAb8fUayjLOlR+pa0s4Zl3fsLsq9zgZ4G84ZW/MV7zjw/Ra20flOdjHqm9t5Ptk5sK/t5GQnHk4fRPW5WWP6dctCcLZhLrRObj54ijeIQYzpzQdP4Zn/5ol+j80chHCLyev4bjEWdZFg9rPOdYYytik3MPmOz71WLW0uSRtEblBscrITK25LgSPSe45wRFqx4rYUxMfSpR8BnLlV40ebO3c/MTUJ901M8An8GA3ypW3FHC4lrPq+iOoeCI2Fycl
OLJ+TIhnU0iIAqip1KhCGWl0T/5Y+l686vC65OYTEy5T6HUs7Fm+pmgAxnpo2RHLLUa7aCVvNhbv9OznZiUlJDvz7m3y8vfMYzlIunFGhJrhcDNpdjKJFikatQQkGAJGhJjzy6QFZBoZQClhXzF2e99E+vHBj926mqFSeFfBNNZHjMJfVNmNB+iAsyzoKA7x337j/pkHo+crKK5N5JGH4Uh2nDnfivhMJojvBSpC6lu50I4ukkbW3pArL54zyKdaWgoHbcAbcz4gcJ5RLz3Arp6FhA5ZlHVUVNCMpIP+4aQTK65tRXtcsmm8t55jcXYl+MXSGGe37LiRoUn425pzCn9bu5/082VXk1oTyUd/Sjlvf+cHr+HLXFb65BnDvlND0gZAL9/h8zezYEv9clKZXE3uEjLlYmwUwAOVn3WNFDuQal5/VJrVH6PiA29l45OrBijqDc9PyJiU5sOK2FE1KDaobWqnqhsXGQrTNLGqraZVKr8rR6EqG2vu7SvD+rhLZOYRBRgMWTxuCB1fzTzqA23OdOtyJ7IJyVTn6lfUtksa73GtKVEu4eaRs2cTXvvEtsBKjuqHVZ/KUA60KgxzIZOz+jfT3IDrU5FH54NIVc5erG+ly/C9UtNolJeOoSmTB5CM+NpR3IXCwxtOidbmiCzGB7/lqdzFYl3NS1jnRwJ03npiahBF9o7Dwi0PUwRoxokJMkik4QUYDZo/tJ+kAlNY0Idpmwc6Fadh9rALzPtpHXbvxatZRrNlzHE1tynYbiOFeVd+suP+N0HEBt/FG6sHaXQze3llEXU8hZnBy14xKSgOL9n0XCjSSsfuPV0k64QxAXbsJnCvSzZg1UpbRfFNKH2QXVvDONZOSHLj8xa2aZ4yw5zK+a0UztwHK7L8go1t5KzO3FI9+dkC2NC+BzK3+WsPZKWvEUUjqHYk7UxOog69iRv7OhWme46oJSEjV2EiNheY2F9X3ZKkUq1HlaPjTUCMNkSpkGgpyJVozc0sFb7LdZsLfZyRj6vDeAIBdherSWpZuOoK3dxaJGu9yryl5iLgOELkOkaEmxRMV+1ry7ZgIDbiLorWPovWS0XyHzfM3DBM8T9rdrM6gu+rfa7VLSiLWSzeJpz7wfW78gBjR5z1tcC+Mez5L0BARE3yQIz4h97y5TB3eG81tLqpeD1LMTY2nehbjY21UxztT14QgowGpA2Pxwo3D8EBH4SzNXKWmQJsBMH2Ek0q4Q4xQcxAaWDVCDp6gDEmVeODDfYI7YlGhJrxwwzAAvn00+I7p+VwIXUqs1vU6XRma2qfHPz+I6kb1jrcQ89fmyHq/1RyEf9w0whPZZ881uzgOiBbclNIHL940AgBUOzFK7T810rzcuVWJOALt8dUUw0srHY7y2JXtLgbLvy2kdvDYCN0D2p4d/7h5BNX3rMs5iUXTxGuLxVDlaNDcZCUpB+SnLJ2RjKWb5G0x0SqLtLsYZGzNF42+uVwMjF6fV/8oSzlCo+OiJbcuaRByQJQc4y+fHIDVRNcxPTO3FG/vKFT8nXwsSB+ES+KjvSSQpRCbENhRilljLlKVguEPtFT+Ot/QYpfUGWmFy8Xg1S2/UM8d3AWMRN74MAcb8dxMfuNYSvBB611gKRU7R2SI6u8IswRjfhpdI8LYMLrizKOn65CdXw4XwyD3ZC2mJPfCrmMVqGo4ZwQaDADjhxTMj386oXomb2hpx4L0QYiPDRUNvJDcdK7BEmoOwtRkB567YbgnBYMmmONetwqwknKO1eL+ny/QqZ7JczLsNjOq6lv8Jhjy4e7j+HD3cc96xZ5zaB3qyUN7oWeEFe/vKpF872f7TiJtcE9E2yyKnRha5Uw+1OxYC82tWq3hNClrNIFsOqXD/ciAAVOHOxFkNOD6kb2p1QbJuYrdA9qeHWDc87uQ6iChsl46TUsMVY4GO2IjBM0Dxd0yc0RasXhaEqJtZkxNduAdmdrrUoaau5N0nuRArm5s89IsHt8/Fhnb1BnRYo4
Q8aDVOhla09DS7hW9A/gHnJrceiEMANb+eJw61/gP4+MwJdkp2lPBp2dGqAktbS6f39jZdKXUxEChxS5pY6s7b1ouUmpwbIQMSLvNjKUzkn0WIeLcqm3wyIfYeWsh03rLJX3pI1mUg3/5tkIs55lLwyzBGJsQjR+LqzRJ+eJDC4lqMi/tXJgmeW1IbnrG1nysyi5GdWMrGlra8dm+k8gurPAERPicW+86knq8m12EGkpjubspTmk9Xzo77JB5q4V3pLSCbz2lTXvLPHwaC9LpAgGA28i9g1KSlQuNcqZY89v3sosUOzjcHT61bRW46eY0KWs0gWx6pcN9eMOY4pkfaB0NmntAOxa2/nxa0smQe0w+VPfRIJXr89fsk10ATC5RxuxRiLZZOF1d8xTn7xGElEXkGsPkoRo3IEZUU5sWPkfIH0a6P+EOOEC406na7ymtaaKedImTwTfRCV3jmo77ee1wJ3bml3vlizsiLJg9th9a212qnUy5aCm3er6gJp3NZglCfXO77PFpt5mom+yxmZzshKuj4SdJh6qob8HSTXkwGuG1IC7ZcFi1Eg0Xo8E9d4qd97m6iaOKv4eMbxrKVequn21uw9aff1N1jEAgFMziNiglRaNb8sp4m5GJRUjVGlKLpw3pVqmXWqdyE6N2hVGb4l0x+AxYOWlva/YcR1SIiarWycUAq74vpjqu3WbySvUUS+cDhOsSpo9wYsOBUsXX0G4z4bvHrvTs/m0+WIoHVwsHuMUQE9ChSVkjY/+97CLemg05Bjm533LWPal7ANCPBTn1gmrGlyYN+6Qq1wnEECDwXbDM3FLe/Fly/LmXxaFvdChV8Qz3wijdtmMvKC/cMEywEY9cyAPZ1fo50MKVgvPnRHyiSrrA3ClQ5Gm3mfHM9KF4bvMR0SjF3pIq7HkyHXtLqnwmn/UKC3h7hZtxpk7Z1vuaPccxPy2xWxkLNOIMXKJCTLjzsnis/fG4bEnSCGswnpqahMgQs2yVNaG5im08AtBsvuDiYoBoCh15OdKRXORGxbuiwII/YRsVfA1K/77pCKYNc+CnkipZEVItAk9LNx2B0WjoNqISWuXrGwAsn3POgScRZ7nCBXLhOq9y0t60DmKQ1JzvHruSdz3kQ6wuQa0CXmV9K/aWVGH8gBhsPngK89fQrw9sYmxmL4eFL+NFTgdvvppbOXMgcVhiwy2eFDCh3bO7U+OR3uGUSK1TNE0S5dRAR4VKi4GIobphH0B/Y4gREBViwoL0Qdi5ME12F9//7CpBr3CraOMTrt46QU2hKfs3Ku1NwYVErAMhE+xPU/VMXZPf03zWHzgl+Z5rh7uLPLnXsrK+BX9a4/s6GzLJf7CrmHdSVWpATUjsobwYv7ZZcX+Y8xka45nN32cMRbg1WNFiW9vUhr98esCnUZcUNP1ulmw4jMc/Vy6HTQPNuFNj/E8f4RRNkeDqs2vZlEoMA9yKco4IbRt2yYVcW7EGpRsPlYk+m9yAjVaBp1IFzdXOZ2gaw9Gs3XddHu8p1GUfmwgX+BsypslY6iyevi4J5mAjxg+IwYyRfTB+QIzoXODvYOmZuiZk5pbiwdX7FcvnV9S3YG9Jleh7ZEmi84wxufdt6aYjeGhtDl7NykdUqAmRnGfUGWnFG7elYPF1Q0XvARuasTBjZG/QUt3Qii0qZNk1cTTkLmQ1ja1YlnXU58Rpc9vmr92P6SPcDorQReTLX1NjDJfXNWPzQbfHrkWOL+COWLe7GL8b6Xelxvs0ymGj1nHqGW71WyTTAHcUgkap5/N9J1VPdGTQcw3PsQl2aqUXwoL0QQi1qNs07I51GnJ/858+zlHdrwCQ1/WWptiurLZZcfTTQtltlmbcqTH+39xexHs9hDoqb8krw+JpQwKyO/v8DcOQ/fhV+OiPl8oem1pgNLjFO7RqUEqeey0DTwy0abh1viDWGO6N21Lw3PXSjsLmQ2WijXBfnzNKssmZGsiYltsFXiuMBuBfs0chMsQs2vC
QTSCCpbFhFskGijRIrS9y5ktyVbhjbNaYixSdW01DK2oaWrEgfRBemzUSa+4Z5xOQp0WqSaKclFh2x3QlaJI6JXfLkn1z2NvFcgyMDQdKeZs+RXdI0vLdGDXG8NJNR2A0aFsQRiLW/k43mJTkwJPTks41ygmzAIw7n5pE7l/KPOKz7S8FV/lAaquuV4QFgEF2YeoMSkUGrYvoiRQdEQOYm5pAnevuiLBgftpAvJetzgCJlRndvxCQW5siV5lIaGtaaF7iQ010hwYpfXM5yi80MqtiPP7FIaq0HnZPH3/zcPogzxzPlsgNpDntYtzplnmnajRpUErWAa2DC91NwY7bGI6bfy+F1PWaOrw3MmBQXCMgBN+Ydjs2KZi3OnDPtosBnt7g3axQStbV3wGxqFATwGiTni1lb8mdL9k1G85Iq+xGpNxjyRGakEJsLLS7GGq7Xa0SpiY7Gkpbq5fWNCFj6zlZMrm5bdE2CxZPS/Iqmqqsb8XSTUeQmVvqs7U/Oi4ajgjlRr0/gkJn6pr8mm5gt5lQVut+QMYm2DFjZB+kDoxFamKsZzt0S14Z3uLZ9heDu3NEcuuFDsEAWDJ9KJZMp4/QRIWYZHve/uDxLw6h3cVgftpAaiNqyfShCDIacPv4eHXRr+5TngFAfcdnGqQec/a8xJcelJlbKkuKUA4GgPp5Ye/a8p0nG6HoFg3VDa3I2Frg+R6plDGtdnzF4NadkN8X6FSTM3VNqhuUklTf0XHR2FVY4Rdlsu62M0oUvLgpP7TXgV0/yTeupg53OwBa7WyIZWJMHe7EnZfFafNFlHAzCKR2e/0dLJ17WYJqoQmhlHo+lMyXSzcdwYM8qdty4aZSAtLzuxhCY0HJjpnSeUSTHQ1AWO5Rilez8nGxIxyTO9SC5EgxZuWV4d3sYtHIGrdb9iXx0dh40H85q38YH4cYm4U68t0z3Ko64ihGZX0rFnycA4A/KqE0t5JPau5vG4W3NYmBPjnZiQXpiVTGpMHgPit3bxGTXxqd0UAMrYfSEyXFAEgDLnJdzMFGXDWkJ7bknVH03eXdqLMveRa7Aq9m5ePAiWrk/FrjtVPmiLBSywFGh5pQJcPoJmOfZofmoasSPakNxeUNWLPnuNe8yTfWz8msFshWoVr1fRHmpw0MSIoEDXyGDTt69/XhUqz58Vc0tdJ1vlU67/YMtyLOrrzYnpiU00c4ccXL2/x2bbtbkb4QtNehZ7hVsmEbrQgOgdzreycm+CgwSSkJXT3UiVXfS/fJ8BdSsq5aN85jE2oOwvy0gditomEyjSQsFzKfLPzsID7bd0Lxdyslu6C8Q9aabn5XArHbF607RGVfKZ1HNHM0AO+JPrvgN2o5UPLwbskrw9lm+oV5XQ5/Tr5QZK2spsmvTgbgllcdPyAGiT1tmL9GuGiJu00q5KiRSNeO/HLUqFS74JNSlGM42G0mzBzZx0f5IDO3VFJZp6ah1fPd89MSsWbPr5IOZVVDG6/D2BkQQ2tyshNv8NynqFAT5l6WgAd+NwB7S6qwPudkh1RzC7IUOhlA9zIQuooRS+CTWZWT9nfH+Dis+r6Yuu+BI9KKa4b2wnsUBsV73xdj2TfCzrqYbOqq7+Wn81U3tHq23zsT9rwppNdf09iC974vkTR4yLEWTxuiKN2BREdHx0Xj2c1HFO14OzqkP9/aXuS31Jju1k9DDBqDOCrEhB+OVeC1b8TliKXSG7mwnYm/Th7i8+wCwK7CCl4xEjWy31yUtAoApNNnZo1RJ6MtBKlXc1HmyE4b5sC+49WyHDkhtuSV4fNOcDIAIGNbgeDfxOZ3Mi+W1brbAthtZjgiQwQbgEaGmPHklCFYsjFPsHeRmiaNgMaOBnBum2Zsgh2f7ztJNTDcqQoFWJZ1lHqyDbMEy45w+zvH0WgAqjq298TyOIW8a24+XXF5PdbsOS7pHJFo3LXDndhx9DfUCDwsfFEJWsNh/pUDsWDSIN4H9fEvpJV1uN+9ZHoSb2dlPjr
bySDnQCZYobzHLXllPlFJpXU9agf2+UhnG7Fas+ybAslUuwXpg9DPHoLK+hacqGqkjpxJFZkLRSB3H6tQPJ7Is97ZkM69fEGZxdOSsHST9A4tew6enOzENclOvLrlqOjizmXxtHNpo/dMSJCU8CRj+h83jfDUx42Oi8YVL2/z29pkgLwobndAqpN0dWOroBPPHlf/uGkE1ffNv3IgUgfGehl63OaMYrsnZK1R0rwYcLcEuHqo06tPGZ8sNy3ceVptvxcpqhpa8afVe/HdUbr+OulJDvxrdgpvEEIOXbntgJgsttC9IPNjtM3sZV9KqTUq2Q3iormjQSDpQLQa8quy5UV0Lh9oR+Zh5ZFif+BigHmr92NFh3b51OFOvMHT7CeyI/rNV3tAJqDM3FLeBk98RIaa8PtL+lJFxbhRCVrDIXVgLO9DtruQ3nBhf/e5LbvcLtcJXQj2BMu3UPAVoyqJHGkxsM9HuoIRqzWkGSS3mRYxIgD4bZHmi0DSFMMKQRZsf6VISGHvEPoAIFiMTluga7ME4x83D/dEA4l8qRxHI5pVG/jEVPe9fGtHEW/qG3tMpybGel6Xag6mBq3SKy4UtDKIybiCQVoAxRFp9QrQ8e3CbckrkxRXYK+xBoM8AYyrhzp9diDuPVHtI/5Cu9PBnqcD1Wh4c+5p6vfuK6mE0eA+z2uH91a8hna1HXYu3Pld6l6Uypgf2SjdDWLjN0cDIPn4g6i20+TKQO4prlZ4Vufg5uWSxzEy1ISahlbFg4ftZZ7Li87HquxiVDe2orqhFa9mHcXaH4973UAyCZ2qbsSS/+ZSf7812Ij1OaWyzper1S01WQpF1ncdK5fxrd7fPTnZicaWdiz45IDsY4jx0FWJeHvnMdnN26SIDfNWgGJvUS7deFjx88J9DrUY2OcjYxPssNvM543jSQOJPIWYg7B8ToqX0puQgaE1Z+qaPM/q0dO1sj/PngP8WU/GZUxcFH4+fdaznV9Z34q/bcxDU5tLNGWWBlJnwzb8Ym0WWTWC3MjuE1OT8MjVg7Hoi0PYfKgUDa3izWn5jiGHSGsQaprOfYfNHIShvSNwSbwdqQNjMa4/neb+hYYcY14N5WebBccCX7CIz9FxRFgkn2efQF7HH0LNQWhoEV7jhNbuzNxS3qCklPPCPV5Xjfh/sPs4Pth9HIC3sy2UaslHu4tBdoF826YzIPO7lvfCbjNh8bVD4YhQthvExW+OBrmp/WJCRYsiDQAiOdE+Gqo0MEa4kQEHK8qodCHliyJuySvj3Z0geXbL54xC/pmzHkdELkoalXG1umknS1/kP4DsiIic7qdSkInw/isG4P1dxaiHto7GI5/kYMn0oZic7ERmbimWbMiTLdXLB7nmcjp/XogEGQ34+4xkzWUjOxsyJxiNBswY2QeAskXaZglS5DwXlzfg8he3qorOzRrTDxsPnkLPcCsmJTkUCX/I5ceSap/XtOyA/MinBxBmzsXpunNrSWQI/ZLItwNnDjbiH7eMwIs3DRc0atgGzw7KdBA+nr9hBKJtZmTllWFdzklU1rdiT3EV9hRXYd3+k90yWMFvzFvR1NauuUHcM9yK8QNieMcCn1gK766FgueZBC8iQ0y4Z0ICXvvGdxdOaO2mUY3jg+94XT3iD5yzsfgK8IV2/DYfPIWn1ud2mviMXHqGWzW/F5X1rXBEWDWTxPaLo0G7RUke3rmp8bIlLbWYNMg24d2p8Ugb0surt8TyOSkdD5syh4Ytjyc1sOet2S+7F4BShLS6aSZLPsYPiJGVbhAVaoLLxaDdxSDIaNA8FWP6CCdSX9wqS+2HltO1zZ5JSyofWy4GAJtzy7BoWvdKl+IydbgT953Q/vp2BdjRayULw52XxWM5pcAG0GGMhJpk1b5xiQoJBgwGr11pskDvXJjmMZiPltVh+bf059YVqG9u93HcSOG+WHoKTf0UN7WSoGU++5NfHsKz1ycLKi8KFYteqAgb89oaw3xCLkK9CgD/RP5
J8GJsQgzeuC2Cau1udzF4d+cxqmePq/LId7zzoaaOXHO+9YT0yXp9TgqmDnf/ruc35503aw/7Odx48JTmx9fy/mruaMjJ2XOwip3+s6tYsQfJHRRhlmBqCUoDgC/2n8SmQ6Ve0QVnpBUzRiiXlCPRLhqDIlBOBoFvh0JqshRiXP8YWapQ1Q2tuPWdH7yiCWRHRQ1GA3D35Qmq1VvE8lTJy29p0AWY79jdrbGWEE9MTUKIKQjLeCJ1chnqCMfhsjoNzko97Ai4EuPnsv6x+GLfSVmNUdvaGcXj4drhTl4hCj4jdldhxXnnaIgRYjKioYVfVYiBsvoprfPZqxpa8eSX/Cm2UnKkFxqBTuPh3n8hxxLwb+R/3kf78MKNw7ycfr61OzO3FI9/fog6Y2L22H4wdOQ4jO8fi3EDfNPwLpSaunmr9+HO4jhEhpjPGycD8J6H/HEvtDymJg37CHIGu91mxuJpbkMzyGjAzI6UAiXMGNEHa+4Z52nZvnTGUOrPMnBP2NwtzLKaJlW61SS1K1BeP80y4uxoPS8U4RJq7CJGkNGAF24YJvNsvRsAkR2VaBUdhV0M8Pk+frljuceRwp+O4fkQJQoECT3CNDlOV3EyokNNnghoZm4plm48TP1Z0mhq3IAY2Y1RaQMubJyRVrw+JwV7S6p4/04e/2f+m+dpHEV2JpUwc2RvRZ/zJw0tLlw7rBfvdbaZg2Qfz1+GsNjOLTt4caETyDQedld6NkJN1fw5p1c3umXjt+SVCa7dRH5eTlr28m2FyNhWgIxthXj0swPYklfm8x5/NhoOJAyAVd+XiMqFd2XaXQxcLgZRIcrtJzZyGhvSoqmjIWewV9W34MHV+/C3/x7GrsIKpA3upfh71x846el6PX5AjCZ5/2RBMBqUNWdeusm9CAfK66dZwP5x0wi/bKOT3hJyuq5zjZXJyU7MGdtP1XlcCEXEF0qUSC1aXIdABHFjbGZcObiH5PvI806i2nJ3b0nkSqhjrSPCguuG+6rY0XD7uH5YPG0IXv29O1Czc2Eaom1m0bmca8SSWi8ll7yrFZMSNh46zXtu9S3tuF+kSzIfnZnP3h2CF4H8jf3svvZFZm4pLn9xK2av3I2H1uZg9srduPzFrcjMLQ3InM52+tm0tLnwiEqxFZJi9FrWUa/vIGO+q47fCx0DgCe+OITUF77Bre/8oKi+VwitFS81dTTkpAOQh/Pd7GLMXrkbD67ehzBLsKKFqrK+1Stqo6Wn7WKULYRkEe5KXn95vX+6TJOmLwunDMbt4+idBa6xYugKF6mT8EcU4XxGi3GjRFqYlqgQEz7646XY9cRVOPBrjeT7qxtasftYheyoNt8u5ORkJ3YuTPPaxd3+1zT8xFM8TcPUYb1x94T+mDnqXDSU1nBjv484QXJ3Nr7MkZdfbIC71ktOYMMfPP75IWQXlPMaeFw609jvDsELpb/R0PG/+yYmwGamM4fKz3qvoyR4wHUkya59VX0zHBHeioVaIrRzlZlbikufy0K9iDKVHF7NykfqC27niezeNLe5cFOK8mwUtSjZXbxQEMrGUYPR4O5cr3VAWrMaDbnpAFzUdr3m9jjQIu+fjZJummfqmmT3E/EnWiw4XIm4qvoWLN2krriR3Lvx/WOpu8mfzyhT9+peqB3DU5J74SsZ2uu0kLvzwo3DkDowFrsKK6h30r4vLKcaJxHWYNw0ui8miSiQcXPClfRjECtqpp0ruO8jtV7vZRdh6aYjss6HBs/1v2GYV01ZeV2zX75PjOrGVtz69g9U/Sr8YexLyZsC3Sd4QSPTHhVqgiXY6GWYsZUm36NMlWZHjqXEXgwAFn2ZS/071MC2gfzV36Kslr+3R2dgAHDvxAF+6UZ+IRAZEozrhvfGhz8cp/4MwwBvbS/CqH7RmjobmjgagWraIgbfgqelBCPJy78rNR61ja34bN9JWefUmQNTqy7T/uoA+r+O7eUxCfYuMYEJQRwEmgVeiAXpiVj746+y1b2
6K5EKn4eKs/5Jo4vuaBpH7pWcSHXO8Wqq9z0zfShmpvSVdV5yI+bkWZ6S7PDsvLIdGrX9dfyh+gZ4C4iwAx6dGdcspVB4Gh0XrXmPGHOwUXIeWjxtSLcIXtDItD/PcU7ZPTbkBAINrH1WqZQ4Bjx9MFioWUu4EHsjEIXxgVyjb0rpi6wjp3kbnk5KcmDtj8c7pYFoV6emsQ1Tkp3YeKhUVlNlf4hIqHY0Ortpi9iCx1ZS2pJXhi9zTime6MkN+Cq3DN89diV2FpQLblmxz6mznTCtouX+/B2bc09jc+5pOCOt+P0lff0iHavFeUeGmjyF70p2qJyRVsxPS8T8tESvxW50XDT2llRhfc5JarWvCx21z9ueYv5CZrVU1rdi6aYjMHbUS8iJVGdTduVWEv2W+xki3/pudjHezS72icor7a/jr2AEu8fMlrwyn74gnT1cGAgvzuSaaOlk3JTShyrYFW3zX8pOV0NMpn3xtCREhpg9vWCmJDuxt6QKGw6ckp2Jwd5JVJsSp0W6MNcGOh/6W9BAfteLNw0HAEFVLa2zV/yFvxuc8nGmrgmtbfzqeUL4QwFTtaPRmQ81jRFNUgzGD4jBk9OSkLE1X3bPDgK5AXtLqjBjZG9Rg5hsx3Z250yaaLlUx8xAOZNlNU14a3sR7pmQgDV7SnC2Wd4AEYIsNEs35amKfBgNBjS2tMMRGYLX56TgbxsPezmboWZhSUwDvJ9TMoAzc0txxcvbqBoJdRc6O3ghBVvedVKSQ5acNg15pbVeHcS5cxvfeKXpR2O3mTBjRG+s+r7EJw2U+5v2FFWiuc2Fh9MTsWbPcd50E+7z6a9gBLvHjFCHZ3/W49DCtzj745o4I61IHRhL5Wh0h0JwNnwy7VX1zT7pvUpSoQF3TcC4/ufur9qUOJoGnAYAf5wQj7d3FAOQdvovlHvOwN0Xi7tmciEOphz53s6AgXsOHtYnEt8dpes6HhVqQk3HboSSOaT8bIviGp0u1UejMx9qu82MZ2cmUxlk7S4GuwsrsCq7WPX3ZuWV4V2R45BiGiV502KEmoNgNBiojZrF04bgztQE0eg4XwSSa+gGypkkA2mlRn0q/jA+DlOSnR5jzWiEqshHZX0LFnQoeDgjrfi/a5MQbbN4GXz/yy3zafQo5DgINpjqhs222HT1iBx7e9nlYjR1MgDg2c3nag24z47YeF08bQgeXL3f53hk9P99xjAs3ZTH+53kNz3+xSGfjveOCCsWpA9CfGyoqPPjL+eQBHi+zy/v0g4o4L0ean1N2EZlZIiZ6jPdoRCcC7t+KTO3FPNW79fMMR0dF+1pNgtIpxhqwfKOhnKj4+yCjfkmJTmwq7DCU690oUBbLzA52Ylwqwm3vv1DgM5MGVX1rdROBgA8d/0w5J85i1XZRbKcKLIbVN2gfBdVy7lDtaNBezJa56cCwKIpg306X/JF5rXezl+XI9yvwQBgw4FS/HXyEM2dsMYOz5S20DU23CLpZNAYuudrhGRKstMrCkIiH0s2HFat1FBW04R5q/djxW0pmMHqATN1uBPXdOS9l9U0orK+BfYwCyJDzF4LFE0RYXdptsXlfHjeiPH71Hr/FnqyxyIAwfFKCjT5IMZIZIi0ZK07l9d7QTtd24RlWUex4raUTmlKRrj/o72aKej4C/Z6qPaaRIWYvIwL9k5Su4tRVUPTHfCH87s9vxyDF3+FeyYk4ImpSaIphmrhBhmEmuoKpRJ2hV0+LWCvg2LZF+P6x/jd6VML7XmRBsRKhHbYAYnck9KKiELfX6WhSqlqR4O2aPC7x67E3pIqZOWV4R0NdhUA4NmvfobNGozJyU7BSN/0EU7V3aIJBrgdpgoRh4md36Z1NIkYoHuK6PLPY0Xyc+UYuudjVExIbYVM1hlbC1SpVYg5A0FGA2oaW/DS/34R3CmiKSLsrp3Cz6fnTW4/DLmQ52zJhsMADILjFRAu0CSNUdfnSKfaiJ2DmOMbCOewqzsZBoM74k1Qe02
Wz0mBsUNqmGtUKa2h6U74y/l1MfCkTT8xNUm4NiTCgqY2F2oaWmXZH/OvHIDUgT14dw65anNCwcILxclgr4M1jS2i2Rf+dPoCzd2Xx+PtHcrsVnZAItxiUqTk6WLgDqR21CKqRXUfDXJzAd/GduwJzxxsxPgBMR5lIS2orG/BAx/uw/Ob83h1rEtrmvCmQidDaHqeQdnF9kxdk196aDAAKupbYLeZJI/7yKcHBJtKyTF0u1IvEFpmjeknWrfzUHoi3lCg+c9GTL9cTFc9M7dUUZ+C7oKaLtNyYGvoc7/PEqxpiyFVMADKaptl9SkiGKBN81CpLtPnk3OohDCLdEyOYeDppt7uYlSlsMTYzBjXUVvI1+0ZOLdD69O8kaf3SnfE33PnW9uLsOOX39DS5kJkiBl/nTzY3fjylhFYc884ZD9+lUc8RM7amdgrnPd+A97dx7MLyrFkw2FR++ZC8TNJbZbYmgoIj4nziYevSsTGg2WK7Nb5Vw7EzoVpnrE/bkCMKntbqBGkXDSRtxVTe+DmF2tdGMfAndOv1Y4FKRxe9OUhnwhhZKhJVm6sPz3smSP74N3sYtHjnq4VzvWXY+jK/R3RoSYwDIPqRm1z1+XQ2t7ularEB3cruri8Acs6djnk3CvavGx2ZPgfN4+gOvaFbsDxEajeM+z56a+Th3ieg1ibBY98ekDSsLeHmlDZRaWYCXwBAzWpBVvyynh32AKRq95Z3JUaDwCidXmEstomvJaVLzunmsuMkb2pdiOE0mm6804Gwd9zJwPg9lV7fNKUSJQ9qCMaLFdmP/90HXYVVvjcRyUp4C4GeHLqYCzfVtilC6Wl+DLnlOhu7pPrcpE2uBfMwUafMREbZsEjn+Ro2tjOn7S5GMU7cakDY32yK164YZiitVTLrArNwnZ83WrZnpU/iwW12CZk774YjfxpCDUNrViWdRRRocK7CdwOz2Si6UXZxTbERHdLSmsa8XB6InqGCzs+5LKwvVISEck/fZbqe8hkLRQpcEZa8fqcUZ77viA9EVUNrZ3qZABAxrZCXP7iVsEdHQLZir52eG+MTbDjztR4hFnl+d9y8rLJ4AUD0V2i7t4pfHKyE2/clqLZ7idh1EVRvPMTeQ5mjOwDo9FAtXvwh/Hx581OHztgAMiLsLJ5N7uYd0xpceyuyqQkByYlOajeu/jLQ3g166hqo47m+8hcvvGgu7P6tcN7C0bCuyOB2okXUnDbfPCUp3v2P24agQ/uGouoEOn5LGNbIWav3O21fgntktNQ09jaZZ2MJ6cOEb0m7nR1k2R9b0V9Cy59LguvZR3F+pyTnsDKjJF9kDowFkumDz2P5iX5Bq2YvUDWUm53+sgQOjtHi51BzTqDA775g2y6upIMW73h8he38r6HRKQNrP+mzY1tbKUzvF+5eQT+tvGIpKFDek9ESxhiUjmOUlSxBrhU9KzdxQheu86AT72JW0w2Oi4aK74twKrsYt7JWGoHx2Dwvka0g7K8vlnPsZaAXU/zbnYRajRYLPf/Wo37OtI4haC9hwk9bOdNTnBsmAXZBeXIPVmLycm9sPtYpVdTPZJPLtXYSaxWQyxXffbYfoiPtWHH0d+oZFml8Ie4CB/sxdsZaZWcO89SyJXK+U4haNQCuzuB2hnlQuaB+Wv2ezkhdpsZKXFR2Przb1TzBWkEuXzOKCzddETF/NI11xBnpBV3XZ6Ai+whHjVIvnVw5sg+VHW9VQ2tXq0L2OOBzE1Prz+M011UlYtk1IzvHyu7roKBuL3AZ7u5XAxufUdapUuLnUFNHQ0xumqueaQ1GK/fNhrj+rsjQVKStAzcD/RNKX18mvbx6cvTposZcE7GLv9MPXWhMm0H3i15ZViVXSx7svrbxsOIDDWh/Ow5Xf/zxZnkFrFuySvzWZxJ4zKxY4h+BwM8uHof3jCmyGrg1jPcivEDYqhSDrszpJ7mkrhoqkmRBik1L7n38N6JCe70zS7oaRjg1mJ/8KO9qOHsMlpNRsw
ecxGuHuqWgH4p84hks0yp7XSxYES7i8Hzm39W/ZucLHER714JR3iLcdV0MWYv3uzGYFyDSEsJW6kAgy6LTc+kJAd1c0Ot4e50VNa3YOvPv7n/QfnQMAD++vlBxQ6sM9I9R2VsK1D0eTaRIcE+c4gaFk9zP+eTkhx4OD3RJ9jHVstTIiDENx5a2rXpzaU17ODiuAExVEENNlOSe6G5zcWbckcgGwGeYOvZ5o7dIuH50RFh0SSrImCOBu3iraT5lRopN4PRgLqmVtnNbj7bd1JSX15OuhgDINrmToOKjw2V+zMkEcpxlKKsttlLm1osatYVnUliGGVszceyrHyfa6CVcUiMV1oVtrEJdrS7GHcR4TUXe2RwHRF6jjUf5RpK7Unlncq5h5m5pZqp2vkDEhjho6nVhVXfl8AcbMTYBDs2HBBPM2Tzxnduw4VGGYek+GQX/KaooJ3L4mlDPOIibK7pUHPzROwYRrGuvtEA/Ov3oxAZYsb6nJPoGW7FpCQHb2BASolQzndmzB4l2VxVl8WmIzO31KcnTFdBzrqjZpds+ggnxvWPgSPCqvo6GBW0MR/RNxK/VjXy7j4u3ZSHAyeqsOFAqdd4igoxYW5qAuanDUSQ0YBnBXr/SMHtd8TXT6WrwA0uyt2J+yr3tKflgZiNJrfOp6nNhS15ZaoDFwFzNOTI4K74tgDvZhdTp0pYTUFoUCh9WNPQ6uX1Fpc3UH9WSl9eboSfGOpaFrEZAIRbgzVLMxCLmsWGCcvpSuHv1BMluzlyYBuvNClRfLsr7CJCHW+0LuwUc4pppUMBdOkGcrRj6s3tRQgxBcuaq747Wo7vjpZLputo3cMIAKIFZLu5Do5SOV8AmJLswLNfHeExgOJ9dlPKaho9jTzV4GKEfxtBl8WmIzO3NOApU10R0tPrkvhobDxIH0jggzZ7gs1frxmMmsYW3kaiRBWUS02juxb2YkcY0gb3wjs7xXdZxWD3O+qK8/T8KwcidWCsT8BmcrITC9ITvVLBaBGy0ZSIMXHtY6UETMNRjgzu/LREzL9yAPWxiZOhwOH2KpjefLDUozok97N8EmByI/zEmNKyiI0BUNuk3XanWIH5B7uKVR33iSmDYTMHqT5HPgJRDEfut5TsJAAqqT6dc2hd2CnluNBIh+4+Jp5myYVGIlVL5Cwob26Xr7UOiD+zagpYxaCdV9U4p5sOlfmcd3WjOwd87HNZqGls8cjOOiJDFH8Pl69yS7GrsEJQUpL2t2fllWl2Tucb7S4Gj39xqLNPo0vg3s0vUO1kKCEq1IQxCXYs3XRE1ufYNsZ/vi/WROzH3/2OlJLYK0xQwGF+WiIclCJCbIRsNCVBMSkbl5aArnw0MrhqImAhJiMaWuTn4KnxesUiSHIWOnYBoNIitkAVSKotMBeirqlV86ZcBrhlidXkadPCvt9CueoAcPmLW/XUB5loJRVtANArwgIXw3hSYoRS1cTqDTJzS/H453TGzBBHOE5UN6BOQ4dfaxpbleUuCz2zLW0uLFp3yC9RRPY4E+sU7C/J3WpOlE/L73l/Vwne31UiuFNEu6asyzmJRdO65+7o7mMVAZnvzxdWZdPvCIRZgjQRNACAF24Yhr0lVYpsA2Jj/FjM37enK0DWIZs5SLHdIjaeg4wGLJmuTMyAa5eqqZ/VYpc04F2pxGRw1UbAGlpcuHa406f5Fm2UXI2RzhdpkhOFnZrsNmiI1zgpyUEt7Umkzf52XRLsNm3lQMX4WqCJjlJOVDVqchwu6YN7+uW4bPiUYtiSqSRqISf1QccbKYnlBemJksdg4M47vfXtH/DQ2hwfGUkufPeQzFO0u2RHyupQ19S1u1qrgfvMZuaWYtzz3/glisgeZ5m5pbj8xa2YvXI37730p+Qug3NRPn98j9BO0dgEO+w26V5OlfWt3XYO2VVYIfszUaEmvD5HXQNXQlfz7eTs5mvhZESFBOONDidcbd1mqAYZDmEW/2RJOCKtuG9igmInQ0xdjmS
JNLe5MDW5l+JzJNdfi/pZNccI7F5+B3wyuFr12dhZUI49i9I9ObSxYRbMX71P80g5Fz7PlCYKS15/J7sY72QXeyJZkSFmWVGZ6SOc+NPaHMXXT0kk473vta17+DLnlIZHc2M1GQOiODJrTD+q922hTGnoioX1XQEpieWLHeGCO2xRHTtb3HElR63Hn/2AzneyC35DRV0z5q/1zcfWClLDRKu8pKRhGi3sKJ/Q95C6jsSeYXhi3SFq1R6hnaIgowHXj+xN1Tyw+84h8kfn8tkpSE2MhdEIXmUxMZyRVvzjphEor2/uUEBrwbzV8o7hDwwAIjRWiqLBagry9IFRW1s3xBmODQfU9Uq7ZqgD2QXlOF3brMn9mH/lAKQO7IHRcdGYoELOf9aYfrw7jlrWtZHrr0WNo5pjdIqjwYdW0qjVDa3YW1LlcWR2FVZQFTGFW4MURx3FPFOphU5ooZzb0Y1WiqgQE56bOQxLN6kzfs42t8NuM+P6kb1x1eBeeOTTAzhdK54K0BXlPLkoTQmRy6tZR/GfXUWYObIP0jvUp7iTSGZuKZWBAHTPjuBsxFJixPr1TE52Im1wL3ywqxjFFfUAgJEXRcMRYcUjnx4A4DsXyElZ6woSztcNd+DH4uoup6YjV/tdLqTGRa7yEtc5zT9dp9m5ftWx4zA2wS7pBF+T7ETG1gK8tb2QKvAllLIQSdH0Dei+c4icPgREhGZcx/WV45iya0tTE2O9/rbC6B/nlhYSwGzTosBBJmW1zZ5nVm1a4fNf/YJQs3KxHwD4fN9JRIWaNHP6EnuFY/yAGOwqrFDVk4NPXVRJwTYfbGVEwN3rS6k6K/dYSugyjoaW0Rf2sWiPe1NKX2QePq1oQDS2tnskwPgMpHONx/IlVQTIQrmeMrrf5nLhl9N1mkxoVfUtWJVdjLEJdiyZrn0jsmuHOxXnbHYFDACiQ01uWdPDp33+Xlnf6rMz5dHvbnNh0bpcqu/pzh3BAXXNyPg+m3XkDGaNuUjUMKfNQ+3sKHF0qAlTkp34sbgqIN9nswShXqOcbS6OCAv+79ok/G1jnlc/IiHqm9vwwIf78HD6INnKS2zndFdhhWaOBl9NhdDzE2Q0YH7aQKzZUyJrh539zGXmlkquIVoYBucz4wbEeHYvxRBqjMrnMFbVt2DpJvp+R+xjZOWV4ZO9v1IFMrWqkSB1if4au1KQZ1aL2rpGltgPO7hpNABXDemJrLwzgMSxazSs2SHKpGrXgvzTZ736XrS7GCzZoH63nPtcZ+aWYt5qOufFX82Du4yjoWX0hX2s4vJ6qs9cPdSJS/vHKBoQRALs3okJPprQZAGalOTA2h9/pToeA6CivgV2mwlV9a2i53K2uR2vfSNfAk3oe0k0cOfCNKy4LQWL1uVqUmDuiLDgtVmjAADvZRfJVqLobMgQ+/v17t0jKdgpHACwaN0h6pz17ixxq6YZmdBnS2uaqGUCpRaPzowSGwDccknfgOrBv3X7JTAaDMjKK1PUNEuMpjYXjEYDsh+/ChlbCySblJLf/BalQpbQvRwdF62q9xIfZTVNuP/DfViQnoj4WJugyMCeokoqp4oNeebITo4UDM41Q+uOBBkNeOGGYZJFtGKOAt+uaXqSe6e0pLIBcfZQ3D4+HuZg4TJXcozxA2KwcMqQjrol4bXUEWHB9r+m4V/fHFXkCJOeXrE2i+DubaAor2v21C+pTV8kdknPMDP+OGEAfq06d/2DjAZkbC3Aquwi0VoULefLtT8ex/y0garXgoxtBcjYVgBHhBWzx/bDz2U1muxSs59r2lTfeybEY3Sc3W/Ngzvd0SA7AGU1jYqa9bHhRnLaXQzW7Dku+TkSQQ4yGngHhNSiRP7EpwlNDKSH0xNlD7KZI/tQp9poBTsaODnZicaWdtUa8QYAS6YP9Sx8seHK+20ECm5EjN2llOY+kmfi0U8PyIpQ3Z0a3227+kqlxADAkg2HedObtKqdEFo8yDx1qqoBVpMRTQFKySM
4I61YPC1JdYokLZ6Ukv4xHoNpdFw05q/Zr5mBztZofyg9ERc7wqgcctrdAKF7ubekiuo3yNnNIYdjO7R8u3ByoqDc9UxO2t7STXkwGtFt55LJyU68cVsKlmw47OXYRYcG44ZRfQXTW4Xg2yl9e2cRtRFmDjbiuZnJgp3lAfcaaQ42InVgD1mORlSoCS/cMMxzHrsKK6gM1ghrsKbS92yWbjridX3IDs+rW44q6lLOADhd14LkPpG4Z2J/AP7p0UMDsY/GJtg1uYZltU2SQRYa/jA+DlM6VPDIc007Z6zcUYzRcXbsXJgmmPqphk5zNNpdDDK25vu0nVcK3xYPbfSIXZTD3TYtLq/H6h9KcLpOWVSfeOOrFDgM6UkOjEmwy4qGS0G7W5NdUI6xCXbVGvGOCAuWTB+KSUkO7CqswJm6JpSryGv0N+wdKL4BJ7cJmNxt8PSOIrruCM2kWFbbjIytBXiIozCltnZCLN1k88FTeGp9bsC12G8f1w8Gg8ETvQtk2iED3521aJtF010Abj3F5GQnGprb8ZdP1Te/s9vcKY58qay0xv7frx+G4xUNktFSIUp5duHkNIQFvO+BHCdFjsDBhQp7LS+rbULl2WbYbWY4IkN8DCixmjA1u6zc85GS9wfOqVVKjfXJQ3vh9nHxGMfqw9DuYpBdUE5zeXD9yN748Ifjmo5pNtzrE2Q0IHVgrCJHg0DGgFa1DGrP4+qkXgERm6FhCk/appw545n/5iFtsHKFKzE6xdHIzC3F418c0lTrmm+Lh/Yic4tySAQvM7cUy7LyVT/MDORJzLGNniCjAY2tLiz4OEflWZw7FxoythXg830n8OSUIarSDF65ZSTqmlpx+YtbZe0SBYqoEBPmXTkAsWEWnwWIL9fa36kzW38u67YdfWnH66tZR5HYMwzRNrNXd2aliOWhPr85j3en0t8YDcAHu8/txr69swhDnOEB+/6rBvfwMZ78UZ/CraeoatCmD9DMkX2wJa+Mt9aHViHOEWHFzFF9MD9tIPYUVeKr3FK8v6tE1nkwAJ744hAmJTmwJa+MuiGszRyEV24Z4XUP5Mw9ek8eN0FGA2oaW/BS5s9ez4HdZvIId/DVX5CAU9rgXli0jr+/lpJrLCUYQM6Z1DUILZH3TUzAE1OTvF6TG+F/f7d0toca+K6P2uLwnuHWLqH8V1xe72PTCBFhDcZtl8bh9e/8I5YhFiSLtdFnj5TWNPmk99HWRkoRcEfDX54owyOBRDsxs/MJCf54mCOtwaiR2GbjM3qUdIcUIyrEhJpG8doPwP3gqZWq/HB3Mb7K9S2cFnIytCw+p6G6sRXJfaKojXt/NQEjrNxRDMCAJ6clSb31gkOOITV/zT6vZ4imt4AQ0TYTLk2IQe7JGoRbTJ4I4eaDpZ3iZAC+46O0pimgKQLf/PwbMnNLFRu6ciFOjJr7yCYixCQYhV6WdRRRoSbUNPDPgdyFm52vL9fRAICqhlY8tGYv9h6voZ4z6lva4eI8BHLnHi0abZ3vCNkbbOEOPkjNjVSaJPsaj02wexyI2DALwMAjeUurmkeYnOzEvRMTsHJHkddcYADwxwnxvE5GZ0b4heA+g2qKw+02E8pqm/BedlGnCspEh5qoa/4MAF66aTia2/yTaitZrC0zvsCtIdJqZzSgDfv86Ymerm32aXBE2zBv6aYjPk27/CFj2dwu/bA5Iq0+N7WqvkXThlNzUxMCNiHxORlsuGPDEWnVrHESLXIitezmXP5i5Y4ibPRDT5GuDhmvNHANcSWCBVcM6oEwSzAq61vxVW4ZMrYV4tZ3fsDov2/xpEspZfG0IXj1lhHu///9SMy/cqDiY3UWpCEdQU4DUrkQBRa1zgxpXrpmz3HRWh9i5HB/i9DC3e5i4HIxiKKUluWy8dBp2evJU+tzva6/0saAna2U1lmosTfIZ2hrsbLyyryaR9769g+49R26pqB8ZOaW4q3tRT7zHAN3MIp9rK4Q4ZeC/QwKNV6N7mh
QLPRsV9a3YsHHOZ0uJCOnvwqx5fwVpOGzF9mUn1WXpk5+K3ctkEtAdzT8qUHPt00nx3vmem7+mJyFJi2bJQizLrmIt0BNjjSZFCRS98DvBuDXyvoukVvoYtxGWWy4xSvyYzRCUjWEMP/KAUjsFY7YMAu+LyjH8m/lbVHSTALcHN7lc0Zh6aYjfnue56/dj+BgQ7fKrybjlfa+q+W7o7/xvl7d0IoHVyvfyYsKNeHO1ASvceyWVFWem9wZ8EnEqpWqFIIosNhtZpiDjWgRiQCS3QiAv6h21ph+osWVDNy7DAvSE7H2x18lVVY6q+iUdPcm17/dxSAyxIy7UuOxLuckdc1Qd+2nEcieN1KKbFo3BX28Ix0vyGjoEr19pOA+g0IpZHzpjl2Jm1L6UNlN4dZgLJ7mW3ejZSaE3WbC4mlDRJ+n2DD1wjta7IwG1NHwd2SF74LQSqtxHZVATs4RVhMW8cgR+iNSMX2EExNf2talmn3FhlswY2QfH2P+4asSsYxCujd1YA/P/TYaDNSOBq3evFBfh8XTkhBtM2NLXhk+3XsCdRoreHTH/OrJyU5cN9yB/x6k66CuFH+m6FU3tOKlzCNe6Q1jE+yw28yaSEUHEu6c7c9O2wDdztQLNwwDAMGiWto0hdZ2F7577ErsLakSzJfv7JQUdvEr9/dGh5rQ3OYSbGbW3ftpBGInxwB3fwepYK+ceg4ax6G6odUjiqHF7xSaD+9OjUdFfQu+VLHD7oiw8D6DfClkXgX8NY1YuulIl5kzHREWpA6MpXI06praMG/1PqwwniuE1zpIU1Xfinmr92OFkT8gmZlbiqdV7MpzUfOcBTR1KlDGO9/iuHNhGm5K6Sv6OW6+ZaDSd8h3ctEyUuGMtOLeiQl4c3uRYidDaGoMNQcpPzG4n4vM3FKvrefZK3dj7Y+/IjJE2BcmaRKj46Kxq7AC63NOwuViZNW0SPWsIIYG9z6U1TRh3up9qGlswf9dNxR7n5qkWX45Qei5uJDJzC31u5MB+L8O6M3tRdh88NziHGQ04PqRvf38rdrDN2eT+XRB+qCAn090qMmjULVzYRrW3DMOr80aiTX3jMPOhWmYnOyk7p2Usa0QV7y8DTWNLZgxso8nh5xAE+iJCjHhxpQ+Kn+VMGRu5JuDqhtaPU4GbQpYdyIQ9gYDelETtn0hBq1Bt+r7IrS7GMW/k6yfr8/xTWNyRlrxxm0pWHzdUPSN9u1gLYfZY8+pera7GM9avauwgjcdhzggjsiQLuNkAG75YbkqnOyUI6GUMaWIpTVl5pbi/g/3KVZL5UPNeArojoa/C2kJQhck64h4vQDhTF1TwNM4yOTCjurnnz6r6pghJiN+d3FP3DYuDmPi7Rj7XJai47A1/L0iiBEWzB7bD9UNrVjz43HZvQVIxK2qvoU3Pex07bnnRKhj5fQRTlzx8jav86JZVsXUFNi9XZZuOkKlOGIONuLm0X00Lx7uTvnVtA3JzheeWp+LazqiWQAwKckR8L44hCenDsG+45WSNVMEmmj42h/9q1rDR1VDq1dhKTciStM5m41YSgtVZLmxFTeM6ov/HT6tqgcUHwYDUFHXjGe/Ep+DIkNNsAYHeQWQtGq0dT4TCHsj1BwkuKMkhFZNQas7xsLouGjZu6VsR3RyshPXJAsrYY0fEKMq7TM+1gZAODNA6DntKmuf0QD8KW0gmttccDEMHBEWnK5tlnymhDJsJiU5kLE1H+9mF6NGZWsHvu9odzF4/ItDqo7LRoudUU0dDTEtavK3KcnuxVZo+ygyJBh3pSYgPtYGe6gZf3h3D/UkIXZB9hRVUkvMkoE+OdmJ1+ek+Cjc+AMSudIyJaGx1YWvcsuQ82s1fn9JX8VywlOSHYi2mb3SDIrLG7Bmz3FZizobMtEtnjZEsAkZWUijQk2wBBu9eqJEhpgwITGG17AXulVhlmDccklfTBJp1iTnHnB3wDYcoC/2o6U75VefD7nGcuDm2NPq4/uD0ppGaie
DIBYN78x7JWSAKHFUxVJaaA2d8vpmvHTjcDy4WtugFMNAUvWPgdvg/OjuFBiNBs0bbZ3PsNNV/IVcJwOQntPHJtgRFWKisley8srwl09yBJ0MYmcJNaAlBr6YEta4/jE+n5cDe1dOTi+SrrL2RVhNeO2bc45WVKhJluPKnUfcMtfq2yYIfcfuwgrNWkdotTOqmaORmVuKJRvyvKMqEVYsme7OU+YabwaDeyIlRIWaMPeyBMxPG+j5QbsKK2Q5GYDwBaFdNKJCTV6OytThTmRglGRxaFSHYoLcG3wuqt+Meav3+yXyUlbThGXfKI9IvJtdjHezi2G3mfC364aiuLxBdSdL2k7bpHDzoz9eip+KqzzNs6obW2Wn2IRZgvAkTy0MQWk+9pm6Js0Nr+6YX91VIlha8lWHOgwx/NiGTyDz/j/56QT1e2m00zvzXhEtfW5QS+kYJAGD3ccqkDow1ut7aM9n/IAY3HciodPkkMvrmzFjpP9SuM5XJiU58OerBuJf3xR0uioT7ZweZDRgbmo8VRBPqgidrLNSvTukzueFG4bJzu4gv3d0XDSueHmb7F4kgcqAESLMEoyzzW0+Dh8RorBZglBP0ZCXPY/4SyGM/R27jtE1bKRBq51RTRwNkg/Gpay2SfDhJDsEd6fGIz3JgdFx0dhbUoWNB0/J7uAKeA8o0oGaPaBoF425lyX4DMCpw3vjDaPBx1liN/0hk0fG1nxZUX4GwLXDnYIpOlqg1XEr61sxf22O6uMsnjbEo8pD22n7myOnsSq7WNVvKattFlROUDMB9Ay3amp4ddf86q4SwdKS93eV4P1dJV7GO18xtb8bWNKk9UxJ7oU/jE+gMkLU3CtHhAVNbS7BPhZi2G0mVNU3+zTLsttMmD5CXQ3MvI/24YUbh1ErxXANxyemJmFE3yg89vlBKgNES2LDLLzrXnems9TC+JA7p89PS8Sq74sFA5c0Reh2mwnfPXYlzMHuUlyhdY/PAeG+PinJgTduS/EJJkeHmlDV0CqY2vz0dUnYW1IlGUzkUzXyp8odDUECt4k4R+YgI2CB4Fjncyz9sRPs9HFelY17owG4+/J4pA12aD6PqHY01OSDGQBszi3D6Di7T569nA6uxHDdkleG1Be+8UqxcURY8H/XJiEy1Cy5HRkVasL8NH69e5qOngDwUPogXOwI95ngbOYg1Atss67c0TlRsM7AGWn1kv6kNVi+zDmlyUQj5BAonQCiQkxwMYysDpxS2G1mPDszudvlV3dmapG/4aYIsOeS8rrmTteGB9xzHK18YVV9syLniMzVL2UeURT9H3VRFO/Ob2V9K977Xn4zPTbVja1e90jM0OEajsQw21tSFVAng6SWPvJJjte6p1VH3/OVzlYL4yI3Mkx2Efh+A3kWeXoUe1FZ34q9JVWCY1qoZmL6CCc2HCjlraXIfjyNSpKW/Xtpg4lltU0+zrJQYEbMntIKsebKJNNCiHOp4Ule18sfap+zxvTzskOV1tS4GODtHcUYHWfXfHdUtaOx+5jyfDDiyfLltsrp4EqcDP5dlWZqTfwXbhgm6r0FGQ1e3T9Jbj73M1xDIjbMgkc+yVE9MOZdOQD5p8/i6zx5udZdicXThnhdr9Fx0ZIGiwHKGrLxQRwbbsSmrKZR0fGqG1tx69s/wBFhFX1W5fCUhDb2hQrbsOsqBoJW8KUIEAOAdiEGfHOttYTW6Xf39pGf5ulkzdVvKUwx2n2s0u/PBvseCRk6bEMqUJFzPmdHyODRqqPv+UhXamA3/8oBSB3YQ1FkWOzZI7WuUggF1oQcsdKaJt4AgNjzNDnZibTBvfDBrmKUVDYgzh6K28fHe3ZSaOeVpRsPe/WGYTvLHsnbWndgZtmWX6iOqQQD3DWgtDW9fDg6HDaugI7dpqzhpxjxsd6qYGpravwhq6/a0dhVWKHFefhAFmZ2B1ehiBIAVVX2tNEfMdUEvt0OYkjsKqzwijYpZc2e49RNmroq0ZzI/96SKio
NcrWwtzH57qNaaVq2QpZa5EroXUiQxfXxLw75zaCmxRlpxTVDe6mOlBOEUgTkpCE9d30yDpyo1rwWwGhw71JIocaImz7CPb+qMQL9HcX01GsUVngVVwv12whU5Pzuy+OwmdNd3BFpRWNrO+84kdO34UJDq/QUsmbwKS7SktgrXHBHQUw8hyCUSbGnqJLK0eDWBxBjfenGw7KeWbHniW89fXtnkccucrkYquJ2rm3DdW5qGlvwUubPfnXoya+irZHhEmoOwso/XIKahhbBnVca3IqecVS1sNz1Q2lNDaBNcz4+NKjR8N8US9vBNTu/XJFREhVqwvLZKRjH0U/nQ0w14f4P9/l4kGznRav8fS2cjMlDeyHzcOftiHCvRaCaKgFup3RLXhnvfayi2DGJCgkGAwOvJB05ns0cBHOwUXRbVQzffMvux+RkJ8ItJtz6zg8B+052A0bugq6Vo0HgPvPuZn4mqvEdbbPgialJaGlzYZWG5+ViINr8iaDGiHtzexFCzaaApMbRFmoK8eDqfV7jnMzn7JQCtZFzOXnn7+wswetzUryeT5eLER0j/jIaujpaNbADfOVfd+T/htcpG8ICwkEEoWDX9SN7+6gi8ilCya0f0mLXje95kmsXyf0+4ty0tblk14deMagHLh8Yi4yt+aJpUGx6RViwZPpQTEpy+NicNDS0tMPVzqiquX3oqkT8+apEAG4JcbFieK54EWFyspO3poYWre0y1Y7G+P6xyNhGP/CUEB9rw86FvrmBHnUqhVX21Q2tMBoNkk6G2IJCXuMOJjLQ7kqNR5+orhOhHtgzHOhER4M78dJGc+02M6rqW6gGLzcViy0UcPmLW0XvoxitLgb1EkW19S3tqG9ph91mwoi+UfippMqrY7hQ8RyhsbUdW/LKul26A5dyiui6UtxOxRBE2yySRW9jE+yapyvxRaBmjuwjqSADnFsArh7q1NTRIAhFwEk0lKhoKeXN7crV7+QQZFAXwecGE/hSR9RGzqNtJswY0Zv6Pi7dlIedC9M894Y25e5CVHMTQ84OoVBNAp/8a01jC76g6AoNiCtMCRnnlfUtHoVHqSwLOfVDWu+6sXt+ybWL5EKcmz99nCP7s/dfMQDjB8TgInsIdXT/lVtGepTnFk8bQp12z+bz/SdUzQvs9PxZYy4S3VmpbmgVtBf4Us4On6zGlxQy/FoLs6h2NMYNUJcPRkPPcKuozrPSKnvAV36SDyULChloZHvT36oytFyaYMfqPXTRU7lwJYu9/gb+iZc2MrN4WhLmraZTn3ht1ijEhvkakbsKK6juo1A0VE6EtKq+Fd/+8huWzxnlY9BuySsTTA2qaWjttrnVbPylQLUgPRHz0xKpUknaXQwythZoOre5U5R8d8/SkxxUjga5LmMT7HBEWDRJySQIRcC1rEFoaJHX1FMptZQRTFr4UkfUGvCV9a1Yf+CU9Bs74N4bOfK73QkaWdRQcxAWpA/CHZe5awn+OnmIaBqTEmOdT2GKdheslKLGhqZ+yB/1KuR5CmQvHanCdy7szIDJyU7clRpPlWpWfvbcfMpN86ZFSW8VNg9+uNdrB0bKrhJLjyR2c2ZuKd7NLpK8X/6S1TeqPQDJB1OK3WYWdRPEcodJO3tGxTB6f1cJZq/cjctf3IpMgWidFhGhruBkRIUE47HPDvrFyViQnojls0d56mrYiEn7kcgMJD43dbh7Uu0VIT74DQCe23wEYxPcygnjWWlxWXl0fTeCjaqHhVsVBMDSTb7nMinJAWsw/3eQx+SZ/+ahvSs8NJ0EMRa0yiw3GoDX54zCQ+mDvJ5BMoeszzmJXYUVaHcxaHcxeC3rKFKWfq26XwwXF+NOy9l80Huukfq9BngvnlvyytDUJs9ojwqhK0Rkz3fEwLoQlcDkwnbEAG0MeLlzMfveyH1mugtiawqhoaUdz24+gite3obM3FKPQXbtcLdE8saDp7zmAznGujPSKuggyDXOpdaByclO7FyYhjX3jMN
rs0ZizT3jsHNhmma7bmy4z1NX3ilbzOmXNSnJQfU59phW+vvGxKsbb9w0LzEnizsn8UE7h/tTVl+9RYVz+WAOCSOQj+tHimufuxfm/T5OQGZuKS5/cStmr9yN5RqkbpGtcT5nQ8uIEPf+kUZ/gaC6sc0v8moAcLEjHFOH98aK21LgiPS+Xg6RiRc4F5mR+tzkZCdeuWWk6HkIDbzM3FKqiDHgmzahhtKaJmRs9d76dG9lCkeiaSaPCx0aY0EOGbNTcE2y08up2HzwlGcOeWhtDmav3I3Rf9+C4Uv+h1ez8lHTqG1UnM38Nfuw+aB3NHvWmIsEd/UA31QIuTst6UN6Ur2PrczWVdR7uhLEANHaGaaBvRbRBmm6UyE4QWhN4cJe99k2BZkPLn9xKzK25ssy1u9KjUdzm8vjqLCRY7zSrgPESeIG1tpdDLILtGnexvc8deWdsmiOuIsSp1zJ77OZg3DHZfEBnxeEgqhy5vDIEBMeTk+kdsrkoFlncKXa8JOSHLgkzo55a/aJem5/+eQAwq0mjOsfI1jQqwb21nja4F5eCiOj46I161DpYty5f7HhFqqCvvMB9vYdbb8RLrSfY29tisGe0Mlgo/kdkX5IAyQ5lvGxNllSul05YhQIhFID5HLfxAQYjfBp8sZHoJSuSADlDaMBLhfw1PpcQQlnrVIhUhN7ILuwgrqANJCpEUK4G/Spl4zWEmKASOXJM3A3QbQEB+HLHOkUKSWppzTpM90VsqZ8X1CO+z/ay5v6Stb9J744xCvgUVrTJFt96NnNP3v+m1trocR4lbsOuFM+87Equ1iVRCsbvuepszt3i8G9ZnJqWgju9FR5vS/unTgA5mBjwBsNvpNdjDEdfUfYyJnDqxtb8WpWPtb++Kvmc4dmjgbgrY7Q2NKOv0tU3hsNwKmqBlQ2tEjm4DW0tHf0K3B3laW9eWTHgMaAIBGES5/L8pp0okNNGNUvSrNFt6iiHkm9Iz2LRlcdrLRwc7vF62mEofkc7USdf/osdhVWeAqraO4dA3dneK3TZQB4LVa0UrpdOWIUKIix8OqWo4qaEAHAxz+dwFvbi7rk+PrLJwdEc3pvSumD1IGxiAwxewqylc5DlWebsXjaEMxbvZ+qAZ1W0VClkGar8xQUZPoDPmOfxtBfn3OSytG4c3wcb2G41O6E0uBOd2BLXhkWrTskWl8n1XxNDVwRASVNSeWsA5m5pZpLgz98VSL+dJVvXVtnd+4WQ6hf1vI5o7B00xEqpzzIaMCS6UnUheTshs9C84Iz0h243nhQnagGH3y1GkqClTT1QXLR1NEgZOaWYtG6XMkHz8UAj3x2UNaxaYsf5185EKkDY72ic1/lluL9XdIKH9xJp6qhFVt//k3WeYrx4e7j+HD3cU+0Q8rT9keU3R8EIgJPG0XJ2FaAjG0FcHY0N6LhrtR4zE8biLU/HvdrJJdKSldAtq670O5isPtYRUefHgaRlPUFfHTlsSNVOPjZvpP4rEPpxt6hUqSUpZuOwBlpxR8nJODzfSe86gOI4EK41YQHPtyL7Ud/83vPCimWTB/qXrCNBixad6hTewiJGftShj6toXj1UCcu7R/D67QsnjYEkSFmrM85yetIKA3uXMh0he7gfCICT18nw3gN8V0HhPpv+Ov3LvsmH4Od4T5GZ7uLQWSIGXNT4/FlzimvHVkpdUV/IdUvS0jGXMgpJ2UBj3xyQHI+5DZ8npTkQLjF1KGK6h6f4/rHYEPOSb84Gmp7NLFh4N7l06oHj+aORlcY3ACQ2CvM64KT/6ZxNAIF23Pk836jbSb8fUYyjEZDl7imUtA+1NyJcnRcNG8zLKEJVc5EXVbTRKU2AUDRQqAEmvvYnWORQlG5rhY1CzSV9a2qJW1La5qwcod3s78wSxBG94vCE+sO+rUuRQ4L0hO9arPSBvfCuOe/EUwv8zdSqUhChn67i0Fbu0vy2TUagNFx0TAHG72cllibBT8WV2LRulyvNBjaJrPdla5
UX8Td8Z+c7MSC9ESqlKy5qfFeht7mg6U+aZbEeF66yX+/9/HPD3lS14lT49sHxISZI/sgvaMPyJa8MizZcNgrOOyIsGDGyN4+csJCmIMMaGmX96tmjemHZzfl8a77ZTVNmLfabXOxe+JIIeZkRIea8PwNw7zGIt/1+XzfCUwf4cSne+kkkpXA16NJqSpsVUMrMrbm46H0QarPS1NHoysNbj6jtyvmFDJwRzt2LkzzydWurG/F0k1HsHhaEh5OH4RV2UWa5VxyCbME46xEjwgxokJMcDFuhQ4xD5hvAHKlf4W0zcniKgcSUTKIyAtzUyImJztxd2o8dfG4P6hqaO12jbYA9/Mh5OR1lTF7oXG2uR0bD9EpsgWKxJ5hXv82Bxvx3MxkPNDxbPj7WYgKCcbc1ARPXZVQ1FMoGEKkkWnnbBcD7C2p8ko9zcwtxbw1/EX/fH09dM7RFeqLuLCNwPlpiViz51fR/P/oUBPmpyV6/v385jy8ub3I532lNU14cLX/AmOAO3//1rd/8KzNfKmoVfWteLejVuDcWPGVKRjVL9ojJ5yVVya6zspxMmzmIJiCjaKpz2Idzvmgqe+0dAQHCELB9tKaJt77pyVcu3dLXpmqHf1V2cXUcvBiaOpodIXBTYxGl4vx2WZm5xR2JYgy0bKsfN6HkzuJRFqDkZ7UE1lHftNMIcklV6iaA3siEoq0CQ1ArgMgNCDZ3UblwOBckSVtIRhtXwN/0t2KwdtdDJZsoCva70yn46GrBuLjH0/gdK1wUXU0ZadvHX6WbjqCa5KdXmNSjjiAM9KK5D4R+ObIGUXS4tWNbbjYEe4pwBdKVeFLzZg+womPfzohe4HnygqL7arKNZi6G3LmTn+JgHDhKoYtmZ4k6DgbADzPSsXZfPCU341UGsSMZfYz6XIB81b7rvWna70d5NFx0Vj706+yelQJUd/SDlCkewr1C+KDxqYtq232HKuzgu189WO0IjhiVDdqE/DU1NHobMOIGCCNre1eSk5s43dyshMPpw/yS8GvGlZlF1M/nDVNbfh83ylcN9yB/x4s08TwUttkhiAUadNiAKrtNnp3ajw255aJNjdipyw4IqyCxmQg6G7F4KSDqRQM3MptP5VU4qtc6S73ISYjGlvVN4qLCjXhhY4t8iHOCFG1oSYNvu98hajqFZc3YFnHPCt3DAkZAiSN6oNdxSipbMBF0aEY3Csc5fXNqKxvgT3MPW6r6psxb/V+VWOXGExLN/E7E3xRXTVRS66ssBRyDKbuBu3cGWMz49mZyQDg13TZGJsZo+OivV4TKxhmB+vaXQyeWp/rt3PTEvJMPrWev0aX64w8tT5XtZMhlbEgBI29SmvTkvd1RrBdKFiq1bloYddr6mgEyjAiEQhrcJCXYRLVUYDENUS5xm98bKhfz89mDpJdSKkkJeq/B8tgswSBYbwdBaHUIy0Ryp0kE8mT63LR2NIOR2SILOUnf5Ke5MCiaUnU0cmoUJPn93RWQVt3Qs6EZreZsf94jeT7okKCMXNUH1W1DVGhJsy9LAHz0wZ6JnIhI4HMQVo57ucbjggL7kxN8Fynix1hiuWJ+Z4HoV2Ep69Lwt0p/QG4DbPLX9yqeswKpaT4IwWCreEvd67s7ABfV4QmTdpuM2HXE1fB3NE89fU5ozB/zX6/NNetqG/BFS9v89ntp1EM21NUed7tjorVUhFnRIt0L7I2K0nIoLFXi8sbZB2rM8ZirwgLZo/t5+ndQp4frc5FC7teU0dDiXSbXMjwe+GGYd5Fc2EWPPJJDu9nuNvM/nKI5l05AJcNiMUjn+TIcjQswUY0y+zyS2BHA6JCTJibes4gInmQb35XgG+PaitVKZY7ycA9sS745AAA9yI6lVL5yR+wDXe+ok2hlK6aDoeVu63OrSmx+yFNpjs22pIzLivrW6h2P+amJmBsQoxiR2PmyN646ZKLPEWQbLhGgtgcxMWAc07JhcTssf180p0mJTmw8LMDHvUsWrjPg9A
45QaSukJQQy6/v+Qiz3/LNRC6284nDTR9E56bOczjZADA1OG9kQGDIgOYuybwISQbKqUYJvd5UBIYU1ow3Nk4OlQlaQVfAN9Anlhq5DKJzBfusbQYi/ZQEyop7sWDvxsAS3AQ1uw57iUsQAIvWpwLt4mhUjTvo7F4WpJmhUnRHRFl9gDgqn+QAbqrsIK627K/isIH9QqH0WCgluAlKHUyuNQ0tmJZ1lFc7AjD5I785prGFs2dDLmU1TR1Wr2DlAa9WEoXcVCtwUZ89MdLUX622UclKzbMgu8LyrH8W/Xd6QnThju7ZYFnVX0z1YLtiLDgRDVd08P4WJuqAMi6nFNYl3NKsPaIbSRIzUFsGAAzR/VBZIgZa/Yc93KabGYj6lvOz9SrWp6d2S15ZbKdDO4CRzNOSSBJToOtrsKyb/Lx8U+/yjYQtDIELkSUNDOcOtyJBWfoU6uJUU+7C8LAV8GJDZ/RGxtmoTq23WbG32cM9ekTYbMESaYnVTe0elKx1RKoDIDF04bgztQE7CmqpHY0uPaAsATuECyV6AMHuH8n27ZQY1tGhZqwfHYKztQ1eYK0YvxcVottP//Gm755/4f78NBViaLp3wYAoRLPxvQRTk0CnprL23Jbvytl/pUDsWCSW1aLphGRnFw6fzWakdP12R9wF1x0/LcUBgChCtK95JwXQBf1kYKkzZHdBqnDSclSSkU/GZzr3cKWwyOqMI9+eoDagB3eNwIHT9RKvm9nQbmketeFRmZuKR6kbMz2+zEX4Z2ddKkr5XXN2HjwFGaNuQivZuUrHu80TYxo5yByDmRxdERYsCA90Uvh6KXMI12i+FMu63JOYtG0cwtvu4vB418ckn0cufnGJJCUsTUf/9lVLPv7ugJkZ2b5nBQqY8WA7rnzKQep1CQ+w15OarWjY7deTiBNSDhFyOi9eXRfquPedmk/TB3eG9d07OqR31RW24QFH+dIfn5HfgX1bxCDgdvpqapv8YvDQXYRSIqmHOOebQ+I7ZDSrkVsGW5AWRNDdpZOamJsR+8oaaR6u732TT6iQoJ507/Jd5qCjACE7b4NB0rx18lDupbqFKBdjlrqwFjPj6MpdKONApH3iRViLZ42BPln6mVFNRyRVlTVt2DppiNUn/EX7J0bdPw3zWdMwUYqxQbyWxmGwenaZlkTiRZOBuAekABUN+MB6J/Xez/4CS/fOAJTh59bFOT2Nvm1ki7fs7qbSdvSGqOh5iCYg4147Rv6DuHs8UjUypSmCEg1MaKdg3yVWJqxLCsfK25L8dzzJ6YmYUTfaB/NfC7+VswJMRnR7mKoZSYr672f3Yyt+bLOjU+THqAfpzS9CUjamothePuGdJaqGfnORV8ewh3j4/HaN8K/Reg66fgilJokZNjPGtOP6rjsiLqSHXt2yh8AQaP3X1vp5juyvnJ/L63hqqV0/vUje2NVdrFfxhJ3FwGAJ5AkxN2p8Z7+HkR+WmyHlJb4WJvPa2K2JV/tLDcYqmUJQnXH/MZdIxwdz7mUjauV2ITmjoYWeWGOCIvgdrBQPh2NV8vdZpaKdtAUMpJHffoIJ6+cW2chx+GbktyLSr2HQHpZKNkRUtKAh8AdkFJFdDTQPq/1ze14cPU+3HciAX+dPESRglZVA32fku5U4Lm7sILKGG1oaVdVZE12wRakD0J8bKgiVaSqhlbMX70Xfxif4PO8jU2wwxFhlZ26IyRVOnW4E9ckO5CxNZ93ESXfPPeyBNmpHnw4I634/SUXoc3FAGAwvn8sxiTYMfa5LLTIcBbIs9vuYrBKhgH28FWJ+NNV/JrtWtUhkCM/31Hjl7E1H6uyi72MLEekFZOH9lLdHFEp1Q2teO2bfBgMvkWuoeYg3DPBXXdUfrbZq/hThx6xaPayrKOI6tg1F0o5YUfUR8dFK9qtZ4/7hpY21Uav0LulbCN/BCsiQ8zUUtRyYcvb8zmLfO8fk2D3Mpa1quMSmpfEbEtSOytkt2jdNJgv/Xtsgh0bD56
i+nyXU50C3A+12uLYpjYXtuSV+URrxBRHJic7JbesGlvbfY4rVojFfViKy+s78qlZnS5l5PPJ4eqkXpibmoCq+mb8bWOe7LoPOQvzgB7hAKQdDba8JwBFE4kSJ2NCYix+N6gHbh8f71W8J1VER4PcnMo3txfBagr2e7Fpdyrw3HUsMDVEZGFf++Nx7FyYhiCjQZEq0le5p/FV7mmf1IcgowGzx0pHiYTOjR09YgdUxibE4PU54T4yq8TxnpTkwNofj4v+Bnb3YLFuvlyDdRelE8iGPLt7iiqpo6QL0gfhofREwb9rVVdn75AzJfdsfloiLomzdzyD7vlkXP8YZGyV3hlxH49/rdMiksunpNPQ0o7/7Crx2tXTu4QLwxeYBCBZ72Ng/Tdfygk7or63pErxbj0Z91owvn8s7+ti/cOUBCtoIHPspCQHXt1yFBnb6HehpahpaMUDH+7DvRMTeCWmhd7PTntVazzTKEMK2Sc0douWTYNJ+rfRYPBK/6a1MYrL61Wfg+aORpDRgL/PSJbMcYsW2brmezBoFUdW3JaCx784xLs4Vje04v4P9+ENGd1UuQ/F/LREn4nLHyong3qFeY69cMoQZOf/RlVQyR0AUpEMR6QVwZTRsOWzUzBuQAx2FVZ4fv93j12JH4sr8X1BOd77vliwzkNN1GRHfjl25Jfj7Z1FqhZUoUWHZguRzds7jyn6fhq6p7Rt4KKxXIOe3Zfhh6JKfJ1Hv7PH1zNGrXT2mbom0QLFaJuFNxI2fYRTtKZj+ginZ4eErZIFBiivFw5iyN2dMRrg6RdAu5hHhgRjftpA0fdoFeV7atoQ0Zz4z/edwOJpQ7Bmz3HJYzkjrXhyymDMX5vj8zfufKs2bY+NlHy7jhu++2u3mXFpQrRkvU9VQysWpCdi7Y+/ShaSd4Xd56hQE8ZJGK98629URwoeCVZoJZDDnmNTB8Zq6miQ81u5Q9rJIO/n7hirCeRJCcxohdZNg7nPKW3w5tWsfE/zUqVo7mgAbpm4+05UCy58BgDPXj8Mf9uYx+tosB+McIsJZ+qaBHcMuA9R2uBeMEA83/txkTxrKfi8UX9MNEXlDbj8xa0+Gv2A8GLFNwCkJP4WTxuCReuk8+OdkVbUNLbwnhMj4DByv0tt1ETNgirUJwOQv/hr0cWUj0BNYF2N8QNiNF2IaCBjlmbrXQitFzDAHT1alpXPG1CZt3o/VtyW4hWVAtwO9IYDpaLHZRf1CQkZ8BWnLt14WNb5uxh3hHf8gBjqa3FXav+APe+OyBAA4oEralGCSy7Cs1/9TPVekrb30FWJ+M/3xZrmwwul3nVnhO5vZX0LdZpwfKwNOxemSabndoXd5xdYXcS5iNUTEnltfwjkkDmWVk1QLnKOxw0wqdkhlRKYUQJfEFRpKq4Q3OdUbKeLjRZzi1H6Lcp4YmoSXp+TAjtHhcoZacWK21IQbTOLXkDyYNz6zg9Y8MkBqgYwGVsLMO75byS16asbWpFBWWBFgz8mmk2HfJvt1XQ0I1yQnoi7UuN9rq2j49pyGwKtuC0Fjkgr73sjQ8yegiExUvpFYd7q/T7nVN3QKupksL9rftpAOCOVXysyITzz3zy0d8wy7S4GuworsD7nJHYVVnheZ0MmWr5zVxphjAoxqYrDL0gf5HMt+O5fd2Bc/xivvNtA0DPcKvhcyIErvlBV36L4uTAagNU/lIjmarOffQLNjir7HIV+N3HkM3NLPe9RkgJLDAyymItdj6hQk+RuBkDfLVuMqFATxibYNSsEbXMx1M8OOe4nP/2K52YO86TnaAX3OezOiN1fOfQMt3oc82uH9wYAbDx4ymedqRKxTbQiKtSE1+eMgiPCW+rWHmrCXanxiAwx+6yJ6/afxMrtx7Dws4OC14IYke0uRtBWUAqZY+et9k8TRCWQuYkY2YC8cbggfRB2LkzTdI3OzC3F5S9uxeyVu/HQ2hzMXrkbl7+4FS9lHkFTm/qgpgHCMtiTk514OH2Q6Oe
1mFv8sqNB4G7VsyMC63Pk6arTICdavur7Iq9Ov2rwV18OLudyzH/FzoVpeFKgyzUXscKkf/yPLiL37S++es1ShJqDsPIPl3jphRMPWul1Yj/0NY0tvrsUISbMTY3H/LRESXUJNcxNjccyBXKpJDXqgd8NwCVx0T654d0xGhlkNOCFG4aJpsWIFWfKgVz/kRdFIfXFbzR7LrILyrElr0xW4yguLgY4XScdUOGqgNDuqJbVNCK7oByPf35IdHd4yYbDAAyKrw0JvNBEScUisWy0SE+de5m7eHdXYYVGqa7yS3VLa5oQbfNfoWxXSOPpbNQ+K9z0VbHa0ElJDizdpMwBlrN2zL0swUu6NiuvDOtyTqKyvhXvZhfj3exiQVUjMfhSSb2akNoseOTTA4K9GIR+lyPS3W/qipe3dRmBHMA7KCykDiWEAcCaPSW4JD7aq6hazZottNtUWtNELW9uAGAxGdHUKtx7SSxLgjbdV83c4ldHAxAufOns7UYtJUT91ZeDD+7EwHf+Qspc/L+VbpAo6bHR0NIOMPDpFLzithQsWndIlWDAG98V4DueRoTVja14NSsfq74vxgs3DENkiFnzxdwZacX8tERc7AgXlLB7q2OS4EtXmz7CiSte3uaTG96dCzonJzvxxm0pWLIhz2unkyzoACS3eAnRHR23hdIFp49wIvXFrZp2cw9k6hd3wqedS5duOiK6Mwx4942RC199kZjUo5znXa0Bzd450cIYNxqg2MA4U9eEGSP7YFKSA7uPVWDeR/s0S6Xq7HW1K6Dm/nLTV6VqQx9OT1S8vkSGmvCHcXH4YHeJaBZGqDkIl8RHe3or1TS24N3sYlXGKZevct2pl3y2wpLp9LYN+/rtLanyq2iKoeOEaOwtodrHyclOuFxMh4y4+Bgkc+Otb//geU2NEINWQVAGEHUy/jjBveO1Puckr3MktzWEEvzuaAgRqF0AMeROSEIGPCDfO1aL0LlLKXNxuTTBjoxtfjtN7DpWjtREbzWMyclONLa6qJoICcHnZLCp7hAUmJsar/g7+GA3yZKSR165o8hLOcZgAK4a0pNXKUMv6JSWm/73rFH409r9ovOF3WbC7ifSsfXn07wdgYkT2JWibHLhTvi0c6mUk6EGsfoiqfvKhW+eVWtAs3dOtDDGXQzw2jcFinbaztQ2eYzG1IGxeOHGYR4nWulz2T1FJPhRc3/Z+fc03ejlyDdzqW5opeqR0dDSjlvf/gFRISbceVk81v54XPP56/1dJXh/V4mPrdDuYhAZYsZdqfGeHRRCdKgJDODTn4F83h9ZK2zI2irlAInNTSS1S+n1VLNu+0NEiI93dhZj5Y5iz7+595hG/ljt3BJwR4O9iKjt1qsWqQmJfa7F5Q0d0rbCBjyNHK4/z51WmYuN0eDvVB3+4zsi/B95YwCsz6HTiqaBK+8L8O/YZeaW8hqzLgbYkndG8Fz1gk54euKQMbSnqBJjE+zYkleG//vvYcl5orK+FXtLqniN2664lU8gk7lYI0yhCT/IaMDiaUOoi5j9gVSBJK0UtVCg5MkpgxUVlBoNQMbsUV7nRbuwLpo6BA+tFc4vN3D+m/bUnt38M5Z9k4+XbxyOqcN7e4JUSzYc9loraI/ZXUUkhFASxLRZgnDvhP6elFuArhu9lkX9UlQ3tmKZSBNHLeA2EeRT7bp+ZG9M6pDDBiAYQAjE7lqYJRhhlmAvu4w7TwjNTVrsKKhZtwOV5sidv8pqmnD/h/uwID0R8bE29Ay3iq4fDNTPLQF1NLRU/lEDjYdGo0ZTyrphZIIiCypxUvrZQ1F+thkZ2wpRQzEp0XjnfOdOU+D4zH/zkDa4F/aWVHkmBtqH3WYOUpQ+RYwLbpRydFy0Zt0vxaiob4HdZkJVvfr8/uqGVriEdygBqJu8hHLwuxNCc4Sc+YFd8MftkBuICJJSZo3ph9rGFl5JQ6moHLsDOhslPY2iQ00wBxlxpk7Y4ekVYcErt4zULFcZEA+U8En
I0pAxOwVTh3sbGFKprgzgkRIWc2xINHdB+iDJPiZc3A1A9+O+E9V4YmpSx6ve1492DvGHCs75jBIp5IbmdizrkPEkAQqSTiRFVIgJNY3q15euADGcH//iEO9OXWW9O20rMsQskZIdmKyVs81tMAXBy2geHRftZeMIzU1a7SgoXbeLyxtUf7cSyL1gN4H1txhLwBwNoUWE2603NsyCRz7JEYzqqYUm+iMmB8fHq1n5WLPnVyyZ7p7sxRwqKUfCQZHjz3futMoz457P8jI8uMpVQihxMqJDTRgTb8drWflYlV3kFf0htQxKc0rlMHNkH7ybXazJztn8NfuQgVGYOrw3b4qHFpNXdy3oFBp3coMQ5XXNntQUNl35uoaYg7zELLhRuajQYNwxPh7NbS7sKqzwLKZZeWWiWuszRvaRnd5R1dDqlq2GcMOyJdOHInUgf4MwJbS7GCzZwL9jpWTMOjkpMNxxKpXqunTTEUxJdlB9V3xsqJcManF5A1b/UILTddI72W9uL0KbC3hnp/x5cO5l8bh6KH+jRR15AQq2gc2tE5NibmoClmnY7K6z4aZD8fFq1lGs2VOCJdOHCo6xQNWuVjW0YVlWPlbcluIx9GkMfq3XAznHa3cxVL16AoXY/dYi0yIgjgZNriO7W++S6UOpCz/lIhX9URqRLqttEu1WSRwqbtMcZ6QVs8b0Q3xsqNcAHdUvmjfHXOjcaSdGbnTTn9J8zW0ujPzb1+6icA6lNU14a3sRrhrcA9/8/JvfzgFwN74Zk2DXpH7GxcATieSqezgjrdTGiRjdsaBTS3WwpZuOYPm3BT4dr7vydeWOEW4kvaqhDctY3aBp04iUpg4KzVc00XOxWjYh/vVNviYppvOvHIjUgbGe75SqWXO5gAdX+641ZTVN1ApibBlUAsMw1GkuSpwMANhw4BSeulZPl+IiN1BIOGdg0zknJLtgftpAXOwIUy1wcr5RVtvssXn41kIyxvgcen/01aA1hsn8lH/6rKbfHxtmkX5TB3uKKjXpj+GIsKCuuc1vvb0AbTItAuJo0OQ6ciXWVtyWgsc/P6R5DuRLNwzHhIt7KD5XKYS6VRKHyhpsxJNTh+DXqgbE2UNx+/h4mIN925nILaCsPKtskfbndi+fg8H97h/8rPtO9KODjAa3ykthBeatVq/ywrcTI8c44aM7F3RqXRhXWd+Kd7KL8U6H7CORolS7lf+H8XGIs4cKpirxER1qAsNom89Nu0hX1rfAZglCQ3O7rN9M5qsQUxCW352C8nr+FCmuU1FV34ylm47IUph6fnOe6p1NMnYWTBrkOT+pmrXlc0YJ3kfy+w0iBpHQeM3MLfV7Lj3gTgvtzmmWfPhLzpwLN7tAC4GT8xEGwmshuy6U2DJEAlxrJ4PWGFbToJXqJCih3f2IDAn26lPWK9yMOZfGIT7W5qkb9qeTwaZLy9sC9CfIft/kZCfCLSbc+s4PIp+Qz5/W7scLNw4TXPTUXEwG8FIZ4vt7WW0znt18bnFb/m2hV3EVexGnLaAE6FOgxI8hP59bLWeb2xFmCUZ9c5vmiwNbIQpwX8/URG1UXvigMU7Y50abFtcd8GdaE3vRU5uuNyXZibEJdvx7W4FkesHcy+Jw9VD3+3cXVmg+l9FCFiK56Qtk8TYaDT7dyAH3os0tYOZDTIxi88FS2feDZuzQ7KJLSVqy53Pa8apFY0E5dOV0wM4gUEo+fDt7gRA4ocEfuwVy4SuSHh0XjXk8u4daIjYelO500fLNz6d9FDaFoN1d54r1GAxGXOwIBwAsyzoq+lu0fg7UZAT4rTM4G6U6veMGxKjqJM1HdWOrp/stzTn4G1JcRbpBCp2XFI7IENXnsvjaoVhzzzi8Nmsk5l8p3a1XK1wdq7mW5rXNEiQoOad1B1Q2DM4Nbu7vMXT8776JCYKd2rtrQac/xx2Zax//4pCn9kkJpLP0lrwySSfjvokJeHp6MsYPcDdhLK/XXnlODtGhJvTidBWOCqE
rAORbvDNzS3H/h/uo0p3YYhTsjsrtHfr1tDgjrXh9ju+45Rs7NLvotEGVu1PjqcdroAxdQldOB+wM/O14TUiMxeJpQ/DdY1f63HtS/KxmHVO7BhoA3H15vMqjuOc6tefC3mXIzC3tqA/1bxd1ofEQiJ2ud7OLqe032meF21/ldEeK/uNf8DddJcTYzPjX70d5bA41GCDcWZyWgOxoKNXpVaIeQYtQPl9n9vcoVaHJPDouWvWOhCPC6tlB2VVYEbAmZA0t7YqUW/gwALh2uAPLZqWI7gzIadSjhLtT47E5t0ywxuavk4fIzmO/kPH3uKMpcJRi7mUJACAZsY4KNeGvk4d4vdbZBmFVQys++uOlMBoMnmfOxTBezaeE4J57u4vB418ckvX9fKkNe4oqZRkeZOxckyydUqqlwZme5MCiaUlU4zWQOwzcxV9JbcyFhr/H2Y78cuzIL8fbO4t8djS0KH4mawTgDozImbOckW6ZUjlpnWJoNQ9ndaRL+dueEjOGaQMA14/sDYMBWLdfWW0bbZ2IUtuWXEOp56KivgUx4RbNerudF/K2YgNQKmVkcrITr88ZhflrhPXM5SKWz8c+185C7GHlW0y25JXhmf/mKTaY+Ry9sQl2OCIsfukBwgdbuSW74DdkbCuUfYzbx/XD4muH8ta8+OaSt6hq1COFlHEiJy2uOxAohRKlkM7SNAtWdUMrXt1y1KsouSs0KC0/2+yVAtXuYhQFgHYXVih22tiGuByjfEF6oseooxk7Whmc7Bovvu9sdzHYXViBXcfKARhQWtOoyfdKwU0Llduo9UJlbIJdUm3KZglCuCVY1domlA6opvg5OtSExdOGeI43KcmBhZ8dwGf76Brf/f6Si5BXWqfJjlqNhu0G1uWcDMicx02dZK+9ZZTj8kuVfbfkFE1PSnLIlm6Xw5m6JswY2QeTkhxYsiEXH+yWr3Ll7kOkPtMiYPK2QgOQRsVk6vDeyICBVx1EDUILHTnXp9fn4nSdf7f6uIg5QUp7DBApWTmSuVvyytDUJtE0QkPYyi1jE+z4fN9JaqOMGERLpifzOmd8181o8J8xazS41by4PVU2Hjzl43DoUchzeEQgZEbyAsFz17ufLVrjOGNbATK2FXgZe53tSBHjm69pKhexAJDbqFZ3DgC9SovdZsL8tERZ30Ozi05TS7V4mrgMemc8q1wHQkmj1u6MKciI7X9N8/RaKK9rlr0LwFeDQOAKudAev6qhFfNW78eKjuLyIKMBkZTpjQA0FSDQYn4ywF07WuHndCluI12+9V6LGlZaxNYI9txbXtfs17mDzLVBRgMMChszuxggWoNrF9CGfXKVlNhMHe7EG0bhbaCoEBNaXS5ZFfhiUa/JyU6EW01UqQX+gPuwKu0xEGMz47vHroQ52Egtmevvoik2fFFTOduK5MmZNaYfryEv9Fv8WSznYoB5q/dhhTGFNz3Lydoe16OQ3kxKcuDp9Yc7+zR8iLa5jWK5kXJi7D3c0Sfo4fRErNlz3CuaGh1qQku7vLlLLnabCWW1TXgt66jP9xsMviIWUaEmPH+DkGiG/EWLd3eEcgzePi5etvMttYsuJdxBEFpkSY2KGsxBBrS0S59EVIgJc1MTfCTQAbqid7Ua+OcTe4oqJdfE6oZW7C2p8mom+/bOItm7jVKZEeS19Tl0OxIEcr8A927A+QoD4LoRTrz3fYlfjm+zBOGPl/fHn69KlFzv/Snjz6W8rhnrc07y2iJye7QogW+ujbOHKj6eFumgAXU0AHjSCIizsaeoktrZYDsqZbVNyM7/DVuOnEFNY6ts6Ui7zSRZ3FKuUDJWC9gGjZpCpor6Fs+kSuPoBUoekA1f1JR2W5E0FmM3O2PLmWr9W3qFm/HMjGS4XIxkOt8jnx7gNR5JR3k+unsUMmNrAVWjMyVEhZp4u93SkJVX5tltk5MCRd7Dfj4dEVZPg1IyBtfvP4m/fHpAwZm5iQ41+RQOsqmsbxWU3uQzuMWONX5
AjKz6LaHdEdoC+f49bNTfxUZsF31KsoNKippvkSXNBdVC42QAwPI5KYJqNnKl4y90lChcqk3blPpOOR2g2fcLoBcs6KpsOKBM3EYIdlCkvrkdn/z0K4Y4wz1NA8Wc7kBgNMBr94odVNSq1tgA91pW1dBKXYpw+/h4PLv5iKIAqxZpqAF3NNTmkpJIQWZuKT7fpzz3b+bIPpLOTWcUcPJ5o2qVTLiTqtiCE0jVFLvNhOdm8kdNaSJTAL9BxI4ia/1b/vn7UUgdGItdhRWig5YBFEWou2MUkpCZW+plkGsFe7JXaky8k12MMR0dpdWmQJ2ubcKyrKNYcVsKxibYkbE1H29tP6bgSG7sNhP+dl0y5q/dr/gYfAg9g+P6x8jKLRZKj1WqRigHoeBKxlY6R4nvu92BLm2c4VBzkGC/IbIWjBOZr5UY1hcytM9KeV0z2l2M59mW6hRP+518tYBKuoZfKPdL650EblCEHZiLDDFT3bvo0GBUNbRJvk8JXJuAnF+IOUiT45OZ+PkbhgHwzYgQmmvNwUbcMyFBlpS4ln29/OZokAFXVtuEyrPNsNvMOF7ZwJsPLDeKq0XUPT3Jt4Mzd5IYHRcNR4RV1VZXkAGgDFwJeqNqJx05C3UgJ7jF1w71Wz8TA4BV36trAsYH2eXy53XqblFIwH/9Bx6+aiD+dNW5Jm4rbkvBonW5imQWieGtxigBzj2fT3xxCAs/P+jVkEkJlfWteOJLeSpQNIilhbxwwzDRCB13x4bPYabZHYoKMcHFMF5GIRepOiducCUzt1TS+BNbZLUc+8TJUNpXJxDO2vkE7Y7j0k1HvJSj2l0MIkPM+OvkwR57JTbMgjtW7RENKBkNbsVHQNtawOLyemgr+N45+HsngR2Y++s1F1N9xsUYcFNKX3y274Rm5yFU7E9ekmpeLAQ3EMF1JOSUIjwx1R1sW7mjiGpng4F2fb384mjI7b4oN4qrJuoutIAIFVq3qCyIpnUyAPWRPy5KPNJALkhiDY7UnocWcqZ89Ay3ot3FoNxP6T1sLpSoFg3+2km7tH+sT6FmY0s7FnwiP02JbXizI+VKVNIYiKcnyaWuyT8Rui0dKWNcJic78cZtKT45x+y0RbH0WOIckBQmod2h6sZW3Pr2D4K73nJ3yGmDVGKLrJZzJEmDsAQbvXZJekVYMHtsPzS3ubCrsEKxs6ZlVPJ8QE4aFAlw3jsxARsOlPo8Q7PG9JM0yFwMsLekCjWNLZrWAvIFZDuLrqgCyIYE5miDRzWNrfhs3wlVqbSEP4yPQ5w9VDNJYS4R1mCs/MMlKD/bTBVEkWJUv2j0CDsZcJEjzR0NpYXE5GHZXVgh2V1RqQEmFCVSUmgdHWpC6sBYbDyoPgdxSnIv/GF8gqrInxByPVKtZDiNHbmUShe/riAHysUZaUVVfTMuf3FrQNLLuksUEvCfU5VdUO4zrtQ0t+RLQxybYMeHPxzvckpZWrA+5xSeFFBeEkpL2pJX5jNG2MY/byBKwprh2/VWorZE69ASOV2+3RItpb+Jw8nucVJc3oA1e457GZuOCCuWTPd1ntRIx1+o0O44kmvFl05SVtNEncZZVtOIl/73S5dZp7QgzBKMeyb0R2LPMCzd5OvIL56WhGibGWfqmpB/+mzAem6JYQ+zUNsMBs5/K713U5Kdfg0IltU2w2gweMmSA8K7uFy57fEDYjCuv7tprFzbXMsUbk0djZY2FxatE+9YKMW81fvwwo38efvk4uafrqM6FreBHd+OgdI0LEuwEVcN6aWJozE52SnqlSotVvvjhHjB1CShB5VGrUUsP5s8jvdMSMBb24sUL35dsa/C6Lhov/beYKO2E+f5hr+cqoxtBfh83wmvcU+cWCXOIt950nQKV0OkNRi1TW2dMgYq6ltEU/j40pLEjP97J7rnBe7fSe61JdiIZp5dZO6uNzr+W67aEq1RUNPYKrpb8n/XDpWUW7dZgnBJv2h8ly8tB0x6nAjVKZXVugUk3uB
xntRIx1+oECf4vewiRdFmOWOtsr4loN3gA8HZ5ja8mnUUUSEm3HlZHMbEx6C8nj+qHsjmvmI4IqzUPdBIxsPDVyXi459+9Rnji6YOwdMbDgvukrCDpaRw31/wKZDyzUvTRzjx8U8nvNaijG0FiAo14bnrh2HpJnl2rpYp3Jo5Gpm5pR25z+oW3OrGVt5olJx0LPIQbH3kd1j9QwlKKhsQZw/F7ePjfZq5KU3ZKKttRqVGqlRCcmhslOSFv7OzGKMusmPqcHnpBlILF4libskrw5c5p7wGI3tx45PTtdvMWDojmWrxU5sLrzU788sDZux1tyikP3ewuBFuJV1ZhXbh/FVbwiZ1YAw2557263eIQWuc00itrtzh62Sw4XMy2MdgK/IoUVuidWjfzS7mVaViC01IUd/cjomDelA5GiQlU6rj+hNfHOKNMKqRjr9QCTIaEBtO16tFCWROiAoNXI+GQFPd2Ipl3xQgKrQEL9wwjNfg1HLuNgAIERFIEPoMmZuDjAZ3L6bPD1Epkb73fTGem5mMaJvFZ9yYggwep0UsWEqTvggeCXFa2HOWUCCntKZJsNC7uqFVVQ+6LiNv64++C+xolJzjk4dg+ggn0l751msxWrnjGGaP7Yf4WJvngcrKK1N8jnabWXVnRyE5NGKIc3cevnvsSuwtqUJ2QblkFMHFAA+u3oc3jPLTDaQWrvEDYjB+QAyeFOl+PTnZ6dNHoqK+BUs35cFohKSzwS7QK69rRsbWfNT4KRedBrkSykpwd+Ic1e2ikOwdLK1Rq+QltgsXCJU24mTQdBf2B7TGOY3UqtLFlo2chY/7XjW7WYB8oQm7zUxdQ7H7mHTH9aqGVuw+VoHUgb7pxXLztbsDWu2UCu3MTx/hxLOb/ZOf35WobuAPAAPaZR+Quhg5yoN8c7OcHmjVjR1NEm9L8UlPot0pDDIasHhaEq8xT87vXpmKT+Sz7OBWZ7QeALqIvK0/fjw7GjU2wS7r+FGhJtxySV/e7fmy2mafvNe6JuXGoxY3QEgObcVtKQCEG7ol9gqj/o4n1+UibXAvBBkNstINaBYusfdk5pbyphrRqIzJFRTwJwYAkSEmTRyNMEswzja3CU7IGbNTfHaguguTk524d6L8CZkGvjmFFrEUlLKaRg3PUpzOcDJoVJ8IgRIvkDPvct+rZDeLixyhCUdkiGQNBWk2uu3nM1TH3FXI72jo+KJFtH1BeiLW/virj7E5fYST1864UGHgtg/CLSafNCq12QeLpw3BnakJ2HjwlKzPCc3N4/rHyLrvQkEobsA1NswCMO4eQNn55YAB2HrktGBjRW6Gx5INh71qu6JCglHd6GsP8DlQgWw9QHBEWLqGvK0/f/yb3xUg71QPWcevbmjF2h9/pXq41MjWRoWaAIP2ykbkvJ/44pBEj4hE6mNW1Ldg3PNZuGN8QsCaO6npWBvIzuS0zE2NV6UEcndqPNKTHJ5iWb0juC/tLkbzBk9cvsotRd6pGqo5Zf6VA5A6sIdoCooSmdzzCSnVJzb+Fi/gRvikdgrsNjPKahp9VJsmJztxd2o83qFo2CdGVIgJNY38qjV86Rx8qoYMoKB3TFeaGbs2QUYDpo9wKgpekHv4wO8G4pI4u1eB7Zh4O654eVu3uxOlNU249Z1zOwXclOu0wb0w7vksWSn0RoO7oVyQ0SB7Dlk8bQjvnCRnh1zK7mH3bnv00wOy7FH2+YmJZ9DUV3WGCmVTmwtb8spU2yWqHQ1//vhvj5bj26PS+a1sGEC1Lj0N1Q2t2HrEf3nTQtKXxEhfs+e4rB4flfWt1AtadsFvqvN7lXasVbtDZreZUVXfotkCEBViwgs3DsOkJAfW/vir7MgYn4Gm51PzE4iIzfu7Sqjfm9grXNLhtof5Lwe8K0G62S9IH4T5aQM9zyo7tTM2zAJHhAWna5uFc5WhzEzmi/CJpWswcAdYiIwxdxymJzlUOxpzU+OxLCufKhrJHfPF5fWKAxfj++u7GbR
k5pbiLYVOBuBOjbri5W1e89KHu0uQPqRnl9ht72y42Ql7S6pk1+kSiWCi4CdnJ+Kp9blIT3L41N4C51KfaOs1hKS8AWXBTwPcafHXdNQFAvwZIJOSHAi3mHiVoth0hgpljUjKnBx8745MlPz4C8WcEtou8zcM3Glgs8f288vxM7YV4vIXtyIzV3l0WWnHWqXGpgFuY+LvM5I9/+b+XQnLb/UuIJZ7rEVTz0U02l0MdhVWYH3OSU8Kz4yRfTB+gO+k0h3pan1DaOa24xUNATgTZTgjrVggY+eThlezjiL1hW+QmVuKzNxSXP7iVsxeuRsPrc3BrW//gKY2lycYwob8+48T4iW/IyrU5NNjJ9pmwl2p8YgMMaO9I4eMGBKOSOn7RAyizQdPYVdhBcpqGmG3mRXPC1GhJlwSZ8fyOaN8vt8RaRXMZR+bYEdsmAWrFDo5UaEm0U7hOudQE7RyRFo9Cmnc9ai6sRWf7euctb+rQa7tkg2HkV1Qjq8U2gxk7mevszRU1rdi3PPfCNoqk5OdWD4nhepY72YX47Wso1ifcxK7Cis884zS54grXsEHmUNvfecHZGwrRMa2Ajz66QFs4akdJk5YIC0F8puf+W+e53ooQfWOhpLiugtlu1GtwpZafi6r8dux5XZr56K0Y60SY5MdQZyc7MQKo2+ags0ShLPN8rpzOiOtGNf/3KKuJA/1obX7EWQAjB31MXq6lDBdqW+I3WZCWW2TaLO0dheDNXuOd8LZCRNhDcbT1yahd3SoJ8VIyU6cGGW1zYI1DjUdO7GRHJEMdiqA0WAQTGUxAHjhhmG8ynbvZBfjnexin3QN8t6y2iYs3XiYd14mv33+mv2a1LpUN7Ti1nd+8OkpILY7mZlb6tPgUC4v3DBMD0pQojRotXjaENw+Pj4gqVFdRbpdDSTwSVN8LQR77pe7E1FZ3yIo/QwA4wbEUNuo7F1GMs9EhphV7V4J2TQ0wjzczIfF04Zg3ur9is9FCVqk1Kt2NNwV90PwYIB/vA7wlR8lL9Uq9VTVt4iq5AjJhSoxNntFWLBk+lCfXMiMrflYlV2M6sZW2U4GwK8yJLcjtFv5i39sqHXmLjTGJthVq7hpRWV9KxZ8nANA2CEkxq2WEF13uY4BeUpfumm4z3n6S82LDzJvhJiCsPzuFF7t/b9OHoIQUzBW7jyGeta45F7nmsYWrMoulhSTIOkIuworJIM/WhfUl9U0Yd7qfbyqNWwyc0tVFaA7OHOcjjRKd0hjwy3YW1Ll19QoZ6QV1w534O2dxQHxNNy9FJKRV1oruWYFGrvNhNFx0V6vyVGOIrCln7lqnUpsVDLPzE2Nl/U5Lnw2DU0N6+NfHOpoGXGuDjAq1CRb/lcr1GQcaCJvG23rHnnK3Q0lnmy7i0HG1gKqehC2IU8mhrKaRoRbg1EnS8bW1wnakleGZVn5iufwjFnCErPEsFGb6kPO7fHPDyHcauLNy9TxJjIkGK/fOhr/O1wmq95CDUIOoT9SvRJ62BQ5BmLKWIHuR0PmDaPRt6Mtn5pcVIgJc1MTfGo/xBZiwDcI0hmpdzQBGZr+GHzcPq4fLom36zVcClG6QxprsyC7QF5tqFyuHe7E2xI9ZYRwRFjQ1OZCTQO/EAEfIaYgXJPsRLTN0uUcjcr6Vlzx8jafncEx8fLqNYj0c11TK2/2wFWDe+Cbn3+jPi8yttfnyFPCYhMVYvKSpyXOT3lds2QNK1/ArTODcGoyDjRxNORO8Gr04BdPG4L/HjiFnBP+SxuiJcRkRGOrcIOpCwXa++tODfCWb+OD2ytCrZQt6ZpLlJ1Gx0WrllyOoWj0pFWqjxxlnwuZPUWVkhNpTWMbjAYDpiQ7NXM0Fk8b4m4kuekIr4oUeY4e/fQADp6oQerAWIzrH4Pi8npNvp9NeV0zYsMtuDGlLz7bd0Ly/fOvHIjUgbGShih7J46v0SZBy14dXFEJoVSBmsZWLMs6iosdYZ5nnybthRsEKS7vnHoZqYA
MTX8MPlLi7KK7JDriKJG2NRiAv3ySg9N12jTjFeLzfSdl71jeeVkcrh7q9CgVyelbwZb29ldjVDWU1jT59KEg3a7lFPN/uLsEmbllvLugSuwLIipht5lQVU/v2BHmpsZ7esF1Fbl+JdhtJlUyt6qLwQH5BpfVFKToe+w2E24fH4+SSu0XFCWxohdnDoNUkMloADJmjYSTomCxq0Jzf4kRIeVkAG5DhuyCkc9pMQDfyS7G7JW7Me75LNXHo3GuyKStFSRyrqYI/3xGjoCAVGGcAe7InyNC/D3OSCvuTE2AIzJEUqr2bHM7Xv+2ELe+/QNSln6Nd7O17fdBmnc+tDaHyskAgMReYdRiAmQn7v+uG4ofn0zHmnvG4dXfj8TiaUPw6i0jsOaecciYTVc4SQNbVIJ2h4IUHNI+C6RosivUywid867CCkXH4xbE68hDiYAHw8DvTgYgXxabAfDe9yWoaWzx6ltBI4RAKKttUixq0hmU1jThre1FuHdiAmxmOptxR/5voulISjcFZ3Y4/HI+Hmo2Yn5aoqY2Tmcxc2QfVTuqmjgatNXwUSHuDRSl+WUzR/bB3pIqQelXpZDzvodCEYVw38QETE/pi3smJIi+754JCbh2ZB/sXJjmXthvGaFK7STQGA1AVb34xKtEleFMXZPfOl1qUaRP41zJVciQQiuFh/MVOQICYgsm+feS6UOxZHqSqNQqSd+Tuytb09imuYy2kluudFeNOB0zR/XB3RP6Y2ZKX4wfEIOpw51YkD5I0TH5IM5zxtZ8arlrgP53rc85dS7tUuN6GbkIn7P8G+vkqV/TkY8Sg7wrw14bJic7sXNhGhZPG0L12b/99zBey8pHc5sLD6cnoleE9649sc+6EgyADQdK8TplAESsFpOB8t3a9CSH7OfIFGTslG7eRoPbltUyCJqe5FD1eU0cDRov+eGrEhXvZBDSkxx+ycMlcoRPThuK+yaKOw5hlmC8PicFT0x1/94npibhvokJPp6y0eB2Rsj7PAt7Sl88N5NfglVLDADCLOquN+AemPNW7xeNsitR9+gZbu2UTpdSkCg33yLPlqcl8neTk514fU6K4kgJFxpJvAsVml0K9r0RMiK48qJRoSafY0WGmrze05mKV4olVkOC/WKMzk8biEiNjA6ywNLKuWYXlGPdvhPIPVlDFcWsqG/x5D13JlGhwqkFcvpeGDr+xydEoaMMuQa5P3E3kvSdj2jgWxuCjAbcmZpAFeitanD30npobU6HupIBC9IH4bVZI7EgfRCsJnlj/sHf9RfdMdaK0pomBJuMvPM4m1DKXQ/a9xHImkOeozX3jMP8KwdKfq6msQ2LvjgYcBvHxQBpgx2yzlUMtWlTgEY1GoBwwSFbImzZN8oaFLEVitQaYORY/7hpBK8iyhNTkzCibzSeWs+p9g8xIX1IT6QOjEW0za3lzv7MI1cPxge7ilFS2YA4eyhuHx/P20QG8H9xpjPSillj+inoOCuMWLGjnEgi+15uPKi8yMof8DXaIvDlWJJne+pwJzIwilfVQql8YWcbTp0Bu5srTRM0QLz5oViTpRrOrmhn5i4r/b7qxjZNurayaXcx2F1YgdZ27a4CA1DJVAJAxrYC2ccn970zETO2xg2IoVZTEyvq15EPuwB3sCMCjggrTtdqM8aNBmDZzSOxZBO/pLIQf5+RjKWbjiiea0ivCjLPic2bYpyubcKyrKOefiFyz2VCYk8M7xulSk2NljO1TXjhhmGi33XfxP5UTTDlZtSw1xwSMC6raaT6bGf1WzlT1+Q517EJdny+74RiW/PvM5JVBz003SsTW/TXK2xuxzUw5PTtEDNWxg2I8ZwnKZIiF9NoBMxB3he2pqNJD3lwuIW75mAj7p7Qn/p3nZNgpVNoomVBeiLmpyVig4bNBKWKHSvPystpJfeys40DLkKLPI3e9dThvfEGT68MR4fO/qIvD8kqCO1q1yZQCDnhQveGK2NIxjHNljXbeVa6WHc2SuW
n+fB3wWJUiAk1jfILKqUor2tGWzsDg8GdY98ZVDW0Cs6PQUaDpJFEhCzkqEsJPfs6bngVzkJNnnx9tY9KxuwURNvM1E6GAcBDVw3ENclOGI0GxXPN+7tK8P6uEp9+MituS/GRQxWDXIeVMtWv2MHCIKMBcy+Lw6rv/asAmF1QgX/cMgJv3JbiIzhDpJ8nJTk07RlkALB8Dr/6pNwaGykWTxuC2HALYsMs+MvH+3G6Tt3x2fYDWduUOIT3TUzA1OG9VZ0LoLGjAfC3WAfoFUHsNrPXTXR0ROeb21ye5llSF+2qwT0wvG801uw57hVtJ8YKAFz+4lZvQybCgtlj+6G2sRXv8GzzCxmZy+eMQrTNoniy16qAkT3pZOaWYummI9SfpY22cSMpBLvNTPc9ISa8cOMwz8CV6rURCP6cNhADeoYJ3jsavWti7Ak52jRqSgSh/iLdCaHrCLgLa8lrVfUtWLpJeAeVtiaAzFeBloHVArWNlAhiuz9aMTc1AcuyjmrqyJEC+q6A2C7k5GSnqJEkdwdDbIdV3w0RUTgTaCgpB3cOfAKmDnfKCqAyAJZ9U4CPfzqBp69LUj3XcGW3Jyc78cOxCllGPwN5zjnfznLf6FD6Ayjks30nkJ7UUzSYTc5Lq2DRHePjBI1se5h2LR2MBsAZGYKpw922W7PEbrLYbxOyH0iK9/w1+6jsrRibGUtnJGPqcG3mEk0dDbHoIo1BbQDwt+uGIibcbbgXl9djzZ7jXhF/Inkmxjc//4Zvfv4NjggLFqQnIj7Whp7hVoyOi8aKbwt4t9fKapuptt0IQp1myWQvNhgIGVvzNStgXDxtiMfJoDUYokJMWH5rCsAAt74j3RiHL5IC0Effl89JQWqiO185M7cU81b717Ch4cMfjuO5mcmChppUHQnXYOVztOWmQen52b4BC9pou9wmS9x7MznZibTBvfCf74vxzy2/nBfy1WrT7NQULJKFjWEYnK5tFiy8d0RaMT9tIC52hGnqyHUlzQSpeVDKSKJFaI4vrfGW+e6uOxw0wSFrsBEf/fFSRf14XAzw1vYijOoXrWjnme0g7FyYJtnVXghuoAsA1h/wbzoy386ylka3GEs2HPbs3gqt10LBIiWNYDccPIVxA2J4HXctFeHcdbD7cO8J8RS2MEsQXrpxOACDjxQwIJ76DUA0xZvgr7lDM0dDLMISGWKmMqgZAPPX7sfrc0bBEmzkbbhWVtOENyl1lYnz8PqcUahpbMHEl7ZprkzCXejKOiZ77oPNNc4zc0tlOTZiGOCO6qUnOagNBgOAF24chtSBsWh3MbLy09kTJQAs2ZAn+ZkYmxljWI1rpM7TaHDvNiz7Rn7Othwq61tEu3PTGnHZBb8JGg+0i1GMzYxnZybrEUkOcpxnuU2WuPemM/XOlUbh2L9BSTqNUlEG9sIGQLS2ZvG0JOwpqkRzmwv/uGkEYADO1DXjqXWHUN8JXW61RM4upJiRRAPN3PlOdjHeyS7utjscNMGhstpm/FxaiwirssJswG3gf/fYldSp3OzvZzsItF3thY7FLhDXQnGRj+tH9kbf6FCMHxCDcf29n9+eMh0NpSmOZbXNyNhagIfSE0Xfx+fQu1wMVTCVTWV9q6BtICeFHwDGJURjd1GV4N8ZSKewhVtNuCbZiSCjAW8Y6dOLgXPrQquLwYL0QT7ZPv6eKzRxNKRy2OW2cJ+/Zj8irMGimutymLd6f8Ai5+R7uN4z2zif1OEQaPmdpTVN+GBXMdWDH24Nwi2jL0JkyLmidjlbjmSifPyLQ9TdSSvqW3DFy9uo0loAtwM3Jj4GUaElopEImyUIwUaDaqlRvlz3dheDckpNdXa3Ve6gpSk0tttM2PXEVYICAt0VJdF2miZLBgC9IixwMQzW55zsSMVqDuhcQYgKNeG564f5pIFFdwQraLfJlabTKN0R4S5sQrU100c4eVPcZo256IJwMoDA7ULKcQqFOtpf6NA+z2pS7siau7ekyrN2yp2
j2Dvhancl/SkeYjQAX3YEbjK2FfikadMEGtkwDHBTSl9kHTlNLRJBeJXT2FMIrkPf7mLgiLBQ9fniwmcbBBkNmD7CSRX0Nhgg6mQQpHZn2c+LnN1RvnWBne0Ta7MABqD8bLOnPEHruUy1o0GzTSm3hbuLcSuqaEVX2F1nRzHCrSa/RExpGxnWNbV7ol5RISbMTU3A/LSBWHFbCh7/gq5omYGvMyUFWfjuok1roSgyZxigVuWzQib997KLcGdqgupOnqWcBZ5GTem5mcN0J4MHNRLIM0f2wbvZxbzXnAHQ1ObCrW+fi3IZDeJzhSXYgOY27WeT6oZWGI3wpFGwF47/5ZbxbpMD7nMlBi6NYIHQ4iw3/eN3g2Jx3xUDfRYkvsVPyHkrq2nSbEdXCnK/F6Qnol+MTXaKCnHoFk8bgqWbjlBHEf2BHIOSGznvLmlUgRTSOFPXhBkj+8haO7mfB9Sfsz9/M1/WxgMf7lOsVgUAEwbF4sWbhnvmih1Hy6mblLKfZ9od3CCjAbPH9pM95wgJ4bS7GGw4QNdYV0uBCvb4p9kdFVoXTtc2Y1lWPu6dmIANB0r9Xuul2tGg2aasqG9BuDUYdU3aNrg63yAPrZxOsdcOd2LbL2dQL9KIhhBnl1+UVd3o1tZ+c3sh7pnQH9bgIAD+2X4lC986ygK6yrPNkhO30uaPfCzddARv7yzC9BFOxRMogYH3hChXTUnHzf8OK++Snp7kwJgEu881J4Wg3GdLKqLkDycD8E2jYDN1uBNvGPmNGKIrL0ewgG8RlpsGkNwnSvBv7MWv3cXg8he3arYzrZRomwkzR/bB2IQYuBhGtpMBwDNGr0l2Uhk2/lKEkmtQSikGXoj8f3vvHh5Vda+PvzPJzCQZkkkmUWYAIYEEJQx3RTBIS0wqgkK1tlXU03qhtpJ+NacXxUKljfVy2vMTW1CrCJ5TBbT1AgpymgBViSDKPQQLhAREMmAuJGFyJTO/PyZr2LNnX9bae+1JIPM+z3lO1cmePXuv9Vmf6/tGk6qavA8SZD+8dg827K+l/l7y91rvWVzV1Jq1l4IcUYtWtiohiOgqWZM3jx2EbUe/obp3sp6b2jqZKriZGXaNdxsZ4PeWBhjL/lc7FwBIVmSMqITqDjRoMyz9PcgQ4vDpFqrP3TzWTWW0iLG5Z2omVmyr1mRgWzu78bxGnRMWBBDsfXTarWj0dSoOj9KyWfEEywyQGqRYjXgMg/YXbNxfi/9hHNQkMJuAScPSYI03hz3zDLsNv/j7PmgNpo2gaFVzBv3+gGTA3dQa7CF+pGAkM8OWEKz0h8u2Ho1ooZBCXxHkbPB1hVVwWUASAYW5rjDGs5vHDpLdt0YyQrEGhQT9SZcnGlTVUnM5pZVepiBDKD6q5Z7FbXubKmrRfp4PeUXeiHSUKyREWdmqCOTmmeLMJiyZM5raBv3zoBevfVrDVMHVU/UR/60R+8ncM7si91jlhITloNX+GlEJ1d2r0V/5/vXgn5WnVT/jSIhH+dE6aqP1xC25sMabVRXa+wq+Oz5IGye+T6HxdDkSo3pPAP9DSWyQSBZn7vjBIZaqGCKxqaIWD63erbns7A8Au44H+2KFz9xsNukihLg3LwuAMftL6vDauL8WC2RYQgI9/7fqU7rA+MOK2pCivRiEflVNfVcIQnzxfNlhrNv7dcS1+6JzS9sTXjRjBNbMn4Jtj+YDAPKe2Yw7X9mBh9fuxZ2v7EDeM5uxqSKy2kZaFcQHPHGApP6GBcQhZUV/O6dJBdnlMO53L549CjurG7Bu79coP1qHJesPMp0fc8a5I1oPpe7Z7UjAg9OD6t9CuBwJIYearDutlL1iKAUZWqE2zzTT48btE4dQXesfu08qZup/935lhJ0jQTqL7TbhgoPf7Q+g/Egd/vR/X2LroTMMV6HD/OuVz5a2rm6UVnqpr6fH/opJBvRCd0WjNxR1TYBkbxnv7wgAuPe6YVi3r1Y2+24UmhgqQD+ZnhWK3md63Pj
J9KxgWdPgG05NslAPg4tR2EOhptRKxMqG1RchdcCL2yomDUvDruONsSpHD0jJVy+kDK1W46tG0epKsaH9vF/zfgCkGbDk5jOEoHUu5OipCYQioqvKq1WdcvI7hX3PwmtfjM4tec/FhVeGssRSWVZvcwd++vpuvCTInOptYaNF0CEbTK06nG639ktdHnEFua6lg4vmitNuwfcnDYmY12HF+n21+PXMUapzTuQ8+PXMUZrFSXtbrwqgaxPOy06nmtVQ6pCRq+BqqRoFEGTMK630aprBoYHZBCy7c0JIs+PlT6olb45UsGlbmnjY37JKL5eWS92Bhh7VQa24b1omFs7KDdt4x77x4S9bjnDbTMJNce3wdOrFabfFwdfRHVV1YaHB2lRRq3u+gAYPTs/ChKFpzOVpsaqoUiuR2hB1APqCHaNBDnhhYEG0YYS9qOJDoL/SUhLwarmRMrRajK84EyflDEwalob/fGsvPtivLWNNWr0Iuv0BLFl/kPrvHYnxaG47z0xPLV5jcWYTHi7IQVF+NnZWN6D86DdhjGos1y7MdTElCpx2CxbNysWTGyuZaTonZ6ZhZ406s4sSxO+52x/AY+8cUPybx945EAocWDV39CAvO4M60Jg7Xr7N61KHeGZIa2sxQbrdit/dMho/X6ufnU5uLcgN+cr9exp76Q8EKzBOuxUlGw5xSZzSnvv35WWGEotq65BnF4NUUkluVjKtRzFeKpB4/D1jAgyCZXdODIn1Kflu5N8L9USUwKMI8Gp5Da7Jcur2RbjQ3Mz0uKmZhHjg1W01eHpjZVhLRHHhSNw/LUvT9UwIZiTfeOBaPH/H+FDJXFgloC3D+jq68eD0LENLtmIQg6VHeIsFJgSDm8Jcl+RzSetpv1Bqi6JljJB79i5HAl66eyKeuW2M5HcZBVJKdaWoc4eXzPWgtNKLac9uCbVdPFd2JGLgTY7VQ2+bxcUKHi03TrtFMotLUz4X229hiwKB0PY0tXVi8lNlmoMMILzVC0CPiBf9UGfhqIEA6PaBUnsBAfl9OQOTqe9BfG0ATG0+Db4uNLZ2atICqDjVzPw3A2xxYf8sfs87qupVHYyzrV3Y0dNmQrtueaxvFoeMiLn1d8SZTVg8O1fT+Wjq+b+SuR784cND3M5YHmuB9hoZyTbcOnEInrrVA0D/mUkTvJoAfFjhxaRhaaE2M7n2TSCYbHHalds31f47AUkqdfsD2F5VH/ruwlwXtj2ajzXzp4T8vc8eL8CPpg6TvI7eIEPuKaUlWfDS3cEgg8V3I3oiBOLfR54tSdTqXatL1h+UfV+04CbYV5jrwsryGua/u8njwocV9H1nBH/9uBrjhqSGyk2bKmqx4hPtQ7xL5ozGlOHpIcd3Z3VDmONbmOtCcoIFn1bV4bXyGln+d+KEf/SrGdh1vBEfVtQyK49qwUsfHcXGA0lRGb4U08FKVSVKK72KbVFSA5POHnYYsTKl2hC1VIbCyN8+y+NCSqJFkSrvwelZMJvBzK9OvqM/0lIS8Cj53jp+sCzNoVr5PCUhHvfmZSEzw67ayibXWqMFQoeB1QHJy85AQe5A6n1Am13X8i6E9iEj2YZHCnKwcls1VTsoLUW3GFrY584JmPzSkiz4wdVXoOO8P8Qlv/1YHdV1th+rQ15OBvWz4rG+J2c5qRiGWAdIL2VsqqhFyQZtLZnk7KLRgGIBj7XAuu5metxYPm8iHn1nvy6SnvMUziexBVOeLgtLIEhV7YlPoJRoMAF4cq4HJRsOyWbqhV0TasQM3f4Alm05gp++vgtNjJoeajCbgD//cAL+8GF4i11QUiATRfk5oXOFtYpP9EQAKP6+wlyXJlV0IbzNHbqrsNwCDS1lGqfdgrunDNMUaADAr97ej+QeZc/H3j6gKXJzpdiwZM5oAMC0Z7dIOr4pidYIJUU5kI2163hj6MVEI9D46DDdocgTJRsO4S9bjoZ0OGh7TeW4nYXsMGJDpMQZLf4uwiykVwV+gC0e5zo
iDfGrPQF1apIFnef9EU7OAFscOs/78fi7FZqzCf2RlpJAK7OOEAUKWVxSJZPruW1qO4+lZUfw4t0TFZ89r1kSAqHDUFPnY/rbBl8nfjz+QtBPm+BQC2j0lN+F/fC0DHJaKLoJ9DCCNbZ2hbHuuR0JGH9FKuVfB+2e2rOSY9wRg6bSS8vSIx447q+QO3PU8B9Th+Emjzv0DtZRUrOrgXYt0IB13ZGAK5pMoOLgQdy+SZOwEfoEZrNJUZfqiVuCcxVK2kI/mZ6FN784aVhblD8ApCfbJPWRxHtSS2Vr4TsH0Chx78Jn60i0cvl9eitv3BTCtLBhPDnXg6bWTs3f6evoxj0rd+KelTuZFSYBoLhgJMofuwEAJJlCiOP7XNlhZqeVvBgtTAcXE4gOx6QnSyNafaQYlmhLhKztQ8LvysvJwG9vZmdmEUMqyBDibGuXZCb1XEc3Vn16HA0+7WuboC8y9xgNorqqBUKWECUU5rqQICOQSNNaBPClbzWbgPFXpGJ7VT3e3X0Sr31aw/T3JRsOIe+ZLSjtGd67ibKnVi0bKrTremxYo8peIO/tnqmZmu3lvT3tuzxsrbepnToBRoJRpWdFHKKbPK5Qm6sUNlXUhrVa3vnKDkx7doukHSRMYUnWOIkrBfHyx9X9tgWTQE9L8U0edxg7YMYA9ZZZNaixL7GABKU3eVyhSrjSd8mxokUbQhvbed6vOguVbrfio1/NUG1ndzkSsHzeBCQnWGSTz4St768fVxs6ewEA3uZ2Kjp7LZUtqSADCH+2epOtBHorb9wqGgApyU3AonUVqn22D07Pwo0eN6Y9u4XnLVAh3W7F3PGDQoO6Rsw1kBcTDU7vvoCzrV0RLCxSoHXO9LYPpfWCBocRuBiZe/SCRXVVCJYZILUZCJqKEs8g0B8A8p7drGk+gcDb3B7ag2qD2CwZVXKoL1mv/eBSsnvC90YoulntZWqSBUX5ObjSlYwl6w/qFi0j32syKesFpCVZMGX4hfUhN2xKfszK8hqslKjYAvJZ99qmdlnbWpjrQkrCQcXWsf7agkmgJSEgtT82VdQyETTIgYZ9iaaqJdUWJF6vYhbHaMxw0oLY2Mff2a/q8Nf7OsO6RADprolGXydKNkSnjZoGv3//YFhAIEf0wpu9lTzbhnP6xRtdKTbdlTeugUawJHco7LAUL/x0uxUlcz2YNdaN8iN1UV0QN3lc+Ky6HvW+zpDBd9qtXDLPBFIGSu7w6U3KOaO+W+1QY3HO9LQPXQqVgP7aX621UqA2AyQ08jwGd3kHgXqCDCF+8dY+7F/iUmRsA+gzqt3+AByJVtw2cRBe+NcxLvcohNjxuhDY0AcMJoV/Sk6Ix+0Th8Bui2Ni0ALURcmevm2MJIEFcYBWfFKFzV9+E3GdWhE7145j9XhUpf2XMFwBCKNs1RswX+rQchaQWTwyqynXhkOLtKR4/PYWD1wp6vTlNIKPckEpOdPvz8uMmHXsKwKaYmykrBxKvUdhS/WmilosWK39HRkBcdVBjvHPqIS0027V3Ya8ZM5o3UkKboGG3MInBvbe64ZhSFoSnHYr0uxWbNx/Co+/W8Hr6xVhQjDjJVUK5x1kANIHuBwlplA/YcuXp7Fim7H6F2QRGxXgqB1qWpwzLVlUrU5gX6o69df+ai2OQXFBTmi4Ts4WCY08j8FdHrMkRsDX2Y2/bD6CRwpHSiY4aDKqBFJOD08UF4yMmO8CgvbSbo3HPSt3Ul2nsbULy7YcxdKywxHvvaX9PFZ9WoObx2prx7svLxMbD3jD7JASBTXJRv+z0ovNX34je90AgsEDbaXobGsXHl67B7uON8aUwRnAehaQJByZF3SlJKD9fLeuc+HH12Xh1gmDVT9HY7sKc12KlQkTgs7747PD/RAWsbew66lU9eQgN+MoBi2Rg9J71DsTGS0odWrIVkN1wOVIxOLZuVR6TGKkJlnwzG1juNDscwk0aEpy/7P9eK9l7wMAOs77Df8etQNcaqCZ/PP
G/bV4RQdrFss9zvK4QgPNRuDDnp5gqcxNo6+TuZqy6L0DSLSYw56rWmmZZkAuNckCW7w5LCPociTgjmuuUGSUihZe/rgaE4am9Ts9DVbHwARg7edfoSg/h1o07aNfzdDdWiTMQvW1A27Ftmr8/IYcVcY2JWgdoKVF8L2dQFF+tuR/X73zBNP1VpUr6wdppR8uzHXhN7NzqZ4ha2AWbBmhr2Rp/Q39sQWTgOYscNqtuGWcG699Gumn8Ohzz8ywq36G1nYl2yzMei3d/gDe23tK072rBRliViPCqvSzb2fjW3/cqvjcHYkWqvna1ERpunIguOcef/cAt4qwGM4kCxo4znIoVRmF9rqs0qvLTzObgLpzHfA2tVF9fuFNV/UQBAQwdXgGpghmk/SCS6BBKxjTm9BCf6gGYqAWzR4FlyOR6gCXcpD/r6IWRWv2cL8/ILhJ/jJvIurOdYS+b2d1A9MCDmpGmKgNrliBmGyc0kqvJgpkX0d3WI8yTWlZTewPCLY9SDlhQNBxjYYiuVrQ1R/7qycNS2MKRoWGGz3/W+2zu443cmktUstC8W7NpMW5jvOhg0yOsU0pWNfSz21CMPvJ+t6eK/038rIvC/v+TRW1zGyEWghBlMDKDGR0YKYFPNmNLlbQnAUlcz2aqW9pQBPo0Qo+0tIuC6tYO6sbDLNDT313DNLsVkk7oiTmHECQwIEmqXd9jrTTa/SeKy4YiZ99e4RiwKQVZ1raZW3w1BHpmDoiHSmJVjxXdljT9f0B4OcMfmVzexd+deNVmr5LDVwCjf5YliVL/g+3eqgzzlIOsl6OYzWMH5qKvOyMsH83OcuJJGscdfBF6H9ZNzQZYmT5LsX7WH8Qfj8k+zCleh/lnEBx5UnKCSMHk9FQcsr6a3/1ruONmhITLHboTEs75o4frLu1CAjPQnmb2tDg64RzgA2ulGB75OSnyrjt8bSkeDS20tFSKj0PtWCdtZ+b2MP512fh5Y+DlVnaV7hsaxWWba0K0YnnXzVQlYVGjFTKzCgtxDSZaomNvjZoC/BlN7rYoXYW8NbHIGAJ9GjtF20bkzC4McpHMwEo2VCJbY/mhyUptlfV40xLO2rqlHVxci5PphqCfn+/F7PH1kZ0NRi151KTLKEA6sOK2lCXA8/W6po6X4SkgtiuZGZop/tmxWuf1mDMYIchHRRcAo3+WJZNTbLgaYb+NbnI22h6tS1ffoNNFbURg0ezPC78Y7c6J/jtE4eE/lZJe0AJvKpJ3uYOLFon3Ycp1/tIhBa3V9WDpSRIDqbH363olYy0EP0tkNf6e1nskFC8SmtrkRByVYON+0+p7pfUJAuaWuX1H0wm4MfXZeI7uS5MGpaGCSX/hK9DfU/JPQ+aPnDWVlNhcDZhaJqmPmOhjg4LTKDPjNKC/B5AOsEiTmz0xUFb1oD5UofSXueljyGEWqAnzmbTUueu3nlC0WZIBTdG+WjiZBhL6yAJUhbPHoUFq9Uz7795twL5Vw2EtYeW3Ig9ZwIwe6wbszyuCPaq1KSgZpvQnmtJopK2bSl7JbYr0fStfR3dkoPqPMAl0OBNzdUbYB14kuMwlkJvZrvkBo+eum0s3t79teI9mU3AU7eNCf0zMdTLthzBqvIa7q0KNFBy+mmM3tu7v6Y6fAnTzsKZV+Lx9yrQ1d17K7u/BfJaZjSEByvr7IWSGKQebNyv3hJJMmcLFIb1AgHgtfIaXJvlhDXejD9+byweUjmY5RjLaPvA/3T7OMXrExTNyEZedkZYcEbsxI5j9Vjwxm5D7URaT8KnMNeF/9muX7umaMaIUBsXEBRxpUls9JVkwOLZo5CRbNMcMF9qkGpNkdrrRthYpUBP6mxypdhUkw5AuO9B2/ZptI9WWulFU1snU9cDOa/T7DY8UjBStUWo3teJKU+X4albxzAxB7IggOAclNQsVFPPcy8uGInMjCTU1LViqca2JrlnJLYrk7OccKUkcNPDoIER7dpcBPt4iTr1JrSwKjz+7gF
0UmT+ejPbJe5fJ7DGm/HA9VmKfzv/+qxQ9oAgzmzCwwUjsWtxIdbMn4L/mDqM9y3rxpmWdllhIrEQICnzrtv7NbZX1aPbHwgTzfrV2wcMDTLMJvk9Q0TM+lt/NYvIpfhgVRNNE35WK6TWjBibKmrx0Ordqi1gZ1u7kGa3Yvm8CVC7pd+8W4F3d59Emt2G+Sp7t62rW5JlhrYPHCYovgOyNosLR4YJmhHEmU3Iy87AM98bE5zdUP5pmjA5Mw1fLCrETE+Qne3JuR7N17rwe64M/R7aZ7WzukGToxrH+aG4HQn4cV5WmEBqfwaL+CFPYd3URAveeOBabHs0XzbIkDqbTjd34GxPkKF2HyYEg+yBKeFVEJcjQTIjrUVQmQUry2vw2DvK9MxyONPSTt0i1ODrCp3f0U7Akd+29vMTuMnjxtrPTzD/XrMJePiGHMUqt9CulFZ60X6e/3wxzXfzBDd6276oFWE0GnxdmPL0ZjylMqfBO/J22i1YfPNouFIS8M+DtVj16XHVvxHfw6YK6agdCL6z+ddnYeEsecMkzAL/73b1748mzjS3Y/nWKtVMpN8fQMmGQ5pnZtKSLEyVLSHIQXL/tCxJtrH+3F/NwimeZrfgybnh+492NkcLaIgISNWAFiTbqjavU+/rRPFb+0LfOf/6LKzZ+ZUkhWRTa5dkGZzWFtWd64jKsLwePHzDyLDvnzXWjQdPZuGvHyuz99H+HhatlZvHDqLOGJMzkXf+4o5rhvY7WyGHjftrJSk9aXQMtII8+We+NyZiLpKApqLoSLLAbDKpVu8bW7vwxgPXwmwyUbV9XmgHNoahSWsbuJaAgYY50AgQR/xv22s02TN/ADjvp2tL/dv2amysOM38HTxQfvQbrhVRLhUNgpkeN7Y9mo8186fg+TvG440HrsX/y8/h+RXcwMscN/g6wzLkUuAVeZPM4FO3jsGtE4JZq++MpnOahP2fchkVgj//cIJikCEEz0wQD5gA/GHjl4rtGsRYPLR6T8QzoDWWKQnx+M2sUZrv0+VIwE+mZ8kGe3KZqf4Ccii6HOF7JzXJggG2C/mRBl8XSjYcith/Ylu0Zv4U2QwjLWirZKwVzMuTE5iTEd6mdqz4pBpxMhacHLy/e78yrOLCoh8i9w5Y16bwXRTNkKayZUVqkgVTJFpgFs7KxQvzJsBpt4T9+3S7FfflZaK4YCQGptD9HpZnRVPVv+GqywAYl3iL5uBoX8bG/adQtEae6QiI3BfABZuTmmiJ/EMJiD+XZrfgvrxMOBKtklVOgK6ieLa1C3dccwXVPdSd68DUEenUVayZHjcW3zya6trRAKnYs/gRYuZAIPqdNMcblIfclUF3t70VZABBgg656p8WcFUGBy5kujdV1OKXf98nu6lcKTa0n/crOnZGVkN4X1apr41Xf6RURpb22r94ay+WzBmtKvYDAL99vwKHvM2AKWhMnUlWnG3rCjHpCCNdoxQttSJa39/cfh6L1tEJTjrtFjw5N5wCsNHXgQWr98je7+LZo/ptkEH6qjvO+4OzAj184KQnloZxDOA7e0E728Dar08OWtZSNbmPpjZ5Biop1jIaTQHhDAvvYfnJWU68vfukblv4jIQiN8GssYNwY8+AdlmlF+/u/Rr1vs4QtbYrxYbighxkZtgVfw8NzbLZFPwcIF+9cTsSsHj2KJRsOKT9B1Ogv81ySSHYsqg8v6SmY5Bss+CuVz9T/a7ld02E2WRCaaUX7+09hQZfZ4jMQE7QkZ5Zim53ZNjpBsiFcKX0nXUiFKVlrSgpMQcajWFO7UH91BHpXGyg0ZA7V7WAe6ABqHMbExXf0kpvaGFJlbKX3TkRR8609AnxNCWo0ZCq8XgHEMle4Eqx4Y5rrkBwBESeLYnW0T/d3IGfvb4bjxTkqG7IBl8Xlv+rSva/ExrKgp5hJSPbI/oy2rvUS6Dpdiu2L7whbNal2x+QHTIFCBvHIdzo6X/K4HKtSYtnj5LtiZVjHOMJ2n7918q
r0dhKP5BMMnJ+f4A7RSuB0Lmh0RQQthDJ8byrCWbKgUeLyvzrs1QPvjizCU1tweBCvGZON3dgadkRvHj3RMVAlIZm2R8Ifo5cRy4wM3pOrz/OcomhpWVRClNGpKsm79yOBEwZno7SSi9WSawxOSeNNhj82w66dmS/huHSyVlOw2wNK9bvq8WvZ45CnNmEwlwXHinIwcufHGNi1eMpckcDtyMB90zNxIpt1UzBAkniTBmebih9PiHoaPQFWTq1tsnxPFe5BxpqDEsmXFDxpeulduNKV7Khyo+8oJStkPuthO2KBBkDbHH49sjL8cXxRizdfDT0OSW2JHLtJesrZdkJyKJZxWETCmkohZmb/KsGYsrTZX3+PUUDZEv+4VZPxEA9y5Bpf9LPUKJd1ZOl5AHaTCRL1jo1yYI9JxoND9CPnD6H7VX1oWCAdoZFLuibM86N9ftqJYPBNLtNNfiY6XFj+bwJmg/BV7dVY8IVqZg1dpDsZ1gqUHIHKMuMhhBSlTSjWalu8gQdrf7MNKWlZVEKNMHwnHFudPsDePxd6QFouTVG24FwjsLRBoKCbM98j55mn+DyFBv3QMNui6MKEIQgNruprZOJFleOOTAocidNHcsLi2ePgjXerKmTgyRxiA0sWrOHa9cOIegg662jO4DiN/dqvh6vc5V7oMHqRNGU5i84sZujpmmgpQ1ILVshFXmLF9m5jm58cCCyL06tjEVT8g2Av3qu8L4cidY+H2REq71LSWdFqwNzKUPNMaSF1memlqE3oi3lbGuX6uAyDyzbehTLth4NSwqo6cvIBX21Te2S91wrEQzKtY9sqqhFyYZDYbaChV7cHwAeWr0HL/Uc2FLgEcyzzGgIIbWWaup8VNfSipXlNVip0LLTH6ClZVEOMz1u/GS6PLHAXz+uxhufSRMxEEitMd6txmfbpEkf5LCpohZPrDuI0y0dOr85EvFmE+zWOPgYdSXkqkJSoCGiKMrPwZqdXxlGCZvW067G0skhtS/T7DbuowHi58KrTU6vL8I90NDiRNH0UlvjzXjqVo+hcvNCsH6HmuESHj4ZA2zYIBFMqN2PWhauzkdnPFITLWhqU+bq1nJfv77xSg5XDLI5AWxaJbRwORKweHYuSjZUGtojaYs3ozDXFfbvyBo4cvoc1TX6U881r9aSDLstpEpL29JDwyQ1OcsJp93a6+KNYqQmxuNs23kqp4UkBX4yPSuiIiGsmPLS/altasdPX9+NF+ZNxKyxF6okUjacBBnfHpmBfx2uo7q+ki3kEcyT7LPSuhTbfam1xMJkpxc8+6ovNrDYSzWGrm5/AOv3KZ/RSkGGEOI1JuegOu0WzYk6mvYWtZZ2vVCaF1PCe3tPUd8TDXNgnNmEJXNymX7r8IwkHFNRMScQvk9xojxjgA0IBD/T4OuUnGslKJOgH9eKNJnEJq/5YL2+CPdAQ2sWiBYOCaNtt8bBEm+OmjEXw4Sg4fpg/ylJ54ZFLVMJalk42md6b14WlpYd5pbdJ/fFywl7+rYxaO3oxn/+fR+X6wHBNfLyf1yNKcODWVuzGYozM3qdA29zR9h7YlVMFZeGL3XozZgQWshf/H1fWCbLlZKAOycPRWZGkuzepFF+jjOb8N3xg0IDxX0GJhMelAgcpEB+o1SWVlyZ5NnKVbRmN5ZhAm70uFUDmF0nGqmvy8MWKn0uzmzCnHFuxaqTcJhVbi1F81yKxrxSX8XkLCe1UrMaQxfPmRqpNSbVyeFtbtfU5kJTnetN0WAl2K1xVH6DUEiTZk2zUvmyVHguT07QPKMGBN/Fsi1HNM+SpCTE4d68rB5ms2CSnvg1YtDM5DkYVea1gHugwcpqQgulaNzX2Y0fXz0E59q78Y/dJ7XctmbY4s2wxJnCVC2F2VAjsghyThntsy/Kz8aVrgHce8OdA2y6o+figuDszqufHON2XwBgiTeHbUa1PvXCXBd2VNXjZ2/sQnO7tkwNeU8sa6C/6mewJB7kgsOgQxd+qHi
b22X3Jk271uPvHkD+VQNh7alQ9bVAo6m1Cy9/XI3l8yYizW5F+dFvsGyrPJGDHMIqkzOv4nqPpNWpuMCnam9a2tnaLvTawknD0mQrYDRZbTLMCsBwR+4mjwsfVqhnQfvrjBcAmE10NlPN3vDINqv5OuJOjmAbo3YoJWt6UzRYCdNHXka1pnMGJjOvZdJyP+nJUrSonOG0syXpdisafR2Y9uwWxQq4HDZV1CrO0tLAbrPg/4k0hJSg5uv4/ZDUnOHpixhCb0vLakIbFdJE469RiNYZgY7zfogrqCQ7uHzeBJRsOMT98KEZYlN79iSjsqOqHq99Wo3SQ2d035crJUFX/6nbkYCiHt0Vp92q+36EONvaFXHwqs0H5eVk4L9uH4ufamSHIJkPFgeEh6jcxQhax5C0vQkN5kAKqmwC1sy9UJSzMNel2koTbZAAoWRDJbY9mq+rMkQc1DoD+rcBYGU53+QBANS1dKDbH5Bl45PbuwEEqxHf+uNWWYeBxjkTqugavS4+q2ZzRPvTjBcQdKZp2pmcdotionNTRS0X5qIA2Jy0yVlOuFJs8DZr2391LR1Yt/drSV+qL66FtCQL7p4yjCrQ0NoBY4034/uThlAliGiYuG6bOFiSlp6mZZFX0pkmiSD2rQtzXZK+TmmlFyUbpJnaePoihtDb0rCa0PRFE/TVaFwO5PDXQy0mBZpqEIsqcmmll0tVQ3hfcWYTM9WtVOTsciTquicpSBlbtfmgmR43Xrp7Ih575wB1C4TwedCuXdbS8KUG2iB5pseNGz3hBtMfCOCuFeq894C2maIGXyd++vpuvHT3xDA2mr7ShiDMYPOY6zn49Vnd15CC1h5uJZRsOIQV26o1HYhqLWQd5+kUfKPhxKUkxDOfJf1pxgugfw/XZqXLtjmzUuQqgVTnaVFa6UU75ZoTw2wKZ7wT+1J9bS2YEGyRnjJcmUqYR+uOI5EuaXlvXiaWlh2RteszrrwMb+8+qYnJjnfrmtJap/Wt1QIfnlpeXJXBhVBS5qVV2CXoi9G4GgIA9yADoMuQ0Kgiq6mDs0J4X+T7iwtGUv2tlDLv5CwnUpPoFFppodXYzvS4sWtRId544Frc5HGp/wEuPA/atUtKw/0xyCCgUaKWqoLWnWPLAGqdKXrsnQMozHVJ3mNfwIcVtfD7A3Cl0CnsyuE9lXahvgapc0Orw0gO3d+9X0kthnZ5coLhjtz3Jg2h/qwJ/VNXg/YdfFjhxcNr9+LOV3ZEqB/zTGqeZdDTIeex1nkeMXuReE8Q7Yy+ArstDv6eSqScujeP1p1ufwBrdp5Q/ZwrxYai/By8ePdEuEW2nXTjbf33N4o+nTDhIwbvZLncWqf1rWlkKEo2HJJVuGeFIRUNAqlssRZ+82hF49GiPtUC1jKWUqa+2x/AkvV8out0uxV/uNUjeV9rP1fe4KmJFiy/a6LkIFNppZfbEKVaVoSmhS/ObMKU4en4JcWA+gMCQTGjyREuNZC+2r9tr8HxhlYMcybhnqmZsMabZTM1d1wzVNN3kZki2gPgbGsX/rL5CB4pHBlRhm70dUa0dKlBSZNizjg3Xu7JuNPu0//dfhz/u/04UpMsIVvaV+0ZTwiDA3Ju6DnYicMAE6izrf9XUauqIq4VD07PwrevHMikgdTfZrwA0nqUwNT/Lm554ZnUXPXpcVw7PD3ibBSfN5OGpXGf75Hypa7PScf7+/kxHenBuY5uPLR6Dx48eRYLZ+VSd2GwYmd1A9V6uHPy0LCW8p3VDSit9AYFPxlfjNQa4rmu5JIILL51tLW8DA00pKDlB/Ki6FKDq8dpEQ6P6oUWSkwW8SstWLblCBeOaafdEqF6TUBz0J9t64LZZJItM9LChCBLVGNrF5XasRBGtPC98kk1Jg1Lw0yP2zByhEsVUu9jxbbqkOMt1Ru7tOwwUhWYM+RQdeYcrh6WynT4Pr/5CEYOHIBZYwdFGGDS0lVW6cW7e78Oy34p7elfzxwlGehOGJqmqbW
xqSdAFzP0aQ1geCE1MR4JlnjD+O2F50Yph2HeunMdVO18pZVeyb5tFqQmWWA2mcLOCqfdgifnejBr7CB0+wNUZ6ArxYYlc0b3uxkvIJgMunMy2/ktdsB4J3zESVMp+6aH1lYJxJd6rvTfmDo8A58di8y09zb++nE1xg1Jw6yx6npqAF1SUPi5DyvoqrOZGfbQ/44zmzA5y4n/fGuvpt8kRbHOc13J+TIsvnW0tbyiHmho1dlYPHuUqjqwFjjtFiy+eXSI6/iD/ae4XTvdbsWSOaPx8zV09x2NPv1NFbXcVDOfunVMKMgQGwBaZ0JqPbBkI8lTevq2MQDAlBWhpTZVulc5CA8Y2gH9/g5WkTjggqNgEvxvWodv2dajzPcYgLxYnFCd9vHZucFsWlNbiE89zW6TrZZJZY1metzw+wPMs17kOSTEm/HGA9ei7lxHRACjl/lEC0wmE3578ygs6LHjRgQ6pZVeTM5y4r29+u345ckJmDoiXZWdbtqzW3T/lmduG6PoaNFQ7RYXjERRfna/tiVqtLVSEDpgvJOawuBXzr4ZLXK7bGuVJiY6Fswe40L50XpNgsCL11XgRo9LdV6SZfaANUEjDgS0VkTttrgIinWn3Yq549xw2q1o9HWqJgrmjh+EN784GdHRIaeVQcDiW0e70yLqgYaWH0iUZHmCmOKnbg1/cTwjz3pfJ57aeAjzr8/Eq9siVcCF9+JyJKC48MoQG1f5kTpsP1YHwpN8TaYTu4436qpw8Bx0S02yhATp5LI0NJB63iwOvTiQoMmKAMrtYzxa+IQHDMuAfn+FnmG5AILijsUFOVj7+VdRIY5Q0ymIM5vQ1NaJ//q/f4v2hRXfHT8Ihbku1T28qaJWc6Y8gKCWi9lkwtzxg8P+20yPG8k2C+56lW6AnhcaW7uQZrcxk0XYbXG4PvsybDqoXqVYt/cUbrhqoC5NH3GVUYmdbntVva71NsAWhz99f1zIBsg5WpsqakOVKCk8OD0LDxfkaL6PSwV6zu8zLe3clbvJdXkPA5tNwP/Lz8HSzXyShnqx4YD2CmK9r1O2RYckMMsqvZJMYOKkICuzk1xHgdZMvq+jO4Iqt8HXiVUUrKi3TxyCvJwMuFIS8IvvXIXPqxtCPuC1WU6YzSbUnevA9qp6ybODxbeOdqdFVAONbn8A/kBAkUZM/AP1UoIlJ8Th9klDsG5vbdjhI+fk8VYA9ja1Y8UnNXjg+iy88ol8VpZktTdV1EYwHC3bejTC6DkS4nHftOFMGSy+g25Butimtk7NWRqzCWiUeM4sh0VA1EApNxckdhLU2seUWvhon2FppTf0t2pUuv0dPNZmZoYd2x7Nx89X78LGitOc7kwatU3teK28GhnJNiYhwAZfJ1aW12BleY2imCAvx6RMsAaFqPMZQ2GrhjMt7Zg7fnBoL5CKz8nGNry16ytJPntfRzdVkAEEnZbg4awNclVGuWyr3taCku/KZygJaNYC0fPo7/ZET0WCnDtyiSGtuDw5gfsw8LI7J6Ag14X/3VFjeEUkGpDaRzSVCWFSMP+qgUw2k+yUxT3VZ6NandRASG/+sftkSAeOVGp+eeNV2FRRi1+/vV+1ksMSPAgDajnw7LSIWqBBs2ikdDbUFo5a1qGlvRurysOjSafdIkvdFWc24cm5HkkBEy0gG+Efu9SFBDdV1CryvgvR1H4ez5UdxqpPq/GMQjlNCN7sXRsP1GLDgVOanSF/AFiwejdeNEcyTtEeFqebOyLanISBRU2dD2t2ngjjJmdR/fY2tYX1W7K08K0sr8HkLGfovtRKw/0ZPNZmTZ0PpZVew4MMAjk6SdogQSwm6LRbcOv4wSjIdcEfCHBxTF4tr8E1gjVI0FvkA+R75So+fKD9cGStMup9jq4U9b9n0fPo7/ZFS0VCKnsrTAzJZdNZrsurJTslIR63TxqCI2d8+P0HWy+JIAOI3EcsCWaSFPzb9homW+LqmVkTk3iQeToj54JTEuKx5JbR+Kq
xDUvLDsu2b/9kepbsbKLY72Ft057pceMn04MJcGG3jdkEzBcQ2vBAVAIN2kUjNvI0BlbLImjwdWHB6j14UaLPGgBmjXXjwZNZiv2wLCCtHXIgEbnfz86hfba1K8Txr7YwaA/FyZlp2FnTqPq5v+2gE0k0maDI3CBuQ2E5LMRtTjTaICxsViUbDoVVt9yOBMy/PguvbqtWZZhR4tWOIRw8HN/nyo5wp0SmRS2jEKAUGnxdeLW8Bq+W13ClopRag6zVOb3gXalWwtQR6Xh790kmJyHBYsLPvpWNovwcpr2qNYPO0poQ7cHNix0sFQm5CpYwWVWQ68KkYU5mVjnhdXnYNxOA5vbzVOJzFxPELEpaq7nHG1qpPvcfU4fhJo8bjb4OWfG9Bav3hJx8I9Dcfh4lGw4iAJNi+/Yrn0QGGcL/LrbtLG3apB1TfP1AAHj542pMGJrGLdgwPNBgWTTiKoORhjMAZSdw4axcjBuSyl10T+5e9B74NA4t7aFIE2SwQCnIIL9d3IbCcliQayzbclQyO6AH4ha6YCtctWIrnPi+dhyrR152Bse7uvTAawiTFyWyFhCbQisEqAQtQ5VykMp2C4N5o9mntFSqtX6Py5GAKcPTVdsCxGjvCuC5siPIuTzIKAbQ016zfhcrCUSMIpsdUq2qjb4OlGw4ROWASQ0dL549CrVN7VTzomLa90nD0hTZpUyIZIkT42KhqmaZbTEhch9obTMb5qQjAriphw1SjsSBOPHr9p7Cwzfk4JVPjsHXGdnSqReNrcoCpgHQ+U5i207Tpq1FZkIPDA80WBZNyYZDuNHjjpp+hlq5edbYQbjR4w69sE8O14V66PoaaErnRgy68YJcG0phrgvPlR6mYghaue2Y4b+JbMIP9tfi3uuGUQ15LXhjN575nnx7Gy1l36UMmrLv7LFufLC/b4vJaREC1ALiVF/lGoCt/1afSZBK2pBg/vF3K7jd8+TMNBw5cy6sgqulUq0VxGnR+tuK1uzBMphgNkcy2BG7JD7EC3NdWD5vAorW7KHS0UhVYY8RI0aRrQ1SrarC85xltopkuZfPm6iaEBHTvm/cX6uYsCTf/sxtY7DnRGNEK0tfgCPRgiaF5AdZg4tnj4oI5lKTLMgbkYHtx+ojugOEdoGVklb43QNTbGhqi6S3l7rHyVlOKipYb3MH07B9b/lUUrZdrU37ktPRYKlK9IZ+htr9kRfW7Q/giXUHDboLPqB51rwH3YyAsA1lpseNvOwMqkCjqV05Q8ALZBMOSaPLoJxt65KkywXYdDwudcitTUeiBffmZWJouj0qgYbbkYCbx7qwYhu7WBNwQQjQKLtFHBM1ulMh5JI2RCBxytNlXCq3pBoqnDcRO3NGVKpNJuDh/JwQEx6g7bf5A5Cdz/M2teOnr++OmPEiopG0zqFSG60UYhTZ/CBHFrLjWD0+rarDa+U1ilnekg2VWDw7SNEs9y6EtO9Pb6xU3aMkEAcg2crSF/DCvIn44niDJDW+cA3O9LglgzkA+PRIHd7ecxKtnd24JtOJH12XGXpOWihpyXcHALS0n8eftyj7CAEAP7z6CgDG2KDeem9aEvKXnI4G60MQ62cYnYGXuj+pDPPO6gau7QxGgPZZC9WXP6uuxz8rzxh8Z+wIAFiy/iCSEyw409JhmKiRHjjtViaHUkq8iUXHoz+AVLGWbTmKVeXVONvWhbNtXXiu7Ag1ZbIW3OQZiJked9h+f+WTGk3XcqUkGGq3HEkWPPXdMSjZQEdVLackS2CNN+OpW8eE2n943G+DrwsrewbRtdIwsiAQAJZuPoI3v/gqbCh/1/FG3Dp+sKZh3ojv6Pn/4vaW2qZ2ZpFXYtvEGidyiFFkGwMplkc5kASTHEVzWk9w7Ui0otsfwP9V1KoGGSkJ8fjld65Ess2CX/x9X58LMkLtiCPSkZeTgStdyaprUBzMST3jf1aexvJ/HcUzPfpXWls4SbsZbWvT0s1H8Nr2Gtx7XZaGb4suTAg
mUJQSGOl2KyYNS2O+Nq0NzhhgY762FEwBMT+oBJqbm+FwONDU1ISUlBSmL+j2BzDt2S3Ukeqa+VMiMg5ao101JCfEYe9vb4wonUplmG/yuPr0EJbbkYBtj+aH0WPKlYiNep79DWvmT5Gl91X6G1IhU9oXxMAL3ymBnv3Ym6C9byMHheVQNCMbedkZoX2ybu/XeHjtXubrpNut2PmbghBVNc+2JAITgEcKRlI7tzREEYAxdiEtyYIvFhVG9AdPe3aLIRUf8i0/mZ6F9ftqw36LGilFb0Kuiim245OGpenWUwIufRtCoHYOyrE8KuH5O8Zj7vjBoWuXVnrx3t5T4fT5KQlo6eiSpGu+mGACIhJeLK2+NM+YhQWSJG7uy8vEDVcNjBDHY0FqkgVNrV19LrgjMAFhA+ly95naU/FnIbKgtcGuFBuWzBkte37Q7kfDKxq0Q4dKfabC4ZbSSi/e3fM1c/lZCrdPHELVn1nb1N6ngwzxQJVSOw6gPXsQwwWQLHGc2YQX756Ix94+QFXxIhW7aPdIXiwwalBYDcu2HsWyrUd7hj5zUdeiTWeiZK4njAGkrbMbxW/t43mrCABY9Sldy9T9eZnU2W6hnfU2taFkwyFVJVs1NLZ24S+bD+Pa4RlhjolaK9AjBSND+iI7jtXh+c10Ku7kWpKZ5D5s9EgVc/m8iUizW3uouVt7qLkj7bhYhDGGSEidg64UG+6cPBRD0+1Y9N4BTdeta+lAtz8QomheJdFupdX57Wt4pGBkhP1Q6v8XBiEZA2x4Yl2F6newEHg47VaUzPVg1lg3tlfV63rOXee7+7JJQKI1DhOGpuHFu9MUE0Ck4v/KJ9X4r++Nxayx6vaetltISj5AC6JCb0vKvkolygCACVc4sKOqHlNGpEuye8htaq34zujwKF2vg2NCsBTa3H4+agtYHHGqteM4kiyGZBH78oY1AndcMzTMobRb4nHPqp2qf5dhD5YiY5SV0jByUJhmndY2tWvW0HlwehZu9LjCdFeMIrSgPZzzrxrIdF3hTNqJhlbJnmxWPL/5KAKCQIE4y7StQJOznHjz85O6nbe+bKPIvRWt2a3YKtGf2ypZIHsONnfoXtMlGw5hxbZqLJ6di5IN0U+K0MLBwRfJzKCbQwSi0ylR7+tEyYZKmM1Ax3l2OQAhfJ36/t5otHZ2h6QLPvrVDNVZs3Md5/HQ6t148GQWFs7KVb0+8cuXrK+Uta28GKiiJth3off6CFaV10hmfzdWnMbGitMYYIvHD64egkLBICHvTKczyRLW28bDwQkAMJlNoZdjtAEqLhgZpgyuRlkGGEP/SYRv1Ep8vQWW0iwtxAbYHEe5AXs+Rtv7yKtH8mKBUYFVcUEO1n7+lSGHoNNuwZNzPTCbTRHtcK6UBMNK9I5EC5rblK/7i7/vw5I5bD38ag5DWmI8MpJtOHLGR3U9pRmkbY/mU1HILpmTy3WGpK9CbaDcCOrJSw3RqIp6dSQkooX7pg3H0rLDklVD2mdDmyiJZrsrsR+PFORE4dt6H797vxLJNvoZ1b9+XI1xQ1JDNN1KmOlxI9lmwV2vfib7GR7dFWZNf6URcWYTHi4YiV2LC1FcMFL2c+c6gqI0d76yA9Oe3YJNFbXcM50NrV341h+3YlMPlRovB6epx6F1iITD7LY4LtcHghnBl+6eiIcLwnvyjMwGi2G3xeH+vEysmT8F2x7Nx8JZwQylyyFtmKJ9HqYlxeP+vEy8cf+1SIjn9+wJxAa47hxdq03oc7QW+VL2qiTAuwJgQnC/FOXnYNuj+VgzfwqKZozQdU23IwHFBSPx/B3jsWb+FHz+m0KYzSb87PXdEfvvdHM7zvYEGby3QOEo9WrF6ebgobyJkjKSOAxydiTBYkZj23nqIEMKZEn/7v3gMPvUEemYO34wpkpUsglI9k3OvhiBvurCCw/+GCIRjXOwt82ySWFxXrB52ZJ7xuVIwAvzJsDtSFBc43ZrHPz+ALpVot9ot7uS71m
z8wRcKcq/4VJAbVM7th9TpzAXYtG6CtX3RlDno/Nd9PjIUatoiLFm5wmqzxGq0x/nZVJfmzZiF2bWeDk4xKFItMRh+f0TUefrQMYAG37x1l7dg2HigVUxotlm09rRHcEqM9Pjht8vTQ8ZbV7ws63BYDUl0cK9X1aKxYdVVIt2c9N+7lIBT0prKerPqSPSde2TxbNH4cd5WcziR6lJFtjizfA283ufednpSB9gUWS2YcmA0zgM7V182g20ZMlIVXzHsXoseGO3YSyAxQUjcaVrQJ8nzOhvbZW0uNSeC5kbI7M7RHxwweo9AJTpjpXE28xmk+Kgtq+zG3e9+pkq3Xo0E5wEROeiuGCkZNWmryI10aLRbrGFUw2+LmrbGg1B0KhWNAh2VjcwO39v76ITyrt94mDqrJcwszZpWBpSE/nQZ5JD1Gw2Ye74wTCbTLocDJKhKC4cqZj1q6nTnmVkhfDZkci52x9QpdwU37o4M5OWFI/UJP3vgdzfKgOG+KU464mDLGcOyDskAUpM7VcaZEgN0J9RTrTG4ZGCkWHaCoC+Z5qRbIt49zSD/Y2tXfjvHwQrIPflZSI5QX+O5/KUBKzfp16poM2A94bDwHoOxJlNyMvOwDPfGxOkfzTgnoamJ8GRaMWvb7wyqJmgswJmFPqbbaBFX38uLGvWabdi8exczBrrDqv8zRo7SLZaIZ7fIXNX4qphYa6L6qwlyV65qmhvBnaZGUmSz8Fu5d/FIIUEixn5V11G/fnl8yZqqqhPHZEON2M1l/a9BFXrrbL/Xey7aEGvVDRYF2YAQDOlGFtedgaevX1cKIKva+kIU52WunZtUzt2HW/EtJwMroJg5Hfq2Yi0gkybKmq5DG6yQJyVpHFU/IFgVvjU2Ta8u/frsL5Dp93a0+sOTbSDUvfHO+v5wjzpIUxWUa2Y2q88eIlKtnZ247myw1j7+YmwjJyeqomUE1Na6aX627pzHbDFm7kQWphNwGfH6pmej5od6g2HoeSDg0i0mJkHm+XWiJvDvNjv3z8Yxmo4MNmGAbZ4nOvgJwiqNwObmmTpl7aBBmR/6w2aE+JNaD/PN0++ePYoDEy2oYiSOrvR14kFq3fjRXPkuaNUraDBzuoGptlFuapobwZ2lycnYOqIdMnnUFrppdZI0YqOLj+2fvkN5l+fhVe3ySu6C/VIzGYTlm2tov4Op92KKcPT8cQtuUx+Ec17IfN4chTsvARBo1bR6PYHsL2qHuv2fq2ZOpIGLkdiWASfkUw3TFta6eWuOkxetJ6NKJWhICDP9N09X2PhO/s1f4deEAeFNjt5srENK8trIoabiFEFgtz/PCobQLBcySPz+cgN2YrUcXJ95HJZJrnMfUztN/gsyUzF83eMx+LZozRfyyvKyGmpmgizOkJbVn6kDu/tPUV1DWeilVsvsz8AVSVcMYR2SPgbtlfVo9sfCDGi8QLN0m3wdTHNkAghXiNq82K071pMnX66pYNrkFFcMDLi3li3+dnWLuoAt79BuL/1QC3IIDbhhXkTqLshMpJtSGfwB6Q6B4SQq1bQgCWxoFQVVavma4HbkQBXik3xmk77BUIfqecw0+PGrkWFeOOBa1E0IxsPfXs4nHYr1/skb+SD/bX48w/HK37ujmuCquSsz+s/pgwDELR3xZQD8GZT0J9Sgto8HqDsf7IgKhUNKRYTLRkdNXVoqfJOTV0r1bXf+oKuNYsG4mz05CynJuajohkjUFx4paTx6Euie8SBaaAciP7H7pOK/ey/e78S2x7NDylE//Wjo2jV0Rt+b14Wlz7OrMsGqH6GJcs00+PG8nkTsGhdRdi6jqn9BiHka+/2B7D8X1WaxO+k5hRYqibCwK+00qt53/1s9S6c6yUBL6FtlNPZ+eHVV3D7vuKCkci5fEAocaC277SyKMlx+ou1l1ZypEWXQmqSBT+amok3P/8Kp5vlK2VOuwU/+/YIFOVnh9kIuZ57OZD1nGyzoM5Hpy7enzDT48ZNnoH4sOK
0Yd8RAEJ22pFkxV0r5Jl7CC5PTtDU0WGEppKWBKjUvdNqMrCgrasbP7x6CF7+uFr2mg2+IKGP0lkZZzZhyvB0mE0mnGlpx4+mDmPu/FAT+iTvJz05SNIjdz48V3YEaz//Ck/ckht6XjRYuvkI3vwi+HeZGXaqv/EHEFEJE2ucLFl/UPFdOe0WfPSrGbDG669HGF7RkIuaWBYjyRw8Odej2AMvzgAH24no1HO1ZqxostGllV5N5bu87Mtkgwy1SDSaIJGzUp+fEC0KbXBCoxpnNuFK1wDNQYYa+wYr1DLC5N+zqKaWbDgU0T62eHYsyBAjzmzCk3M9mv9eKiMnlREnbCxCkKwOAF37jjbIcHCaFSMgthEAni87gp9K/AZvUzuWbtbfeulKsYUY8WaNDQZzaSp2wSgWpTizCZOznPiwwrjM/4+uG4Y186dg16JCFBeOxJI5ypUy4hyVVnoxOcsZcjzT7DYsn0dvo8gzu+vVz/Dw2r1hDI0xBHH3tZmGXj/JGhea/5oyPF21Ap/W0+6mtcOBd2sjyayzQO7e5ar5aUkWTZ0JZ1u78PLH1fjJ9CzFPSGuVouxqaIW057dgjtf2YGH1+7Fc2VHkJpkoWYBXTx7FP50+ziqz55paQ+dKXKsqrVN7aH2pxfvnkj9/MnvpE2cA0EbQSph4udw14rPVOeGG3xd2HW8kfr7lGBoRYOXCB5wIXPwotkkq3otdM66/QEsWX9Qxzero7hgJNZ+fkJRcIo8A1akJQXZkrZX1Yc5q72lnKyEkg2VuNHjgsuRyO2a3uZ2zc8OUGffqKnz9ajuqldhxBUquYzwnHFurN9Xq7o2yTWkeMeVenL7O2aNdePBk1mKLEtqEB/WUhnxGz3uiGARAKY9uyUq++6FuybCbDLhw4pa/O/247qulZZkwdO3jQEA5D2zWXa98/hdxQUj8bNvj8Cu441Yt/drXJ6cgMJcF7U6uvDdsATsSjB6wP1/Pj2OqcMvtKzQVMq8Pc6GuModZBcahTS7TdO7J0O7MTG/4PqBKRgMtHYaU0Vs7ezGjqp65OVkUH2e7DGtM2K8ZyFIJYKl71+pHUeumg8AO6rqMf9vXzC/i/X7arHlF99G3rNbJKvZSqx6cmcsi6ZRRrJNE3HL2s+VWVUfe+cAdi0qDD0vb3M76lra8VzZEclnRH7nmp3HkZZkiWjvlENtUzseWbsbH+z3arLxvIJbQwMNWiOfkhCPu6cMQ03dOWw/Vo/G1gsZb7HjLl7MGXYbYAoOWgqd8uDLM2YWhDieRfnZESVw8YGo9aBrbO1C8Zt7AYQ7q9FkhqEtg5JsJK8hPCA4JHqi3qf5WlLtR2Knsig/RxB4tGJp2eGI3ysOWOSMV21Tu6QDLKXkS0OHGhPkksbCWbkYNyQ1ot2MFjSHhlTwsb2KbfBaC0IDgwLHVWugkWSJw4PfGo6i/ByUVnoNFdNKTbLgmZ5g5lt/3BoRaN9xzVCq65B3IxfIa2knjMaAu3ivzvS4kX/VQEx5erOscwREiqd6m9qxYPUevHj3RNzkcWt69ySL2Z9tRzTbit/4rAZ5ORlUg9VnWy9QjrK2Gull/ZHDTI8b9+dl4lVKdkaSVJRbW6SKSM5V4heYzSbmIINU7VZ/dlyxZVaqtYxGvJgGdS0duMnjZiJuofHRzrZ2YdmWo3i4ICd0z8+XHVZ8RoTSlxXv79de0eUV3BoaaNAa+eb288jLzsCvZ15FlckijsCmilr88h/7wl5qaqIF9+ZlYWh6kvhruECOm18OPA46obPacZ4Pjz0NBqbYMNSZhJ016uWzMy3tiDObsHj2KDzU02ssB3NPz6PShm/wdWli0SLvX6iYLgehQ7mpohYOiTma1J6M8EyPW1M1SSpwoKFDNaIn91LBrLGDQlWH0kov3tt7imp2IzXRAn8gKEDF6oQZ7bCK7Uq3PwC/P6CZd/2VH12NvOwMwyqgdlscpudk4O5rMzFlRLpsMONtasfSssOK6ujCg1o
ukJcK2GlAe1AOsMXBH4Cm7HdtUzteK68OZT8nZzmx63gj8zyR0FZ89KsZmpnR+rPtiKZCNQBsrDiNTRW11OcysSOk8rVkfSUVicri2cYRgxTkuqgDDbW1JZckuMnjkvw8DY430LULCW00r4RsyYZDWLGtOsRkR8MoSXtWrPq0GkX52QCAHcfq8dePjum+X17gzXppaKDBEg0teGM3nvle0KGjMZByBuVsWxeeKzuMARyVuIVgHdTlEREKDyDafkE9uD8vE6dbOrDxQC11BE1+ZxoFcw0hzzBCZKeprQtLyw7jStcA2XckDmbJIKbUvQhLlFqNlzhwoDVEl5rwlBbIJR5IkDh1RDp+MzsXy7YcUQ1Mz7Z14a4V6gJUUt9/5PQ5Xj9JEkK7oicjK6yKANrWbHFBDtZ+/pXi37V2dGNTxWnMHT8YAFSzh+e7AyE7JndQq11HS6WPpk3FbKKfn5GDkELd7UjALI2OlZBuXc+AbX+0Hb3VVvy79yvxp+/TnctCf2Cmx41kmwV3vao+RF5Z24w0u9WQgX/WTgS5taWUJFipQ8/qijS6pHHGgAu+B8v6V9tf3qb20LyIuDVayh+k9fmCVY0jqrY22jCC9dLQQEONXkuIs21dYRkrpcoGjUHhze6SmmjB8rsmhrU10ICX0jE5gGACl+sNsMUjPs4U0SP8xC252HOikZrqVxz50m7w+/IyqTPRLJBySIRrqabOh9WfncBpAcWy2SRvaITX0nt4l1V6MXVEekysjxIsLTRrP/+K+rokO/5IwUhkZiTJVk43VdRiyfqDhrVg/mbWKFyeYgv7fj0ZWT3ZNfL3wZbQHBTl52BHVT0WrJZW4Bbus+QEi+pBea7jPOy2OFjizGE2R3hQq7Wn0Vb6xGeHWpVVjvteK7xN7dQZYjmUVXqx+JbRmvVk+qPtoA2qnXZr2LkjN19Hi9qmdiCgfC7LZYjrfHS2ZdnWo1i29WhIa0qJZh2I3AOThqVh1/FGSX+KdVZDvLa6/QHsqKrHo28f0N2qJAR5Zle5kun+QPBFtOtfas5W6rImBOdFPvrVDNnnSDA5y0ldiY629hkNjGC9NCzQ6PYH8PsP2Ad5f/d+Jfz+YC+gnIPRGwq2Z9u6YDaZNNEv8qR+23LoNJfrlcwdjTnjB0cEc93+AB56g87gSDk2tBu8MNeFMYMdVEOi5Ltof6vQIWlq61Q9qJUcDeG19B7er5bX4JosJwpzXTGxPhWwtNCw2gNyTSEjnTiA2VRRy0U0Ugm57pSwQVKaBApJeDS1dkXYSD3ZNQLhXjabTYqHJdkbr++gmyXwdXQD6EZxQQ4yM+wRBzWtDo9S8CQVnKYmWWC3xsEnaosyoqIKwTVpWkTl8O7er/F4D/scmUksP1qHZVvVtVOc9v4p5kcbVN9xzRU9uiXBqihJHv565ii8Vl6tKPArh81fnsaccW5ZogpChSv2H1i1axp8nXho9W48eDILC2dJa4VI7QGzKfycc9otPQHLIADB6soL8yaiaM1uxfPQaQ8nqdFD960EoW/R0EqXjBQGbbSCuGTOVu293JI12gAAJmxJREFUCyuN4iSHVFKct/izUSDP4U+3jzOUJtuwQINM0rOAvMyHVkce8HrmFHipumrNaPNSOgYuOKt6rycUNhTitXJ5dcvIa0Q6NrRl2EZfBzVLFU3WQQqvfFKFrV9+w8WZONPSjps8blVObTWQ6giLinh/A+uwPO85qMJcFx5754Dua6rhTA+BBTmg/IGA+hBhT8Jj1lg3bvRIM7wIrzlpWBpVBVSqUkQrCPfx4W+oPkewZucJlD92QwRDzKL36J65XPAk204rM6RrdIuNnkpJg+/C4DCx05OznHh790nVNfLkXE+/tB20QfUL/7qgyvz27pOhdR9nNuHHeVlYsa2auWPgrS9OavMxNL6mv35cjXFDUiMY8uTagMVrscHXhYdW70H+rq8wf3o2Jmc5MWusG8swQbH61+C7QFKjRRuMFq4eBjZ
HohXlR+nsi/D9qyV4A0BINyjObKIWdiZdCQRSQZ0jIT6qs7RaIfQ1aJnTtMKwQIN3j2jYnAJlPyRBydzRqKlvxYpPjkVktVigJ6MtzEx5m9tR8sFBTaw5QLignZB96/OaBqwsr0azgk6FWracdvDqO7mX48W7r5Yc1F88O1cyWBSiZMMh1YFHOXavupYOqqzTli/ZHCAlXJ6cgF3HG3UFGcCF6ohc8BkT61OvUIhbaHjPQdkt8YYdoEKIbQCtujCxreJEgRLtspLwVXFBsFVKuJe7/QFqxXNWm+pt7sCyLUdDe7qs0kvVaqRku/oi7TcAfGvkZfiIMRAjkKJiVmsDe3B6VihL3d+gpU1ZXCEVOqgsoAkypOaL6ihFbqXwq7f34/cfHApL6Cq1AUthy7/rsOXfdWHUyvfnZeLdvV+r+ie8beTi2aNChAqNvs6Iiq0c5OyCWoJ36eYjeG17DZ65bQz1GUIqjUptrk0K/ldfQjR9DcMCjZo6H/drhuYUevohaTPcJxra8OfNR3QdQjzo5YhjsL2qXnOQAYQ7WULWpOdVfiNNtnyYk27w6tos+VkVNYEuIPgb/rz5CO645go8V3aEKrMvpK5bsa06Ku1zxIhNGpaGP3MQNAPCmUdoVcT7E2iTFKfOtmF7VT28ze1w2i269hRwwb68veekruvQQny/tOxSUoeiUquZ3CBjkKEtMyLIAILBHs38lN0W19MSxYbnyg5j1afVzM6KnO3qjXZaGgx1atcWEr9nIvAphXS7FSUUvfuXMrS0KUtVSImD+vi7B3TbFCGk5ov0JEl8Hd0Re09rFS3YSRIewCYnxOO2CYPx/v5a7rOUUshItmHu+MHYVFGLBavp5tTUfJqZHjf8/oBscH62tQs/fX03lt0xHskJ8YpiwsCFSuPkLGefTGzIwYQgi+h//2A86s4Z1yIlB0MCjW5/AGt2KguW6EGdryNkUGhe9KpPq3UviDnj3IovhUVgike1RyxuRbPoB6bYsGTO6IgIVnjvIy9PjujnFMNsAkYOTA6Jcol/K+3vI/3GRDlUbkhUDC1CQ1pAftGcce4IfQA9EJd4+yMNpRJoD99f/mOf7gqTFIwS+NILucwdTasZGWR88V9VWFVejbNtXT0MfUHWE/Feo93DIy9Pxp6vzmr6PaxBxiMFI2Wzb32RZclsAv62g/0clHrPaiQB/T3IIGCljQWkSQZmetxo6/KH2oR4QbxOeZHFGIGW9vP4H52CoSy4PDmBuTKplpUPzgqrdz/8fO1e6u8k+iB6/QGn3YJGH714oFYQP2bJnNHIyza2RUoOhgQaRorlAcEFOXVEOl68eyIee+cAlVCOXqzfV4tfzxwlGTywCkzxaPUQXmPHMToxsf/+wfiIhSZ172pqqgmWONyzcmfon8W/VUgzR4OmnvdTrMICJASr0JAWuARtJzyMQWzImw60h68RQQYAXD0sDf+sPG3MxXVAbqCUttXsxX9VSYpSSg3Y09oorUGGFmRmyFdb+yLLkp4ZDeF7VnO+TAiSpyTb4vFZTT3EQ879DSy0sUKIg4AT9fy7MsTrlDdZzMUKV4otJPRH48sUzchGXnaGqp9AOyvM8twvT07QndgYYIvD3HGDsOpTPoEc8S1+cPUQ/M+nx8Oq40rBGEuCXA8MCTSMzC4JW5i0GhQtkKNV1CIwNTnLqbnVg5TA/IEA1u39GjV1PqzcJs10IYa4H1Tu3tt6ggzx4DP5Z3EQIvytALBk/UGm30Syrms/P4Ftj+ZTL3QWoSEaJFnNeOU/rgmVFicNS8O3/riVm/GXcxRjCIfWPmleGOVK0dwSJIYJgF0DGYVUsE8qf2LQ2tuXP66iHrCnoSZXq3zyBsl4Sh2MfSkzrOe5mE3A/Ouzws4M2kDynlUXkj/Lth4NKbb3x3kvWtpYIZyJ1hCRQsYAG1Z/xjebL9d+zZMs5mLFkjmjEWc2wdvURvX5pja6Vi6evqgwUbizukHXtc51dIeCDClGMBb
fkASoTW1deH7zBVY6NfFi1gS5HhgSaBiZXZrVw7RCDhgtBkUrxJExKzsOQZzZhFvHD2Z2ksmCaj/vx10r2IMr4XuhuffLB1jxwPUj8FVjK65IS8KKT46F6U+IP7/wnQNhAncs0MKRn2G3wZWSgNPNfJwLa3xcWBZQjddfCKfdCr/fj7Nt8g6l3RaHti5/iBowFnDIw6g+aRo0tHXijquv0B3EkrcbH8f+nqUqik2tXZLJC1p7qzS0Ldx/k7OcKNmgTk0ezSDDlWJDo68T057dInsw9mZmOCUhHrdPGoLBqYma6FEJAgHg5Y+rMWFoWugda3WWSP/5S4xq6pcCtPggD7+119BZBKUkk3her6bOh5c+qkJbV99nL9IDEgwX5rqwvaqemsHubztO4G87Tqg6xrx8UfEsCKvIoRJIMve+vEwU5rpCCU7qpEmPwROfGUrixVoS5Hpg5nYlASZnOeFKYWufocWr5TW485UdmPbsFmyqqI1qybxBVBFgYccRoyCXXTnWITHLQAMTIrMpNPd+uqUTnsEOPHHLaJhNkAwyhJ/XGmQIocaRP+3ZLbjzlR14eO1e3PXqZ2g/3x0KdIQw9fzfg9Oz4HbQK3UK3xXtAV80YwT+cscExSADCA7vFb+5N2z9xiCPmR43Ft88Ourfe3lygqb9KYbLkYBHCkZyY2chh8Lv3q9Et8DLJ4eeXDhD9gINePUf88bc8YOwYPXuiPsiB+OmitpQcOoS7ffUJEtENchpp2P4okFakgVfLCrEb28ZTU2TKQepd6z3jBOvl/4AtT0hBaOCDLstTjXYCxeVbcXSsiOyQUZqYjxSkyxamXG5gXy/XKVVDWlJ8dj5eAEAhM71dymZ7gjI/t+4vxbbq+qxbu/X2F5VH1rvQV9Uv4/ociSEOd+k6s4DxH/5sMKLyVlOWOPNoWtL+TVAkCnw/rzM4N/LbG2580ItySz1N3phSEUjzmzCnZOHGqp6SBbY8nkTVUvm1jgTOrv1P7QGX2fYADStIyr1ORpBGSFLQIbdhl/8fR8AbU6LOJtCe++llV7851t7o+Z4iKsuwgyP1Hoi8x0OEad3kIc7F2l2K65ypeCjw99Q0XWWH/0m1JZBO2tiiYtjrqwZlTm41MDjkGBBatIFsTPWVhwTgpWtRbNHweVIxOQsJz7Yz3ZwqkGq8qfU582a3efRf2wE3vziJFXlWI7JDUCEUvLEklIu+ko/uHoIrPHBnB0vqmXhO9bbFkZTKb7U0Nvtl0KotWBKtbAoIdEaj8WzR2HB6j1Rrd6J2zlJ739hrgs7qurx0Bu7mKhdG1vPy86N0YL8nVhoUFjpWDJHH3HM4tmj8OO8rIhq1EyPGy9RzgmrQbzn1ejvC3NdmPRkKfN1AfoE+Y5j9dyGxw2jt83MsBt1aQAXDpiSDZWq3OJyQYbbkYA7rhmKrm4/leLqcoHQD/lbGtTURWpTqDkHQDhLAKHxZIVcny7tgbjSwGFrKTT2OOy0xpesg4R4M9544NrQfEWjr4Oah1uIZVsvvGNXig2pSRY0tSozQywtO4xHCkYyfY9Sa10MFxDt3vt7r7twoLC04pC394dbPbqUuWkhDgaUDqabPC6qfUyCLL39x0ZA6SAXH6ZyTG5izRHaIEONHENIFNLo6+Dm/An1UvS2hfXF4NFoXGCgOmgoOY0alOy8GpuYFGqb2pFmt/W0llZEhXoWCLbmOO0W3Dp+MApyXWHtv2azSZN+xKpyPkQr4uS7OJH3wryJWLBmNzOBSLrdKhlkEJDExl82H1GVF6CBcJ8q0d8/X3aYKbgRCg3S2oIFb+zGM9/jM+NlSOsUQH/ADrDF4eEbsgGwi2SSA8aRZNVUvls8exQeLshBceFI6vYaAm9TO5aWHaYqYS4tOxxqk+n2B0IlPkeiFcvnTYgo9YvLdN3+AMqP1jHdH8HyO6Uz5jSl5d5wfUs2HMLG/afws9cj2yTkEEBQBMxsMmHu+MFoauvEgtV7dFdhvM0dOKs
SZJDvX/v5CbhSbEzPTKm1LoYghCVqo9djapIFRfnZoX+Wa8VJk2jFEe9ZAi0tHDSQsq8zPW5sezQfa+ZPwfN3jMea+VNCwp40IEFWo68DSnGvCdrbJYRwJPLNc9EeoKR1gBZqdMdkD2+qqMVDEqrMWiF8x3JrUcu1+hNmetwof+wGFDMmgnhCzs7rEZk809IebC2dPYrLPdKi0deFleU1aGrr1NQhIQatdhArxC1As8a6sfzOCczXKZnrUU0CxplNeKRwJJbPY7++GFKsZFNHpGPu+MGhJEq3P4BVjAngd/d+zdyKebatK9SWqheGVTRomZXOdXRjyvAMjHKnRGTjUhMtVAtxe1W9prmFkg2HcKNIDZR205OMNG2G6XfvV8LvR0SW3S1o8ZGiGGMtqwp/n8uRgCky5XKaLFlvdPXWNrVj0boKzcbXCIVgmndc29SO4oIcLJUQH1RDf8w2siBarCzP3DZGsjxO04ojN9zPs61JiEaZVj2pbD6ZmVPK6pIgKyiWpe4s33tdFp4rO8x622F44a5JMJtM+LCiFv/Lga+f9gBlmUGhPYO8ze149kPtQ+BSEL9j8VrMGGDDf765B6dblDPaPMRmL2bEmU14uCAHV7oG9Cqzk9jO65mFImvd5dAuCKkFcpV41kDWBMBBube0QlzpnDV2EF4ym6jXwIPTs5i0aW70uFFccA6ryms0/S7afbqzuoH5+kRoUEsrJo+uC8MqGoRZiQYkOhdn45bfNZHy29iPa3GWgTgzLJUNMgB9+0Tl30m+6yGZYcYFq3ejqa0zImp9vuwIfsqQ2SdQU8skIL/ZwSE7yRNaWYaOnD6H18r5K4bTrq6mti5NWcf+mm1kgdA+FM3IVv8DCcgNL7odCYrDmlJZJal/p3TvUutCz75btK4C7+4JH3wUg1RPn9pQiRaVNqFnbhsDAKpButkELJ83EUX52borNWdaOjB1RDpu4lCaT020wB8IUA0wsgT29/YMXKqh4VwH9/ac339wYSCTvEsy83Pz2EHIy87A7+Z6VK8To9QOgocN0QOxndeSYBITuxCnMZqQqtCwVG7JZ2j3ll6I25GEfmZxwciIOUCn3YIX5k3Awln0w94b95/CNX8oxXNlR0JBQJI1jvrvTaDfp6WVXurrCvHPg8HKBMsgO6+uC8OUwXdWNyCR8kGTDSjOxnX7A0gVDfkKQbL2U4dnhPXWs0CpJ+7I6XNUsxtJNu2PUSpDsKmiVldfKY1appAiNiE+DlqHzPsSaN4VQdGMbOQMHED9jmmwbu8p/GZ2bmgNeZvaULLhEBp9nbID/zEBP3oQ+0B7QIuz0cJBumiIFAkRkY3WSe7Q4OsKqRZLUTwGbYi6OrJwhouGztkfANLsVi5zA4TFj4YYw9EzKwWZ7zrb1oW7VnxGxQNPG9gXF+SgKD8Haz//SvHeXI4EOO1WqmsSpNutqFfprfc2d2DZlqOSmXjh75QbSE1LsuDpfqqjIQdWG8IDcnZeSxUACHdItXRj8ILwGbLYg4EpNvz25lw4Eq3UFUM9kGtHIijKz9Z1Hjy9sRJ//ThSy0yt5ZKAZZ9uqqjVPDf72vbjuCbTiVljB4WSX4+9fYDq+evdL9wDDZZWHzVHq7TSqzoE+MQtuZgyIl2zAF5dSwe6/YFQFUG44JxJVizbqn6NgE6JYmHU2NTWyWw0yGA6jaq21lYsVhTNGIGcgcnIsNvw87V7ojawRgtLnBlzxw/G9qp6boFGva8zVJ4khizRGqc48B/LNoaDRqmU9oBePm8izGaT5LV6g4FHeMBpJXeQgnDwsTDXhWVbjlK3NSVa4kIzHKwsenpb2ohzTkOMIay4KH0XDZsbTeuA25GAovwcqnt74pag00SLxbNH4WRjK5UqsNx7FP9Owvyz/Vgd+rsyOA2iVUVWsvOsLSxyCcSQ08iB/YgF4mcoZw/EgnTt5/14/L0Kw++VNpFHdDHIuSPUaVPDxv21kkEGLaYOT8PrD0yl+i7W2TI
xAgHgodV78JLZhJkeN5Pgtd79wjXQYGFQUHO0aB5qapIlVAV4cq5HkXlKDiUbDmHFtmrMGefG+n21ERtEDWZTUDyGB7zN7fivTV8yBRlFM0aguPBKqoWqheFCK/KyLws5Vd8dPyjq7FVqIEI2hbkubsI7ABsbkBEKnBczaJVK1cSShPNJcvuCJqAxEjwzqkLBzCfWVaj27Ash7GGmPUzEQ8p+f0CT7RX2l9PuE+JQL1i9WzITR8PmRhs8kL+lubduf0B1DgYIrme3I0GXqJ/c78zLyUBeDh86yksd0WKzU7LzNPNbxQU5yMywq9ooEmwu23IkYkbAlWJD+3k/d8e+USJ5KKzcllZ6sbK8JoIRKlrBEElEq9l1pXNHaT7P29SG364/qOsetx9rRNHq3RhxmR1Th2conlm89I2ENmPKiHTVajKPrgtugQbrEK6ao0XzUInAGhn0efDkWU3RZW1Tu+Tf0eiV8NRBajjXwbyQ8rIvCy3MzvN+/G17DY43tGKYMwn3TM0M8bvzHJIWZyiEkFqYhbl09JpS1zLyECAb7olb9PFsC3F5ckKEE1uY65Jt1+lth7evgEWpNM5sgmdwiuJeER4w4mfc6OuUJGUwIvDr9gckM828M6pkXkwLSNBD08Ik3tvd/oAmp9lujYs4vJToHAnizCaYzSbFcr8Ud7wYrAkAtXuLM5vw25tzVQOuxbNzqVTXaUDzO2O4ALEdIFoURkFOf0EInomo4ND7SBTl54T9Tn8ggLtWqGetWVGyoRI3eiKDeVIhIK2dLLDb4lR1R2hxX16m6vNTOnd++vruiNb9VI2iyUr4sCI4c7Fsa5WsHAHALzklpgJnSbpoBbdAgzbaKpqRjbzsDFWHSosY3sJZuUi0xGPpZuOEAo2Alj5f8aH/9MZKvPJJdVgA8IeNhzD/+iwsnJXLVe33/mlZWPFJMDCjWZiThqUxtbal261YMmc0ntp4yLAWL+EhHeTZnoCiNXs0B47kfTT6OjDt2S1UTixtBv9Sh5pSqThz+/TGSpRWnpG93qRhqeg478f2qnrJoEIKRggobqqojWhnWLb1KFKTLHjqu2Oiqg+ihAy7Ddur6nGmpR13XHMFnpNgTpPb25rtiozpl9PAEEKPUKoQNIEN7b1tqqhVDLjs1jj8ZPoIOBIt3G1ajLVOHXK29ifTsyI6GfSCnAVqQQYQtH2ORCt+feOVaPB1wjnABleKvoSTeJ2u2/u1puuoQSnIXbbliKbWUJogg2a+CYAqrTeNQrY4oDC6GnO2tQs/fX23JDkJz+SUeDZZSm9mYIoNS+aM5nIecgs0aI1dzsABVNkXLWV8AMi6zFihQL3g1edL/oY4XnIVGfLvuzgooxN8sL8Wy+dNQMmGQ6pZGGLgWeZn6n2dWPxeBX583TBck5mOOl8Haup8WLPzBHdmF29zO7ZX1aPLH0DRjGz8eYu2eY0AAM/gFElqUHEP/c7qBpRVevGqRJWnPyqG0yqV/uz1XZg4NFW1avnF8bP44vhepnsQBjT5Vw3EruONuqpMmypqZatkZ1u78NDq3XhwehZe/rg6quq+YqQmWfCLv+8LcwqksnZyGVatTq6vozvUC81a0dNyNshVDmkCGykIr1dT58NzZcrJLV9nN54rO4zURP4Mf8I5wxgioZS1fvnjaiyfNxFpditKK714b+8p1XlCpf3KkgVWSjTJVWO12CIj51Gk9v+milrV/aAHT8zOxZINB2V9Ctp2H57JV95Ysv5gROsnz3Y/8Zrw+6WErfnZE26BhtbAQAjhpqr+xqfYogNcULLVch+9geKCkVj7+YkI53zx7GCQ4W1up8r8C7Penef9eOUTZcfr5U+qmRUxlUCUSbc9mq9oBPXMhJxt68LSzUeRmnQcz9w2JqIkTFh7Tjfr23QlH8gbLFbIZdmJE/vYOwdUmYBoeswvNdA6q/+sPI1/Vp427D5IQDPl6bKwNcFaZer2B7CEonf377u+xo+uG4b1+2p7jSw
hGEyEr3/C7lRcMFKVYEKPvS2t9OI/39rLXNFjbfGScuhSEy24Ny8zNPDNAj2EGkYw7JA5w/5WCaUBTda6ZEMltj2aj6kj0vGb2bmiNsuOiISayQTZ85S25YmmVRSIJD/QUvE2ch5FvP/1DizTYMkG+cQlS6DXlyuB3uaOiGoRD6Y/qSBMLlHtbeaX9OQWaNAyechFmVqM99nWLpRWeiUHRftCSwIBeblF+dkoys/GjmP12F5VDyCYhfr9B/RUtnZbHBbPHhX6zX/bHjlsJQbPIIPgTEu7YjaQZibEabfC7+/G2Tb5cunZ1q6wxS78viVzlAfpUnsoMZXugVeQoYYApJ06uc/2p97rvpYcEK+J2p5+XSWtDSF2VjdQ7ecGXyde62EectotmDtuMNbt+zpqa1IOJNhd+/kJbHs0X/HA1mNvpea2aCp65MCVqxgJh0DlHLqzbV14ruwIVn1aI9sTLYVoEmqwoD9WQmlAk7UW96yLbe6NHndYFVrpvKVhoKRpFV34zgHJmSst75mHgyqG0GEVJojrWtjnTFmhlJRhmW2Jxrkz//osvL/vlKZODKlASC/DmHhAfuP+U4odAgH0McE+oQiI3O20dXVLio0Q461FmI5IzLPcR2+AvNzSSi9++fd9WLb1KJZtrcLzm48yLcLWjm4sWL0nJAt/vKHVqFtWhNompTHwDb5OxSCDgCx2sRiXnBCa027FC/MmhigxxeugL60LJfTljAtPsIg99SYee+cAd0E4gkZfF177tAbfnzSE+Tm4HQkRIoR6wSLUdMc1Q5mdF7nfSK4jtd9ZQZPsIIkMYk/1Xq+3wPO5XUqgnRNQ+hwZbt5YoS6Udrq5Q3U90bSKyhE7aH3PcmelnoL5E7fkorTSi2nPbsGdr+zAw2v36mZT04N0uxUf/WoGdQBm5LmT3uOD/GZ2LpbMGQ0T2P0OOR+rMNeFhHhtrntxQU7o+XT7A1i0rkL1b3gI9nFVBldTmm6SMOp6jLfcYUjuY2BK38iUkuehNaASQmxohjmTONwhG5z2yJY1MXg7yXKLfabHjcWzR8Fpv7Dm6nsGgAHIBiIXA/papt8o9NXkgBhnW7uwjGKGR8t7I/t6/b5aPHB9JvVzWDx7FLY9mo8fXj2E+TtpoLSPN1XUYtqzW6g1O4RQsvdqQY5aewZJQO2gECAk30fjuPXlnm6An4rvpQQiCqn3c7TvniYQ0Hs2an3PYlXsNfOn4MuSm3qU0kdQXyc10RJq7dLrz4ihx/7X+zqx63gj9ed5nztOuwXP/TD4XHf+pgCzxgYderkgTwmuFJusj0VbMZdCZsaFGead1Q3U1XO9a5ZroAEoR1tSm5CH8ZYrMf3398fpuq4S3I4EPDg9C26KxUMCrMfeOcAlGyY0NPdMzdSVldCCJ+d6uA1sskBu8GzB6j0RG4aUmAFEGNdFs0dxvzeeMEG5zfBShBZj3BtY9Wm1qkM6OcsJV4qN+dpkX7/ySQ21nchItqG00ouXdYhGKUFuH6slTYoLcvDCvAlU9lEOcocbLXlAkFKYDjSO28VSYbxY7jMaoE0qqX2O5ZmqBQK8zkYt75m0hs0dPxhTR6TDGm/G1BHpKC68MixZp4TldwVJTYyo7um9Husz4XnuPHXrGNw6YXCoBU/8PcQPuS8vU/VaS+aMlvWx9Oxv4dpjuU6fEuwD1KMtcf85D6Mo9xDqfHRRnyPRguY2+V7+1CQL/nLHBJhNJtT5OsKGI389c1TPb26XHSyWo0rTizMt7bDGmzH/+izFPrskaxzaOru5GIUHp2dh1thBqp+jHdgMBALU0XlNnS/sn1loUYV9t8H5mL4JntzVFxuEdKNvfX4C7+49FbXvpqVMFGr3yCHObMKSOaO5abMoIWOADb/8+z6mvU0zw6TE3KJWhQ7Od3yFbY/mh/rbvU1tKNlwiGnoXc6u058ZbPtH7boXS4XxYrnPaEAoCqnnc1qeqdx6UhMcpQXP90wreux2JGDK8HTu1T0
Tgp0fen0kLc9ETHOdMcCGX7y1l6lqIGxJkgMJ8qaOSMfkLKfknIWSjgaBlt8oZc9pr5Nut+pOenKvaLBynOvZLGqZX9pr35eXFbqe+PomAM/cNgbXj7wMeTkZoUyAUKhp6oh0uFISoj7ESX7fwlm5eHB6VkRlw2wKBgb/3w+ClR2WY1d8LdJzuHBWLtXfK5Ulhc70kjmjqe9pzc4TYdlk2symOLOk1ptpAqizOzRwpdiQmmShev4uR0K/Hugk++nZ28cZVqlLTbTghXkTwqpc2xfeQE09SmPjZnrceOnuidxnJwiI7UMAzAe+y5GAl+5Wn2GSC3ZZ9l3IPjoSqYMMXnZ9ao/qLS3UrmtETzfPNs7+WAlVA3lnSqB5Zlrevdx6Ep6NWmDUe541dhAenJ6l+L3EJvCsmpFneu918t9NAz0OsbDSk5edEZqroIHbkYCi/Bym75vpcWPXokK88cC1KJqRjaIZI/DG/ddi16JC1bOfdS3K2XOavQEAJRQdLGrgXtFgpbnVylpCk/mlzaoX5WfjStcAXeqc0SxXS0WnC2fl4hffuUpWGVxKfdTdQ62bZrfC29QWJhg0aViabi0BWtXTl+6eiF/+fR/OqYj1iCnftAp30ahhPjnXg5INhzSzl6UlWfDbW0aHxJdKK72KDFn35WWiMNfVb5XBxaCp1GnF8rsmIi87I+Lf35uXScX/TmvjSKZs5bZj+MPGL5nvUw1P3JJLXbUtmpGNnIEDIvayFlViLfuO1T7ysOtThqcrslOJP6/mpNDYjUd6KIEzBtjw0Bu70NR2XvE7/+u2sbhn1U7F7xWCVKEg8/39sRKqBOE7k1srNM9MeB010KynmR437s/LlNRSUrs2YNx7XjgrF+OGpGHRuoqwxICYVpdnNcVpt+IPt3pQmOvC2s9PaD5z544fxO2ZyPkuQuh9F3FmE/KyMyTPIrW/Y2ERk7PnansDIB0sfUiwj4CV41wr9RpNEMAir86qEisGz40nvFe1+xbCGm/G/dcPl7ymlt/Hg1qV5ntnetxo6/Kj+M29qtcTOix6tFtogiCz2aSZEvBpUfmTNuiK4QJI9UyseC+EWGtHSXtH6IBKoSg/B6s+rZEt39M6pELEmU24b9pwrCyv4Ua5nd5zMM/0uKnbAPOyMyT3sxa7oGXf0f6N027BU7cqtw6w2vWXFOggWZ0Fln387PfGSgY5wu9saGPTTyFVqJgdoYfcO2PVpODtfBbkupgDjWi851lj3bjRo2wTeMoILBLQ9dMGc1JQUwJnhdA2Sok59uaeU1rTi2ePQprdRmXP5a7jtFvw5FwPVZs8DUwBCuLn5uZmOBwONDU1ISUlRfWiZFAQkD4EpFpDpHQ0XCk23Dl5KDIz7Miw2wATUHeugzkIUFLg5LVIuv0BTHt2i2KAlZpkQWNrl6rjSu4N4CPYczFge1U97nxlh+rn1syfEnKYaJ65y5GgqAWgprwqt3bmjHPjzS9OMvdY8lB6Zd2PfQVa77vzvD9UqbsiLQlXDUxGQ1snLk+OrLw1+jqxYDWb7RFCTieB9u/Vriu+L4LUJAue+u4YlGyoVDy8nXYLdiwsCFUqeewBVmj5TrW/AYIB1PaFN4R+mxpY7Hq3P4BlW45iVXl1mGieVntKu4/V7pHW7g2wxeNP3x8bRk2px470NxsC8LG9wutIOZ8s64l2H/3p9nERs6F9AWo2jRbCM51cd8l6em0xIPjcedo4KfBaP33xnrReh3Y/GhJoANqceyNfZDQWCU2ABUgHD3dcM1RShbcvLm4joNVh0hLUark3qXfQ7Q+EiS9OHZ6BKRKME7zRH50EFuhNLBiVmJBUqE6y4N7rslCUnx0mMAewJWmM3gNSv6Uv3CerfewNe6r0nTQB2ABbHHYv/g51AEaDmA3hA73rqTf2Lk9I2bS0JItAoFYeSkkQkhhQo86+WJ7TpYpeDzSA/uMkC0HjpPTH50IDrUY3GhWrvoS+dtjSIpr3rXePGbVHaa6
rZT33xh64WO6zr0MtM0yrSM+CmA3pO7jY94SUTQMQqvqsLK+RbXGkqTArtapdTM/pUkSfCDT6K2KBhHZoNbr96ZlfrPvxYr3v3oCW9dzXsvV96T77OqLtbF6se/FivW81XMp7Qu/aFj6bjAE2IIA+2UrWHxELNGK4aHEpG10euFj348V63zHEEA1E0+5drHvxYr3v/o7YmX5pgnY/cmediiEGvSCc1jHEEEMM/QUxuxfDpYrY2u7f4C7YF0MMMcQQQwwxxBBDDDHEEAs0YoghhhhiiCGGGGKIIQbuoGqdImMczc3Nht5MDDHEoA6yDynGq/oUYnYkhhj6BmI2JIYYYtALWjtCFWi0tLQAAK644gqdtxVDDDHwQktLCxwOR2/fBjVidiSGGPoWYjYkhhhi0As1O0LFOuX3+3Hq1CkkJyfDZIoxBcQQQ28iEAigpaUFgwYNgtl88XQ/xuxIDDH0DcRsSAwxxKAXtHaEKtCIIYYYYoghhhhiiCGGGGJgwcWTyoghhhhiiCGGGGKIIYYYLhrEAo0YYoghhhhiiCGGGGKIgTtigUYMMcQQQwwxxBBDDDHEwB2xQCOGGGKIIYYYYoghhhhi4I5YoBFDDDHEEEMMMcQQQwwxcEcs0IghhhhiiCGGGGKIIYYYuCMWaMQQQwwxxBBDDDHEEEMM3PH/A+bS5Y1QB4VAAAAAAElFTkSuQmCC", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "generator = TSPGenerator(num_loc=1000)\n", + "env.generator = generator\n", + "\n", + "fig, axs = plt.subplots(1, 3, figsize=(10, 3))\n", + "td = env.generator(3) # generate 3 instances\n", + "for i in range(3):\n", + " axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n", + " axs[i].set_xticks([]); axs[i].set_yticks([])\n", + "fig.suptitle(\"TSP with 1000 locations, uniform distribution\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Changing distribution of the data to normal distribution. We can pass the arguments to it by using `loc_` + distribution name as well as its keyword arguments, including here the `mean` and `std` of the normal distribution" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Text(0.5, 0.98, 'TSP with 100 locations, normal distribution')" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "generator = TSPGenerator(num_loc=100, loc_distribution=\"normal\", loc_mean=0, loc_std=1)\n", + "env.generator = generator\n", + "\n", + "fig, axs = plt.subplots(1, 3, figsize=(10, 3))\n", + "td = env.generator(3) # generate 3 instances\n", + "for i in range(3):\n", + " axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n", + " axs[i].set_xticks([]); axs[i].set_yticks([])\n", + "fig.suptitle(\"TSP with 100 locations, normal distribution\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can pass a custom `loc_sampler` to the generator (we can make it ourselves!) to generate data from a custom distribution. In this case we use the mixture of three exemplar distributions in batch-level, i.e. Uniform, Cluster, Mixed following the setting in Bi et al. 2022 (https://arxiv.org/abs/2210.07686)" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Text(0.5, 0.98, 'TSP with 200 locations, mixed distribution')" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + }, + { + "data": { + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAxoAAAEZCAYAAAAQS1PVAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8pXeV/AAAACXBIWXMAAA9hAAAPYQGoP6dpAAB/GElEQVR4nO2deXxU1d3/PzMhOyQhbAmoJCIKMQiKIsjiA4VHNBaK2wPqY10erQJPXarVqvzEh1blsRZtUSqKWrWA1qVasTwlhZalQaxspkGBmOBCgpKEgAkkIXN/f4Q7znKXc+49995zZ77v16uvymTmzpl7z/me734CiqIoIAiCIAiCIAiCEEjQ6wEQBEEQBEEQBJF4kKFBEARBEARBEIRwyNAgCIIgCIIgCEI4ZGgQBEEQBEEQBCEcMjQIgiAIgiAIghAOGRoEQRAEQRAEQQiHDA2CIAiCIAiCIIRDhgZBEARBEARBEMIhQ4MgCIIgCIIgCOGQoUEQRBTXX389ioqKmN/bvXt3ZwfkMkVFRbj++uu9HoYuL730EgKBAGpra70eimvMnz8fgUDA9e+1e6+11lIgEMD8+fNtj82Mv/3tbwgEAvjb3/4Wfu3f/u3fUFpa6vh3A0BtbS0CgQBeeuklV76PIAg5IUODIAQQCASY/qdu+t988w1uv/12DBkyBJmZmejbty9GjRqFe++9F99++234utdff33U53NycjB8+HA88cQTaGtrc+W3tba2Yv78+VEKiwhCoRBeeuklTJs2DSeffDKys7NRWlqKn//85zh27JjmZ5YtW4ahQ4ciIyMDgwcPxm9+8xvN93311Ve46qqrkJeXh5ycHEyfPh2fffaZ0PE7zSOPPII//vGPXg+DkIDly5fjySef9HoYmsg8NoIgvKeb1wMgiETglVdeifr3yy+/jDVr1sS9PnToUDQ2NuLcc8/F4cOHceONN2LIkCFoaGjAzp07sWTJEtx2221RUYL09HQ8//zzAIBDhw7hzTffxN13340PP/wQK1euFP5bnnvuOYRCofC/W1tb8fDDDwPo8oiKorW1FTfccANGjx6NW2+9FX379kVFRQUeeugh/PWvf8XatWujvNjPPvssbr31Vlx++eW46667sGHDBvz4xz9Ga2sr7r333vD7vv32W0ycOBHNzc24//77kZqaikWLFuHCCy/E9u3b0atXL2G/wUkeeeQRXHHFFfjBD34Q9fp//ud/YubMmUhPT/dmYB7w4IMP4r777vN6GEI4evQounXj23qXL1+OyspK3HHHHcyfmTBhAo4ePYq0tDTOEfKhN7aBAwfi6NGjSE1NdfT7CYKQGzI0CEIA1157bdS/N2/ejDVr1sS9DgCPP/44Pv/8c2zatAkXXHBB1N8OHz4cpxh069Yt6jqzZ8/G+eefj9deew2/+tWv0L9/f4G/BK4pBmlpaXH34Oabb0ZRUVHY2Jg8eTKALuXsgQceQFlZGd54443we0OhEBYsWIBbbrkFPXv2BAA888wz2LNnD7Zs2YLzzjsPAHDxxRejtLQUTzzxBB555BFXfp9TpKSkICUlxethuEq3bt24lXNZycjIcPT6x44dQ1paGoLBoOPfZUQgEPD0+wmCkANKnSIIl6murkZKSgpGjx4d97ecnBzTzTkYDIYjC3q544cOHUJKSgp+/etfh187ePAggsEgevXqBUVRwq/fdtttKCgoCP87Mq+8trYWffr0AQA8/PDD4RSu2Bzzr776Cj/4wQ/QvXt39OnTB3fffTc6OzsNf0daWlqcoQUAM2bMAADs2rUr/Nq6devQ0NCA2bNnR713zpw5aGlpwapVq8KvvfHGGzjvvPPCRgYADBkyBN/73vfw+uuvG45Jj88++wxXXnkl8vPzkZWVhdGjR0d9p8qxY8cwf/58nH766cjIyEBhYSEuu+wyVFdXh9/zy1/+EhdccAF69eqFzMxMjBw5Mmw8qQQCAbS0tOB3v/td+J6rdSN6dQPPPPMMzjz
zTKSnp6N///6YM2cODh06FPUeNUe/qqoKEydORFZWFgYMGID//d//jfstv/nNb3DmmWciKysLPXv2xLnnnovly5dbun9FRUW49NJL8be//Q3nnnsuMjMzMWzYsHA63ltvvYVhw4YhIyMDI0eOxLZt26I+H1uj8eKLLyIQCOCFF16Iet8jjzyCQCCA999/P/zaJ598giuuuAL5+fnIyMjAueeei3fffTdujP/6178wadIkZGZm4qSTTsLPf/7zqMieGX/84x9RWlqKjIwMlJaW4u2339Z8X+z6OXLkCO644w4UFRUhPT0dffv2xZQpU7B161YAXc9s1apV2LdvX3guqOtTrcNYuXIlHnzwQQwYMABZWVk4fPiwZo2GykcffYQLLrgAmZmZKC4uxm9/+9uov+vNsdhrGo1Nr0Zj7dq1GD9+PLKzs5GXl4fp06dHrXXgu+e9d+9eXH/99cjLy0Nubi5uuOEGtLa26j8EgiCkIzFcRAThIwYOHIjOzk688sor+OEPf2jpGqriqpcGlJeXh9LSUqxfvx4//vGPAQAbN25EIBBAY2MjqqqqcOaZZwIANmzYgPHjx2tep0+fPuF0rhkzZuCyyy4DAJx11lnh93R2duKiiy7C+eefj1/+8pcoLy/HE088gUGDBuG2227j/m319fUAgN69e4dfUxXPc889N+q9I0eORDAYxLZt23DttdciFAph586duPHGG+OuO2rUKPzlL3/BkSNH0KNHD+bxHDhwABdccAFaW1vx4x//GL169cLvfvc7TJs2DW+88UbYMOrs7MSll16Kv/71r5g5cyZuv/12HDlyBGvWrEFlZSUGDRoEAHjqqacwbdo0XHPNNWhvb8fKlStx5ZVX4r333kNZWRmArlS8//qv/8KoUaNwyy23AED481rMnz8fDz/8MCZPnozbbrsNn376KZYsWYIPP/wQmzZtiopSNTU1YerUqbjssstw1VVX4Y033sC9996LYcOG4eKLLwbQlT734x//GFdccQVuv/12HDt2DDt37sQHH3yAq6++mvneRbJ3715cffXV+NGPfoRrr70Wv/zlL/H9738fv/3tb3H//feHjchHH30UV111FT799FMEg9q+sBtuuAFvvfUW7rrrLkyZMgUnn3wyPv74Yzz88MO46aabcMkllwDoMh7Gjh2LAQMG4L777kN2djZef/11/OAHP8Cbb74Zfnb19fWYOHEijh8/Hn7f0qVLkZmZyfTb/vKXv+Dyyy9HSUkJHn30UTQ0NOCGG27ASSedZPrZW2+9FW+88Qbmzp2LkpISNDQ0YOPGjdi1axfOOeccPPDAA2hubsaXX36JRYsWAUBcA4YFCxYgLS0Nd999N9ra2gzTpZqamnDJJZfgqquuwqxZs/D666/jtttuQ1pamua6MYJlbJGUl5fj4osvxqmnnor58+fj6NGj+M1vfoOxY8di69atcYXzV111FYqLi/Hoo49i69ateP7559G3b18sXLiQa5wEQXiIQhCEcObMmaPoLa/6+nqlT58+CgBlyJAhyq233qosX75cOXToUNx7f/jDHyrZ2dnKN998o3zzzTfK3r17lUceeUQJBALKWWedZTqGfv36hf991113KRMmTFD69u2rLFmyRFEURWloaFACgYDy1FNPRX3nwIEDw//+5ptvFADKQw89pDk+AMr//M//RL1+9tlnKyNHjjQcnx6TJ09WcnJylKampqjfkpKSovn+Pn36KDNnzowaa+x4FEVRnn76aQWA8sknnxh+/8CBA5Uf/vCH4X/fcccdCgBlw4YN4deOHDmiFBcXK0VFRUpnZ6eiKIrywgsvKACUX/3qV3HXDIVC4f9ubW2N+lt7e7tSWlqqTJo0Ker17OzsqHGovPjiiwoApaamRlEURfn666+VtLQ05d///d/DY1EURVm8eLECQHnhhRfCr1144YUKAOXll18Ov9bW1qYUFBQol19+efi16dOnK2eeeabW7bHEwIEDFQDKP/7
xj/Br//d//6cAUDIzM5V9+/aFX3/22WcVAMq6devCrz300ENx66murk7Jz89XpkyZorS1tSlnn322csoppyjNzc3h93zve99Thg0bphw7diz8WigUUi644AJl8ODB4dfUZ/zBBx+EX/v666+V3NzcqHutx4gRI5TCwsKoNfyXv/xFARC1lhRFiVtLubm5ypw5cwyvX1ZWFncdRVGUdevWKQCUU089NW5eqX+LvI/q83/iiSfCr7W1tSkjRoxQ+vbtq7S3tyuKEj/HjK6pN7aamhoFgPLiiy+GX1O/p6GhIfzajh07lGAwqFx33XXh19TnfeONN0Zdc8aMGUqvXr3ivosgCHmh1CmCcJl+/fphx44duPXWW9HU1ITf/va3uPrqq9G3b18sWLAgKq0JAFpaWtCnTx/06dMHp512Gu6//36MGTNGNzVDZfz48Thw4AA+/fRTAF2RiwkTJmD8+PHYsGEDgK4oh6IouhENVm699da477bS5emRRx5BeXk5HnvsMeTl5YVfNypqzcjIwNGjR8PvA6BZKK2mpKnvYeX999/HqFGjMG7cuPBr3bt3xy233ILa2lpUVVUBAN5880307t0b//3f/x13jci0n0gveVNTE5qbmzF+/Phwqgwv5eXlaG9vxx133BEVAbj55puRk5MTl+LVvXv3qJqftLQ0jBo1Kup55eXl4csvv8SHH35oaUxalJSUYMyYMeF/n3/++QCASZMm4ZRTTol73Wz+FBQU4Omnn8aaNWswfvx4bN++HS+88AJycnIAAI2NjVi7di2uuuoqHDlyBAcPHsTBgwfR0NCAiy66CHv27MFXX30FoOsZjx49GqNGjQpfv0+fPrjmmmtMf1ddXR22b9+OH/7wh8jNzQ2/PmXKFJSUlJh+Pi8vDx988AH2799v+l49fvjDHzJHX7p164Yf/ehH4X+npaXhRz/6Eb7++mt89NFHlsdghnqfrr/+euTn54dfP+usszBlypSodDcVLbnS0NCAw4cPOzZOgiDEQoYGQXhAYWEhlixZgrq6Onz66af49a9/jT59+uD//b//h2XLlkW9NyMjA2vWrMGaNWuwfv16fPHFF9i0aRNOPfVUw+9QjYcNGzagpaUF27Ztw/jx4zFhwoSwobFhw4Zwy1yrZGRkhOs4VHr27Immpiau67z22mt48MEHcdNNN8WlXGVmZqK9vV3zc8eOHQsrWer/a7X+VVvmsipkKvv27cMZZ5wR9/rQoUPDfwe60tnOOOMM06Ll9957D6NHj0ZGRgby8/PD6WnNzc1c44ocH4C4MaalpeHUU08N/13lpJNOijuTIvZ53XvvvejevTtGjRqFwYMHY86cOdi0aZOl8alEGhMAwkr5ySefrPk6y/yZOXMmysrKsGXLFtx888343ve+F/7b3r17oSgK5s2bFzbU1f899NBDAICvv/4aQNc9HDx4cNz1tZ57LOr9tfr5//3f/0VlZSVOPvlkjBo1CvPnz+c20ouLi5nf279/f2RnZ0e9dvrppwPQr/kSgd48BbrW0sGDB9HS0hL1euycURs+8MoWgiC8gwwNgvCQQCCA008/Hf/93/+N9evXIxgM4ve//33Ue1JSUjB58mRMnjwZ48ePZ8r7BroUiuLiYqxfvx4VFRVQFAVjxozB+PHj8cUXX2Dfvn3YsGEDLrjgAt1ceBZEdEBas2YNrrvuOpSVlcUVpgJdhllnZ2dYMVRpb29HQ0NDuPNWfn4+0tPTUVdXF3cN9TXRXbp42LBhA6ZNm4aMjAw888wzeP/997FmzRpcffXVcZEsp9B7XpHfP3ToUHz66adYuXIlxo0bhzfffBPjxo0LK+giv5dlPHo0NDTgn//8JwCgqqoqqnhb/e+77747bKjH/u+0007j/RnCueqqq/DZZ5/hN7/5Dfr374/HH38cZ555Jv785z8zX4PXeDZD73BEswYPorEzNwiCkAMyNAhCEk499VT07NlTU0m2ipomtWHDBowYMQI9evT
A8OHDkZubi9WrV2Pr1q2YMGGC4TWcPpH5gw8+wIwZM3Duuefi9ddf14wIjBgxAgDCSqXKP//5T4RCofDfg8Eghg0bFvc+9XtOPfVUrkJwoKt4X00/i+STTz4J/x3oKtb+9NNP0dHRoXutN998ExkZGfi///s/3Hjjjbj44ovDLXxjYb3v6vfHjrG9vR01NTXhv/OSnZ2N//iP/8CLL76Izz//HGVlZfjFL36he5iiF8yZMwdHjhzBo48+io0bN0YdHKdG/FJTU8OGeuz/1LkwcOBA7NmzJ+76Ws89FvX+Wv080GVIz549G3/84x9RU1ODXr164Re/+EX47yLX4P79++MiB7t37waAcDG2GjmI7VoWGx3jGZvePAW61lLv3r3jIi0EQfgfMjQIwmU++OCDuI0eALZs2YKGhgamdAtWxo8fj9raWrz22mvhVKpgMIgLLrgAv/rVr9DR0WFan5GVlQUgXukQwa5du1BWVoaioiK89957up7ZSZMmIT8/H0uWLIl6fcmSJcjKygp3awKAK664Ah9++GGUsfHpp59i7dq1uPLKK7nHeMkll2DLli2oqKgIv9bS0oKlS5eiqKgonId/+eWX4+DBg1i8eHHcNVQPbEpKCgKBQJRnuLa2VvME8OzsbKZ7PnnyZKSlpeHXv/51lKd32bJlaG5ujro3rDQ0NET9Oy0tDSUlJVAUxdCQcpM33ngDr732Gh577DHcd999mDlzJh588MGw0ty3b1/827/9G5599llN4/2bb74J//cll1yCzZs3Y8uWLVF/j40ualFYWIgRI0bgd7/7XVT625o1a8L1O3p0dnbGpcz17dsX/fv3j0r/y87OtpxaF8vx48fx7LPPhv/d3t6OZ599Fn369MHIkSMBfNfhbP369VFjXbp0adz1WMcWeZ8i53VlZSX+8pe/hDuFEQSRWFB7W4JwmVdeeQW///3vMWPGDIwcORJpaWnYtWsXXnjhBWRkZOD+++8X9l2qEfHpp59GHVQ3YcIE/PnPf0Z6enrUeRNaZGZmoqSkBK+99hpOP/105Ofno7S0FKWlpbbGduTIEVx00UVoamrCPffcE1e0PGjQoHDxcGZmJhYsWIA5c+bgyiuvxEUXXYQNGzbg1VdfxS9+8Yuo4tLZs2fjueeeQ1lZGe6++26kpqbiV7/6Ffr164ef/OQn3OO87777sGLFClx88cX48Y9/jPz8fPzud79DTU0N3nzzzXDa2XXXXYeXX34Zd911F7Zs2YLx48ejpaUF5eXlmD17NqZPn46ysjL86le/wtSpU3H11Vfj66+/xtNPP43TTjsNO3fujPrekSNHory8PHwoY3FxcbhQOpI+ffrgZz/7GR5++GFMnToV06ZNw6effopnnnkG5513nuahkWb8+7//OwoKCjB27Fj069cPu3btwuLFi1FWVhYVEQoEArjwwgs1z2pwkq+//hq33XYbJk6ciLlz5wIAFi9ejHXr1uH666/Hxo0bEQwG8fTTT2PcuHEYNmwYbr75Zpx66qk4cOAAKioq8OWXX2LHjh0AgJ/+9Kd45ZVXMHXqVNx+++3h9rYDBw6Mey5aPProoygrK8O4ceNw4403orGxMXwOybfffqv7uSNHjuCkk07CFVdcgeHDh6N79+4oLy/Hhx9+iCeeeCL8vpEjR+K1117DXXfdhfPOOw/du3fH97//fUv3rn///li4cCFqa2tx+umn47XXXsP27duxdOnScBvkM888E6NHj8bPfvYzNDY2Ij8/HytXrsTx48fjrscztscffxwXX3wxxowZg5tuuinc3jY3NzfubB6CIBIEj7pdEURCY9TedufOnco999yjnHPOOUp+fr7SrVs3pbCwULnyyiuVrVu3Rr1XbW9rh759+yoAlAMHDoRf27hxowJAGT9+fNz7Y9vbKoqi/OMf/1BGjhyppKWlRbXn1BufVjvSWNT2l3r/02rtunTpUuWMM85Q0tLSlEGDBimLFi2Kah2r8sUXXyh
XXHGFkpOTo3Tv3l259NJLlT179hiORyW2va2iKEp1dbVyxRVXKHl5eUpGRoYyatQo5b333ov7bGtrq/LAAw8oxcXFSmpqqlJQUKBcccUVSnV1dfg9y5YtUwYPHqykp6crQ4YMUV588UXN+/XJJ58oEyZMUDIzM6Puh17r0cWLFytDhgxRUlNTlX79+im33XZbVItgRelqb6rVtjb2mT/77LPKhAkTlF69einp6enKoEGDlHvuuSeqdeyRI0cUAOHWwkYMHDhQKSsri3sdQFxrV3VePP744+HXYu/PZZddpvTo0UOpra2N+uw777yjAFAWLlwYfq26ulq57rrrlIKCAiU1NVUZMGCAcumllypvvPFG1Gd37typXHjhhUpGRoYyYMAAZcGCBcqyZcuY2tsqiqK8+eabytChQ5X09HSlpKREeeuttzTXUuT6aWtrU+655x5l+PDhSo8ePZTs7Gxl+PDhyjPPPBP1mW+//Va5+uqrlby8vKiWuWq72T/84Q9x49Frb3vmmWcq//znP5UxY8YoGRkZysCBA5XFixfHfb66ulqZPHmykp6ervTr10+5//77lTVr1sRdU29sWu1tFUVRysvLlbFjxyqZmZlKTk6O8v3vf1+pqqqKeo/6vL/55puo1/XmPkEQ8hJQFKqqIgiCIPh4//33cemll2LHjh0YNmyY18MhCIIgJIRqNAiCIAhu1q1bh5kzZ5KRQRAEQehCEQ2CIAiCIAiCIIRDEQ2CIAiCIAiCIIRDhgZBEARBEARBEMIhQ4MgCIIgCIIgCOGQoUEQBEEQBEEQhHDI0CAIgiAIgiAIQjhkaBAEQRAEQRAEIRwyNAiCIAiCIAiCEA4ZGgRBEARBEARBCIcMDYIgCIIgCIIghEOGBkEQBEEQBEEQwiFDgyAIgiAIgiAI4ZChQRAEQRAEQRCEcLqxvCkUCmH//v3o0aMHAoGA02MiCMIARVFw5MgR9O/fH8Ggf3wFJEcIQg5IhhAEYRdWOcJkaOzfvx8nn3yysMERBGGfL774AieddJLXw2CG5AhByAXJEIIg7GImR5gMjR49eoQvlpOTI2ZkBEFY4vDhwzj55JPD69IvkBwhCDkgGUIQhF1Y5QiToaGGKHNycmhxE4Qk+C11gOQIQcgFyRCCIOxiJkf8k5xJEARBEARBEIRvIEODIAiCIAiCIAjhMKVOJQudIQVbahrx9ZFj6NsjA6OK85ES9FdomSAIgiAI/0K6CJFIkKFxgtWVdXj4T1Woaz4Wfq0wNwMPfb8EU0sLPRwZQRDJACkXBEEkqi5C8i15IUMDXQv7tle3Qol5vb75GG57dSuWXHuOrxc4QRB8uL0pJqpyQRAEO4mqi9iVbyzyWFZDRtZxuUnSGxqdIQUP/6kqbmEDgAIgAODhP1VhSklB0k0OgkhG3Fb6E1W5IAiCHb/oIryKsxX5FvkdtQdbsWLL56g/rC+PZXXUyDout0l6Q2NLTWPUJIhFAVDXfAxbahoxqjg/6S1TgkhE1I2tvKoeyzbVxv3dKaXfL8pFskNeScJpeHSRMYN62f4+K3OaV3E2k28A8MDblZg0pB/SugV1vyOWSHkMwJYh49R6JgfSdyS9ofH1Ef3JHMmaqnrc9fr2pLdMCSLRYNnYnFL63VYuCH7IK0m4Aasuwvo+QF+htjKnrSjOZvINABpa2jH60XI8MmMYAG2jIZZIeawoCpejxo317KYDyQ9OkKQ3NPr2yGB63wsuejkJgnAHvc1TCyeUfieUC0IcTnol/aAgEO7Bqouwvk9PoZ42vBBL19dwRwCsKM6scquxpQO3vroVeVmpTLJY/V4zIyZWZrsVZXDLgeQXJ0jSGxqjivNRmJuB+uZjuhM8GABCGn9UX7rvrY/RIz0Vowf1oo2CIHyC0eZphEilX7RyIQKZFGAvx+KkV9IvCgLhHma6SABAQW7XGjBDT6Guaz6GZ9fXaH7GaE5bVZx55dah1g6u97Py9ZFjjkcZImXVngNHmMd
lFT+lZiW9oZESDOCh75fgtle3IgBEPTT131pGRiSHWjtwzbIPaKMgCB/BEtbXQqTSL1K5EIFMCrDXY3HKK+knBYFwDzNdBAAe+n6JqRJs1YEC6M9pq5FXFkeuG/TtkeFolIEl/VZvXFbwW20fnQwOYGppIZZcew4KcqMfekFuBm4aW8R8HXWjWF1ZJ3iEBEGIhtebFECXoitS6VeVC/X6sd8HsCkXIlAV4NjN0gu5JnIsnSEFFdUNeGf7V6iobkCnmefoBE7lzJsVxz78pyrmMRKJhZEuwmqAWnWgRBI7p61GXiPlm2hUeVyQkx4nO2PfM6o437E0VT1ZZYTdvYTHaJKBpI9oqEwtLcSUkoK4MP2WmkbNLjRayGhJEgShDY83yUmlX1UuYj1iBS5672XykIkci52oiBNpbVT8T5ihp4uwrjsRqZ2xc9pO5FWVb/e/XYnGlnbbY1O/D0DYiGGJAjmxnq1Ej0TsJX6r7SNDI4KUYCBOuPOG/mijIAh/wLO2nVb67SoXdpFJARY1FrspSiMH9tStz1MJBrrex4rfFATCG7R0EVbspHbqGQx207qmlhZi0pB+GP1oORpbtOswAgBys1LRfKJOw0gmx8pjFkcNj7HEWhtmJXpkdS+JHNPBI21Mn3Gzts8IMjRMMFpgRtBGQRD2EVEMrHcNlvqsG8cWYUpJgStKvx3lwi4yKcAixiIiKvLRvibT+ryQ0vU+1ucmY/E/YR2ZGieosDpQeA0Gu5HXtG5BPDJjGG57dSug892PXdbV4jbuO3LSMWvUKSjqna15n1kcNazG0pqqeuYoKKusmjvxNAzu193yHNGKzBo5QezU9jkxp8nQYEBvgRlBGwVB2ENEMbDZNWRIW5IBmRRgEWMRERVxwviSrfifsI5b5zHwKn0sCvUtE4rx7o46bplnN/LKKm+tfAeLo8bs+wG+w/9YZdXY03pbdiLpRWaNjAzAWmqWU3OaDA1G1AW2+bMGzPn9Vhw6qh/+o42CIOwhojMP6zW8TluSAZkUYBFjEWEkOGF8ieosRHiLG53D7Ch9LAr9T6cOtSTz7EZeWaMPTkV39b4fAMYtXMsVBXVabrLUgMRGNqw6yZyc02RocJASDGDsab3x2OXG4T/aKAjCOiLSXniv4WXakgzIpACLGIsII8EpJYKiaP7GjcYJIpQ+M4XeS5nntbzV+v6K6gbuKKjTcpOlBiSkAPPKhqJ3j3Rb6cVOzmlqb2sBES3oCILQRkTrPr+1/5MBmeSa1bGorWzrm48iPzuNqe2lHk62Hp5aWoiN907CiptH46mZI7Di5tHYeO8k2jt8gNOyRWQLZFWhnj5iAMbQgcKGWI2COiE3VTn2Z8Y23r17pNt6xk7PaYpoWMTJdAsZC8wIwi1EpL3IVNzsJ2RKI+MdC+uhWTxGgpPRB6+9ukQ0rPuu07JFpg5wsSSybmInCipSblo5/M9u7ZzTc5oMDRs4sVF4fRouQXiNiLQX0fn1PBus3zdjmRRg1rHopZpowWskyGR8aeH3+SYDPPuu040TZHWSJLpuYjdVUoTc5JFjLGNixek5TYaGROhNsrrmY7j11a34LaVlEUkAS3vGvMxUhBQFnSFFU6kSmV/Ps8Em+mYsIywFk/nZqZh13ikIBIAxp/bGaE6FQCbjKxKab/bhrYdwugDYaaXPimHqRvG71waz13VqvIf/iRyT03OaajQkgWWS3ffWx0x5mQThZ4xy41UOHe3ANc9/gHEL12K1Rh6rqPx6dYONDWOrG2zkd/O8lxAHS8FkY0sHnv5bNRavq8Y1y/TnjZ+g+WYfK/UQkbJFDzvKn6r02akv0mN1ZR3GLVyLWc9txu0rt2PWc5tN14LImhGR43ICu/UWam3FO9u/QkV1A9c94T38T2TtnJP1aAAZGq7AMvlYJtmh1g4sXrvXqWEShDToCfxYjJQqEZsG6wbrxmZMaGMlhcTvyjjNNzFYLYKdWlqIWyYUI1bvCga6zqiwW7vjhNJ
n1TB1ulBYNoPZaqMGu8YSqxy7bsxAR5pHONkMhFKnHIY1tM06yV78Rw3mTjqNcnCJhCd8dk11A+Ys1z67xqz1np38et4NVtYCzkTHSgqJqDakXiFzwbCfsFoPsbqyDkvX18QZeooCLF1fg7NP6WlLMRPdhMBO+1Ina0baj4dw/9uVjrYKtgJvqqSI1DJWOXZxaaHrZ4wkzMngXufnOQHP5GOdZIdaO2jzIJKGlGAAwWBA94BMwFypsppf78QGS12uxMNS06OFn5VxWQuG/YaVegg3ztEAxCp9dgxTp2pGVlfW4f63P0Zji3XZLhKrOqio+cAix3plp2HkwJ4sP4cZrd8t+l5LYWgkYkEb7+QbVZyPvMxUQ4VKhTYPIpnwSqlyYoO124aQiMeoiJMFP8pTpwuGkwUrRbBuRpNENSGwI0OdKBTm7a7k9Bq1o4OKmg8scqyhpR0XPr5OmG7slu7teY2Gm/l5dgp1eOFNu0gJBnDD2CKma9PmQSQTXilVPEWZThZwEuaw1vRo4Ud5ajbfAJpvLFiph5AlmsSjz9iRoaJrRozSpXjGJQq7OqjI+cAix0Tpxm7q3p4aGm4WtLnd1cDK5Js7aTDyslJ130vKCpGMeKXE82ywTnftSDasOIViizh//1/noyAnPSGNP5bOR9OGF9J8Y4C3CFaGaBKvPmNXhooqFF5dWYfRj5ajsaWd6f1Or1EROqjo+TC1tBB/v2ci8rO1dUERurHbzSQ8TZ1yKwT5/s79mL18W9zrLIU6VvP2rEy+lGAAj102TDOkSMoKkax42d+cpyjTyVOkkwk74fzYVJP50870rC++06idj55dX6P5dxFFyckCTz2Ek2cOsOgbVgqPRchQuzUjvOlSKk6uURE6qDofjK7Dayx9tK/J0doVt5tJeGpouBGCfH9nHeauiDcygO8W231vfoweGakYfWqvqAltZ8OzKoxIWSGIeLxcFzwbrOynSMuO6IPBElmedoYUvLvDOCLv165aXsBaD+GU44NF37BTeCxiLVitGeE9jA7oKnz+xYxS4Ws00pjbc+Bbps8Y6aApwQCmDS/UNfgB/uii07qx2+l/jhoaZta50yHI1ZV1mL18q+n71MO/Ihe13Q0vUhjFogqni0u7FJLY+0LKCkHE4+W64NlgZT1FWnac6uaTqPKUWtzyI6q7pWgDllXfsPvM3V4L6v3etPcg12F0+dmpqPjZ95DWTWx2v5Yxx4KRDspi8L+7ow4/nTqU+T47rRu7nf7nmKHBYp1b9fqzCAt10+JBXdRPX30OFqwyzl/Ti4LEkpuVikOtMSGwE5bGC5tq8cKmWs0oCSkrBBFPMq6LRGz9rYWTinMizhtZipL9gugOO6KUdh4DW8Qzd2stWFXqAwAemTHMESODN3WLJQ2O5bBlXrnlZHqeG9ePxRFDg9U6txKCZBUWvMe5A98t6nnvVKLBpFhJKwoSidGkVmJetJoWQBBEYpOIrb/1IMWZDxmKkv2C6JQ8FRFKO4+B7ZdnbrUew8l0Kd7ULdY0OCfkltN1iW7XPQrvOsVbzc7TzYCnHZfVzUgBTI0Mre9+f2dduEvKpr0HMf/dfzFPaieq/AmC8Dduth+UAb8oUbJALZXZcLvDDi88iirrMx85sKdrrfxjsaLUA9+lSznhQLHieGbtqOWU3BLV6cur60ciPKJhJfzNEoLkzd91azNSxzN3xVbYWct282mTJb2CIJIBt04flgmvu/n4DS+7sclM7LMOhRSpa1l4FFWWZz5teCEufHydZ1FQXqVeHbcT6VIqrMbc3ImDMLhfDy4Z4aTccrqmxq2aHeGGhtUwklkIkteAYTnO3Yj87FQ0tXQwf1aUw8BKJCaZ0isIIhlIxkJfL7v5+JVE7qplBa1nnZepfzZVJF6l5PEqqkbPfNrwQixdXyM8RYwH3vvoxlxlNebGntbHUv2X02lOTsp4N2p2hBsaToWReA0YluPctVAX9byyoZizfBvXZ0XAe1+cyj0
lCL8gi7da5DiStV7Bq24+fiZRu2rxovesDx3VP48gEq9S8qwoqlrPfOTAnrjw8XWeR0FZ7+PciYMw9rQ+rsxVFmOuX046QoqCd7Z/xb2GyOA3Rrih4VQYyYoBo/fw8050gjJa1FNLC7EkGLDUNcEqvPm0bqRXyKLEEYQWsnirRY8jmesVvOjm43eZlohdtXiwWhcAiO+wYwUrimrsM6+obpAiCsqqA9455QzX1p2ZMacAOHY8hGue/yD8Oq/8tiK3kkW/Em5oOBVGsnMAntbDX1NVH7eo87PTsGD6dx0P1M9urm7AnOVbmT0jVuG9L06nV8iixBGEFrJ4q50YB0vqZ0FOesIW+rrdzSeZlfREwEqxLyBXLYtdA1uWKKistUN6xpx6BEHsMQRW5DeP3Eom/cqRyhsnqtnVyQt8N1lVzCav+vCnjxiAMYO6zr2YWlqIeWVDkZ/9Xf5mQ0s7FqyqiurmkhIMYOzg3njs8mG6nR5EcNPYIu774qRgSbaON4S/kKWTDM84OkMKcycYI3mncux4CGuq6m2NP5GRRfEinIf1GcbWazjRYccMIzmgpauw4nUUNPJ35Wam4emr3eloxMPU0kJsvHcSVtw8Gk/NHIHf33Q+MrqlaL7XyX0k2fQrxw7scyJvVGQe3OrKOsxZvo3LC6l1+F4gEH8uhhUmlxRwf8YpwZJMKQeEP5HFW806jsVr92Llh59zea9UeXffWx/HH/oJ4FBrB259dSueufocXHJWYnnAROC14kW4B+szfPqacxAMBDxLVXHSi+32IWyR6P2ueWVD0TM7XarUoMioQ0V1A+oPu7uPJKN+5ZihATiTNyrCgOF90DyH7/FiZ/E7JVhkUeIIQg9ZvNWs119UvjvuNZbQ/JSSAsx/twqAftrm3BVbsRhn45Kz+jONJVnwUvEi3IX1WY8+lS9KIBKnUz29Slky+l1zlm/DkmvPwfQRA4R+pyi82EeSUb9ypmmxw9gJLwLsD3rRmt3ch+/FkpeViqw07dCcKgwuLu0ynHjDc3bSyYyQRYkjCD1k8VbbuT5LaH5LTaOhxw3oaq09e/m2hAu328Up+UjIh+zP2q1UTzcPYQPkSWG1ihf7SDLqV54YGjy5yk7A+gAXr9uLa57/APWH2yx/16HWDrS2d+LSswrj8kMDJ2TeC5tqMeu5zRi3cC23suCEYJFFiSMIPWQ5FdlsHGZEeq+04NlsZN3QvZT3bitehHfI/Kx5vNh2ia1DWHHzaGy8d5InJ25r/S6v9b9IvNhHklG/cjR1SgsZKu29eIAf7WvClgcm46N9TSivqseyTbVxh/xZDaGKroehlANCdmTpbMLSNpEFPYOCR1bJGG6XQd7TORPJg6zPWrQXW22LWn/4GBq/bUN+dhoKcjPDv9Wtdse8v0sGeRCJF/tIMupXrhoadnIUI/sN9+6eDijAwZY2S4LE7qnhVqhrPoZXKmqRn52Gt7fv13yPnUIgkYJFFiWOIIyQ5ZAko3HMPO9kLCrfY3oNPYNClVWsrTtlCrfL0n4YcKZeMFl64PsNGc8UEenF1lLWVWR12vbtkSGVPIjE7X0kGfWrgKKYlzMfPnwYubm5aG5uRk5OjqUv6gwpGLdwre6GqVpxG++dFHeDjRYWYG1xqZMecPfkb1ZW3Dzac2Epm/eB6ELEevQCp8Yti8KnNQ4AGLdwran3SkvuqayurMOtJ2SVGTLIDcCevPcDfpeNJEOsYVXWqOvBjhwA9I332Gu5pbSz/q6/3zMRFz6+Tmp54PY+4ncZArCvR9ciGlYr7VkWlhWLWM+KlQUZPJOyhqEJIhJZPJh647DrvZpaWohnrj4Hc1dsjUu3jLyWTOH2RO6sIqtnlnAWLcUwPzsVP59eatrxTYQXm/X0cwXutUdl/V0f7WuSXh64vY8kk37lWjG4lRxFnoUF8BdDRhZNzZ04iPlzbtA7O93rIQCw3+GLIJIdEUWql5xViMWzztb8m4zh9kTtrOL3LjuENfQ
OWGts6cDs5dtw40tbTAub7coBntPPRRWWs8DyuxJVHtglWfQr1yIaVnIUeRaWVYtYfdAjB/bEM3+r1vUYasFT7MlNYs43gkhKRHivLjmrP34bDHhek8JConZWSeRIDaENi8Nz7SffYO0n3zAdwmlVDvAq4W4q7Wa/K1HlgVVE1hz7AdcMjZEDeyIYgKEiHwx0vU/FykKxurg+2tfEZWSkdQsiNRhAS3unpe8z4+C31lvqEgQhHyJC834JtydqZxXyzCYfvJEEs/Q5q3KAVwl3W2k3+l2JKg+s4ETNsey4ljrFosiHlK73qVhZKFYXF+/G0H485JiRASSPZU8QBB9+CLfLfoCaVcgzm3xYMRqdSJ/jObPHjTOEeEhUecCLXgpeJGqtVyIdwCp1jQbvYVh2FpdTG0N+dhrX++0cECPTQTgEQSQ3Mh+gpsIrM2U5KJJwj9qDrVzv5z18j3UORirrRgQgp9LuB3ngJE7XHMuM1DUa6sJibe0487xTTLs26KUcjCrOR15mKg4d7WD6LlZ+MKI/XthUy/x+BdaERCK0SiMIIrGQOdXLisxMxh74yczqyjo8Wb7b0mdZnKu8c9CsW6bse77M8sBp3Kg5lhXXDI1RxfnIy0rFoVZtRV4vR29qaSFuHFvEpKwX9c7S/ZvZgk4JBnDD2CKmw7V4mFJSgHMH9sTcFduYakDyslIxpaSA6zuo3SJBJCeynCFihCzthyOxIzNlOSiScBZWD7QeZs5Vq3MwUlnXOxlcZmSUB27gZs2xbLhmaKypqtc1MgBjT/6UkgImQ0NvYbMu6LmTBuPFf9QajpMHNYSeEgxgMQKYvdw8MnOotYPLijVrt2j1pHGCIOSGopjWECEzk9kzmyzweKAjYSlstjIH/eBU8MMYI3FzvG7WHMuGK4aGuqiMMPLk2+lYwLugH7tsmOkBgaxEGk6XnFWIG/exRWZ4rFhqt0gQyQdFMa0jSmYmq2c2WbDiTWZNn+Odg35wKsg2RjMjwu3xmumxkSRaFy5XisFZPAOqJ18Lno4FsYVVm6sbmBc08F1YvDDXniV509iiqMnaGVIwIC+T6bM8Viy1WySI5IIOjbNHoshMav7hLFa8yQW5GXj66rORm5lm+Fx45qBepyKZuhPJNsbVlXUYt3AtZj23Gbev3I5Zz23GuIVrw+PwYrxGemwkiVjr5UpEQ4RgZ8mL1bJQ8zJTub87Miy+pqoeK7Z8jqMdIabrqEyOiM6Y9U1WsWLFUrtFgkguKIppj0SQmbJ5jxMR1kyKX14xPHzYWlNLOxasMn8urHOrd/d03P2HHVKnRrNkjcx/91/okZGKg986fyidWbT36avPxoJVuzy5p2bF/EBi1nq5YmiIEuxGebF6k4u1i1Tsd6th8TGDemHYgFzc+foOpusAQK/stPDBg3rjisWqFUsH4RBEcpEoHnmv8LvMpLQ5d2DtMDZ2cG8AXc9lznK258I6B6FAeqcCi+Oj/nAbrnn+g/BrThnFLEbPg+9UorHFuF7YyXsaq8fqnQzut3oXI1wxNEQKdq28WDvdIcy+uzOk4OC37VzXbGhpx4WPr8O8sqG6lnMsVq1YardIEMlFInjkvcTPMpOaf7gLa4cx3ufCOgcPtrQxjdNLp4KV73bKKGYxeoyMjEicvKdm9V1uRCzdNGSEGRpGgxYh2I2ub6c7hNF3s6Y8aVHffAyzl29jeu+8sqG4fmyx5YdM7RYJwn2sCGoRwt3vHnkZ8KvMpLQ592HpMGblubDMwYrqBqYxeulUsPLdThnFIo0Dt+5p7J7Q1NKGOcu3ORqxdDv1UoihwTJoO4Ld7Pqskyv2QD6j72ZNedKD53O9e6TbXmjUbpEg3MOKoBYl3P3skZcJP8pMSpvzBjMPtNXnYjYH/eBU4OmmFIkTRjGrcZCfnYamlnbP76nWnhAMaOuPoowzL1IvbRsaPIO2IthZrs86uZ6+5hwEAwHT77Z7UA8voixnM2GYSDl/BOEVVgS1aOF
u5LiZV1YS7nrDss6TWS74rUUtpc3JiZ3nYjQH/eBUMBojCyKNYlbDbF5ZCeYs9/ae6u0JRs3j7BpnXqVe2jI0rAyaR7CzXv/v90xkmlyjT+0VdfPU9oCxG6zVVCxevLacqUsJQfBh9aAtJ4S7luOmqaWNqeuNCskFf+EHD3cy4uRz8UOaH0s3JT1EGsWshtnU0kIsCXp3T+06s60aZ16lXtoyNJweNOv1P9rXxG31G22wbcf5Wtmy4ERtCivUpYQgxGBF5jkpJyMdN11db9hze0ku+A8/eLj9jNX91unn4oc0v7huStnp+MkfduDAYXeNYlbDzMt7ateZbdU48yr10pah4fSgea4/fcQAZqvfbIO9Y/LpzGMMBvRDXZFhulgvo4jaFBaoSwlBiMOKzHNDuLOs8wfersTR9k4U5GZi5MCeJBd8ih883H7E7n7r9HPxQ5pf7BjnT/PGKGY1IvTuqdPppFZlvV3jzKvUS1uGhtOD5r0+y+Ri2ZBXfvg5CnLSceBwm25oKy8rFU/POgfNR9sx50R3KaMw3UWl4mtTWAQXdSkhCHFYkXluCHeWdd7Q0h4+Dyg/O9XTXvKEPfzg4fYTovZbei7ReGkUWzXM3EgntSLreYwzPUPJq9RLW4aG04O2cn2zycWqeN85eTCeLN+ja4k/dtmw8EE9S4IB04XkRG0Ki7eRupQQhDisyCQ3hDvv+pWhlzxhDz94uP2A2X4LAPe//TGOdoRQkGNuONBziVd0/37PRHy0r0l648utdFKWTl2x2TKsxpmZoeRF6qUtQ8PpvEQnrs+6cRb1zma2xEV7MURGIahLCUGIw4pMciOv3qn1S3KBSHRY8uUbWzpw52vbAVCzBDOMFN3pIwZ4ODJj3EwzZ+nU9ev/OBu9eqRz6ZSshpLbUSbb7W2dHrTo6/Mo3mMG9WI2IFi9GCy5fyKjENSlhCDEYkUmOS0nrfay18OPciGZ2/QS1uGN2lGzBH383GDC7TRzs05dv/jzLi7jjMVQmv/uv9AjIxVtx0P45ZXDAQU42NLmj5PBnc5LFHl9XsVbZBiUNfdPZBSCupQQhHisyCQn5aTdXvaR+FEuUJtewiq8UbtEa5YQa6CPHNjTUpqT3xvPsBqcm/YeFCa3p5YWIhQCZi/fGvc3J+px6w+34ZrnPwi/pspIp1P9hBgagPN5iaKu76TibbRgaw+24sny3UyWvugoBHUpIQjxWJFJTspJq73s87PT0NjSHv633+SCn72ohPdYiQYmSrMEvZOpI2sDtAx2reih3xvPsBqci9ftxZtbvxQiIztDCv7nvSrNvzlVjxuJWzJSmKHhJ5xQvFkWrBZak8kJY4i6YRBE4hO5zusPH8OC9/6lW/itOiz8Uqiphd+9qIT32IkG+rlZAuvJ1HUxyqhe9PDi0gKm75X1nvEYnKIU9MVr96D+sLv1uLHXd0NGJqWhAYhVvK0cJR+J1mRywhiibhgEkfhErvPM1CBue7UrLK/nsEjrFvStXPC7F5WQA6vRQCvKnQy1RLwnUyvoUkZDIWDOcu3o4QubapmuJWuDCR6DU4SCvrqyDovK9zC9V0Q9rh5uyMikNTQAMYq33aPkI4mdTBSFIAjCDomeNkntuwlRREUDm49iwapdaGppF9pERZZaIisnU9c1H8OD71QatgE2wg8NJngMTjsKuqo3smK3HpcFJ2VkUhsaIrB7lHwkWpOJohAEQdghkR0W1L6bEElUNDAtRWj6sky1RFaVyshaLiv4ocGEKi8XrfkUi9dVm77fyr3k0RsLBdTjsuCkjPTM0JAhfCgCEVagHyx9giD4kUXOJarDgtp3E04hMhooWy2R24Z3MAAsnuWfpgwpwQDGntaHydCwci959Ea79bi9s9Pxkz/swIHD3slITwwNWcKHIrC7YNXpM/O8U/Dezv2+NroIgviORJJzspLI7btlMVKTGVHRQNlqiUSfu2NGSAF6Zqe58E3iEOHE0FvDrHrjnZNPF1KPO3+
atzLSdUNDpvChCNTJaDV9Ki8rFQqAReW7w6+RMkIQ/ibR5JzMJGIdChmp8iAiGihbLVFKMIB5ZUMxe/k2rs/lZ6fp1q2Y4bc6KbtODKM1PKWkAAU5GYYdpwpy0jF30mmWxx9r5Dx99TlYsMobGemqoSFb+FAEKcEApg0vxLPra0zfq07WOycPRlHvbNQebNHsOkDKCEH4l0SUc7KTSHUoZKQmHrLVEq2urMOCVbu4PlOYm4F5ZSWYs9xasbEf66SsOjHM1vAtE4px7Hin4XfPGnWK5XHrGTnzyoaiZ3a66zLSVUNDtvChCDpDCt7dUcf03sjJ2RlSMG7hWs33kTJCEHzIlGaSiHLODyRCHQoZqe5gR15Y+axMtUR6SrAekd77qaWFWBKMV7yNzgzze50UrxPDbA0DYHJMLyrfg5UffsEdcTAycuYs34Yl156D6SMGMF9PBK4aGrKFD0XA2j1gXtlQXD+2ODw5SRkhCDHIlmaSiHKOcAfaF8RgZAzYkRdWPytLLRFLO/5YoyHWe6+leDe1tGHOiTQsP9ZJmRmPPE4MkZ1IeaOYsjoqXDU0ZAsfiqC8qp7pfb17pEc9WFJGCMI+MqaZJKKcI9yB9gX7GBkDACzLC7uyRoZaIhYlOKR0OUZ790jX9d5rKd5LggFf1kmJdlSJXJu8xoGsjgpXDQ2ZwociWF1Zh2UWT8MkZYQg7GHXe+NUulWiyTnCPWhfsIeZMZB7ovlKLGbyQpSn2OtaIlYluHePdO70Gq9/mxWccFSJXps8xoGsjgpXDQ1ZwociYD3ZUVUqRg7siYrqhvACHDmwJykjBGEDO94bJ9OtEknOEe5CRqp1WHLjD7V26H7eSF6I9BR7WUvktCFr97e5WWvnVJqRU62DWYwDWR0VQVe/Dd+FDwtyo39oQW6Gr7ppsObhKQCmDS/EhY+vw6znNuP2ldsx67nNuPDxdZg2vOu3xk5hUkYIwhyr3hvVixW7flUv1upKtuYORiSKnCPcRTVSAdoXeBGVG68lV2T1FPOiKsF6sycAvpOoRbK6sg7jFq6N0pPGLVwrRB5rwWM88sCyhq3AYhzI+nw9ObBPZIjNq24zrAJl0pA+WLq+RjM0t3R9DW6ZUIx3d9T5Lq+RILzGivfGzWI5P6YS8CJTty8j/DJOQI5cfj8iSsnXkiuyeop5kTXaKjqFiWW9O2k8Gq3hacMLsfRE1ynWiEd+dipGDuyp+/fI3zvzvFPwZPluqZ6vJ4YGICZ86GW3GVaBsv2LZkOl5t0ddfj7PRPx0b4mX2yCBCELVtJM3C6WS4SWq3rI1u1LD7+MM5JkMFJFY1fJN0pLS6SUNtkMWdHOH9b17rTxaLSGzz6lZ9wYjWhs6cCFj6/TfD5avzcvKxVAdKqgl44KzwwNu3jdbYZF8PTMTkVjS7vuNVSl5qN9TQmrjBCEU1jxziVKCoTXeC1/WfHLOLVIZCPVCVj25LysVDS1dnB7e81kjQJg5nkn472d+5mMQq8jbDIZsiKdP0br/dZXt4YPS3arTlZvDWu3CG6PO7k79jfEyiy939vc2gEFwBXnnISs9BQMzM/Cf44pQlo316slAPjU0JChVzCLkjNjxACmrlSk1BCENXi9c4mSAuElMshfFvwyTkIMLHvy9RcUo/loO/64fX+UE5DF26sna3JPeI8Xle8Jv2YUMZMlwibSkLVjONUfFuP8YWkGEPuM1DQmL9KMtO7/5JJ+GP3oXzUd1LEyCyf+2+j3vrH1y/Brz2+soYgGD7L0CjZTcnIz05gMDVJqCMI6PN65REqB8ApZ5K8ZfhknIQ69PTnvRFvbReW7w6/lZ6dixogBmFxSwKwYx8qa2oOteLJ8N3PEzItaBKexewDigvf+xfQ9ZnoSbzMAGetkP9rXxJQFoxao8/5er6K4vjQ0ZEp/MFJyOkMKKTUE4QKs3jlZiyH9hEzyV8T3ez1OQizxxkBLlCdbpamlAy9sqsV5nMq5Kms6QwrGLVzLHDH
zqhbBSewYTnqfjYVVT+JdxzLWyTops7yM4nqTsGUT2dIfVMEzfcQAjBnUK/wAqVUhQcgHtZ61h2zy1+73ez1OQjzqnnzpWf2x8sMvNN+jKrgP/6kKnSH+Ew9426OKbKfK2qK7M6SgoroB72z/ChXVDZZ+px5mhpMCYP67/9L8TqPPRsKjJ1lZx7F1srE6nNvwyCw7v5e3Za9dfBnRcCL9wakQpGwdHgiCkKsY0m/4Jf1MtnHKkOaSbDiZPsfrfRblrWaNjIRCChas2uVYxIMlVan+cBsWr92L2ycP5v4sAORnp+EXM0qZxmvnoDxZopq8Mssvv9eXhobo9AenQ5B6Sg2AqNPCIzcetzYl2vyIZIW6+ljDL+lnMo1ThjSXZMTJVBTeiJmoCBur8TR7+ba4v4nM02e9Z4vKd+OMgu5R38f62QfLhjKP02i9myFLVJNXZvnl9/rS0ADERQrcan8Yq9QYbTwAXNmUaPMjCOsks5Hul0itDOP0c4tdv+Nk+hyv91lUhM2ON1pknj7PPYv9PtbPFuRmco1Jb73rIUv0NRIjmTWvbChyM9Pwzvav0LdHBqaUFPji9/rC0NDb0O2mP3jV/tCs17MWojcl2vwIwjp+NdJFGkd+ST/zcpzUYtdbnEyf4/U+i4qw2fVG66WL8coG9d6yKLix3+fkc9HrDAbIG32NhfWcDXXP2XjvpLjmB15HcSOR3tAw29DtpD940f6Qpdez3lhEbUq0+RGEdfxqpDthHMmefharPF16Vn9XZRq12PUWp9PneCNmIiJsdmoRIomMjFiRDeq91XOOGn2f088lVi6dUdBd955PKSnQTWH3ksjfsLqyDnOWs+85ZxT0kCraLLWh4fSG7kX7Q95ez5GI2pRo8yP8iAypSn410v1qHNlBhqiTm3uMDOtDRpxOn+ONmNmNsLGcUs7CngNHUFHdgKaWdi4lNva33Dl5sGb74FhiIzFupjXq3fM1VfUYt3CtlJFpdT3XNx/FglW7uPYc2aLN0hoabmzoXrQ/FLGhsHSlMJpg1F+ekBW9uSuD0gj400j3q3FkB1kMK7f2GFnWh6w4rXjxRvbsRgKN8/hLsGBVlWnEY/G6aixeV41gQNs4YZUNcycNxootX+ie8G2UBmX2XEQaz1p1sjLICC201rMeenuOTNFmaQ0NNzZ0L9ofijBajK7BsuFQf3lCRvTm7rThhVi6vkaKDcGPRrrfjCO7yoVIw8ruWNzYY2RWmGRCJsVLBEZKejAI5m5ERkdrsMiGlGAA86d1RVjUz6iwpEHpPRce45l3ncrsfGE9yDAWmfacWKQ9sM+NDd2LA/XUjcfKFQPoWmh6mxLrIT5mYzD7HoIQjd7crWs+hmc1jAzA/oFbVvCjke4n42h1ZR3GLVyLWc9txu0rt2PWc5sxbuHasOxiQdTBaCLG4vQew1Lz5+b6IORAjXjkZqUKuZ6ZbBB9CCqrLqO+l3edijw8USSsBxlqIdOeE4u0hoZbG7qVBWLntE2jjccMBfqbEs+Gw7P5OXmyKEEA9oSr2xuCH410vxhHPMqFESIMK1FjAZw9iV5WhYlwHhYFu7m1Q8h3sciGqaWF+Ps9EzGvbCiuGzMQ88qG4u/3TOSe3zy6jNV1KqvzxUoNr4x7TiyupU5ZbZ3mRloTT/6miFxY3l7PKjeOLdL9Dt70CJZCLMr7JdzAToMEFbc2BJkOgWNFthOytWg/HsL9b1cKSWWwa1g5kVbhVI2ArAoT4Sxm6XJPX322bgExDzyyQUtfeH5jDbe+wKrLbK5usLxOZXW+8K5TO3tOpE7eOzsdCAAHv21zpHDcFUNDawLmZ6fhByP6Y0pJgeaP4tnQRRQMseRvisyFjdx4Nu39BovXVZt+ZkpJge7fWCfopr3fhO/TlJIC3c2P8n4JtxChBLm5IYjuluJ0tyDZjaPVlXW4/+2P0dii733lqSOxa1g5VdPiRI2ArAoT4RwshvCD71QaricWeGSDSH2BdT+o+Ow
g0zp9aVMNevdIj5KtsjpfeNep1T3HrNhctEPZcUNDbwI2trTjhU21eGFTre6PksnrzhLOu//tj3G0I4SCHH1lQUupGFWcjze3fmVr0rNO0EiDxqiwStZCKSLxsKMEebUhiPJQuyW/ZDghWwvewkcWJcSuYeWnKIGsChPhHCyGsBUjIxiILgxnlQ2i9QX2/YBN1i5YtSv835GyVUbnC88ZKfnZqfj7PROR1o2vAoJF5op2KDtqaLDmXtcZ/CijDd1NrztLekdjSwfufG07AG1lwUipsDvprRzio3ef/NalhvA3Vg+g8tobb9dD7XbU0MkWn1aiMlZqc1iVENWwmv/uv1B/uC38er+cdMyfdqbhffVTlED2aBUhHqcM3MWzzkbP7HRu2SBaX2A1nscM6oXF6/aaXi+SWNkqm/OF5xDExpYOfLSviWsPYpW5oh3KjhaD8+Ze63XHUDf06SMGYMygXuF0KTe7bfAu7thiJLOiJQC2CgatFJnr3Sc/efQI/8PSnCArLSXuc3lZqb5N4fOqW5CWLLWL1e5MPPuD9YJHvRmlj98K/p0sNifkg9XAzc9OY77mnZMH45Kz+luSDaL1BdZmNaNP7cXdwTNWtk4tLcTGeydhxc2j8dTMEVhx82hsvHeSp2tmamkhbhxbxPReXh2MR+aKbCThqKHBcxN4f5Tb3TZ4vVeRE7r9eIhJqZhSUmBr0uttOGbjjL1PfvLoEYmB3tzNO9GesbW9M+4zTYI6qnhBonQLstOdiXeT5PHMq+OKPUTswGHzcXnR9twuMipMhDOwGsI/n17KfM2i3tmWx8OjL7B2sWQxnq128IyVrU44X4xguQdG9biR8OpgVpzDIhzKjqZOWVFERVvHorzuVtI71An9SkUtV2jR7omhkekRew58yxRejLxPlPdLeEHs3O3dPR0/eX277vv9XCuUCFFDu7nZrPtDr+w0/GJGKaaWFjKlaInIGZcxrcKMRDuQjtCGNV1uamkh7vz6dCwq3216TTtOQ1Z9oamlHeMWrmWuR2NJ9bTawRPwRray1uQ5pYNZec4iHMqOGhpWlHPR3nRRXnejxW3GvsZWpveJmviRG05FdQOToRF5nyjvl/CK2LkbmV8fi59rhRIhamg3N5tlf8jPTkXFz76HtG5B5k1aVM64kzUtBGEHVkN47qTTsGLLPl05KsJpyKIvTBteiDnL+evRWIzn2HV68EhbVAG4HmqExa31zVOT55QOxqOTi3QoO5o6xRPa4s179SKP1kpqEgCc3DOL6X0133wb/m9RB+VZvU+U90t4TSJ4/fXwWx2AFqz3/c+VdZoyzCxFKQDgkRnDwkYGa4qWyHnjdloFQbDCki6XEgxg/rQzw+spEpFOQyN94emrz8a7O+ocrUeLXKfXjy1mkq1NLW2WasusYKUmzwkdjFUnF+1Qdry9LUtoy8qP8srrHmk91zcfxYJVu9DU0m4Y3hrSrwfTtZ/8614MKcwBAGEtL+3cJ/LoEV6SCF5/PRIhash631+u2IeXK/ZpyjC9/aFfTjpmjToFbcdD2LTnIOa/y54KlcjzhiAiYfX4u5EGqKcvuN3Fkj3Css21jn9W74ETOhiLTi56brhyYF/kzSqvqsfb27+K6vNs9Ud5lUcbubgz01JMlYV1u79mvvbP3vpYs8jVzgKwc58o75fwikSvFdJblz2zUzFjxADkZqahM6RIa2ys/aSe6/16Mix2M6092IoVWz7HovI9TNeN3aQTfd4QBC9uOQ219AUvItNGOs+8shIsWOXuOWF27oETOlhcPWQinAwOfHezxgzqhfvLSoRNeDsLSER+nlm/9iklBbj/7Urm6+l10rG7ALQKbaEAB1vaUFHdQJEKQjoSwetvRuS6XFNVjz9u34/GlnYs21SLZQaHmXrN+zvr8NyGWq7PGMkwdX9YXVmHJ8t3c9XAqaibdDLMG8Iabubky4ZXTkOvIowiIizq++3OFxmjrG7OB9cMjUjMfiCvMLByw8S
fyBs9vvZOBaFQV8issaXdwvXisRtijNzM7/7DDsdPIyYIu/ix+w8vKcEAmo+248VNta6F8u3QGVLw4DvszpNIjGSYlQP8IoncpJNh3hB8iN/zCRa8jDDaibCsqarHXa9vFzJfkj3K6omhYYTTwqAzpGDx2j2aYXkrm7peJ4HGlnbMXr4V3xvSx/aYY7ETYnT7NGKCsEui1wqJaMfq5Ni0PIJ2nSdaMoz3gNdI9BpaeBntJuRBxn0vWeaYbBFG1qjBC5tq416zOl9kuwduI5Wh4bQwWF1Zh/nvVsUd4qTCu6mzeOD++sk3lserh9XwmswKDUEYkci1Qm4XS7Ki5/S5pJTtMCkjDh5pi6s/seNAOdrRiTVV9XH7gxzRbsJLZNz3km2OyRRhZGnxGgwAWk2w7MwXme6B20hjaDgtDPSMGK3vYt3UWT1wgRMmLEvf4tysVDS3djgSXpNVoSGIZEbGNr5GTp9lGp4+Xhas2oXnN9ZEbbB28pObWzuEOaNk83wT9pBt30vWOSZLZNosuqBA28hQsTNfZLkHbuPoORo88AgDXqzk/rJs6qwbv6J8ZyzpUXiiN/Jjlw0DNN4rIrwmo0JDEMmObIWCLD3fReyLdTFnYLCcLaL3N6N+/KxnElnpda+HqHOQCPvItO+JnGN+RJZzaYzOqLhpbBHTNazOF1nugZtIE9FwUhhYyf09eKQN72z/ytDi5Nn4bxxbhD9X1keNo1d2GqaP6I8pJQVR3+FUeI11vHsOHKFOVAThErIVCrLIS1F6kALg/rc/xtGOEApyMjCvbCjmLN8W52mExr+1rlXXfAwvbarB9WOLkRIMcKWoiPJ8J1tajOzIZMjLFl1JZoy6UrFEbdX5kiy1NnaQxtBwUhjwGifBAKKOsNfbJJpa2hAIdEUszJhSUoAHGNv6OhVeYz1+fvG6aixeV02bI0G4gGyFgqzy8oYLBuKlf+yz3CVKpbGlA3e+th0AUJCTgbKzCrFxz0EcOqrd6tsMNS1r2vBCLF1fw5yiIsLZlaxpMTIjkyEvU3SF0K7h4pkvfnAqyGAISZM6xRI21+oswgKvcRLrrauPCfF3hhQ8Vb4bs5dvYzIy1HHHhswA6IbXnQivsR4/rxL7uwkiGfAi7cUolO+2csoqL/vnZdo2MmKpP3wM7+2ss2xkqNQ1H8OzGkYGoJ+iYtfZlexpMbJitO85YcgbyQ+ZoiuENqzzZU1VPW57dWtchEomvWl1ZR3GLVyLWc9txu0rt2PWc5sxbuFa18cmTUTDSa8eqydfK1wPRBejh0LA/7yn37lK65pa4/bKEmY5fl6FOlERyUCkx0c9lTpyfbvloZKlUJDVo2fXGPASrRQVu55vSouRF5aOPyI8v2b7ukzRFUIfs/kypaQA4xaulaqTWSwyRVelMTQA59p/GRkxKhmpQRzrCOleQ90kZi/fyvy9+dmpeGTGMEwpKUBFdUNYgDW1tGHO8m2eTYBIhWbT3oNYvG6v7ntpcyQSGS3FIBY3BbMMbXxZnT6VXx32YHRiiUxRsevsorQYuTEy5EU4/lgVO5nSJGVChhSfSIzmS0V1g9ROBdboqluGkFSGBuCcV0/PiOmZlYqm1g5DI8Mq8y49EwAwbuHaqO9kiZw4PQFUhYY2RyJZ4Wl5LYOHyk305GW/nHTMGnUK2o6HkJuZ6uEIxRCbomLk7Jp5Xtfv1muUQWkx8qNlyIvw/PK050/m8xT0kLXWQc/x44XexGOIsTT0cNMQks7QAJzz6sUaMb27p+Mnr28X/j0qnze04sny3VzdU1RLePNnDRh7Wm/HxqZCmyORjPC2vPbaQ+UFsfJSTStbVL4n/B7WZhiyYZSiEv+7W0787t3h92gpQZQW4z9End/FmzYnS5qkV0Snq7ZEyRQVmRsouK038RpirAbOmqp6V/YzaYrB3SKyyDoYCKD+cJvw7wgAKMhJx4otn1sulpzz+614f+d+x4tSnSzCJwhZsdLyGki+yJ4qL9O7BfF
k+e642jS/GhmAcYpK9O/eE7dPaBV8ul10TNhH1PldVjzcfjpPQWSDjNgCZS0jA+i692r767e3yXUejZt6kxpx4yk6ZzVw3tm+35V7KmVEwy2cVBpmjTpFdwGxcOhoB2Yv3xb1mhOhRNlaaxKEG1hd+8kY2WOJ/gQD0d36emR0w5Fjxx0fmxVYU1SseLspLcZfiEqBSeTMAJFpTazpqpFEtr+WIZ0KcE9vshpxG1Wcj/zsVDS2GDfsaGhpdyVKn9SGhhOLPjezGxZefhbajouv+XAqlEibI5Fs8K59o7QX2YoYeTEbv5UD/GQzMh64ZCj65qRzPR+rXaSSPS3GT4gyEBI1bU5k5yLedFUtZEqnckNvsiqDUoIBzBgxgOngQTei9EltaLC2veXh8NGuDdYJI8bJbgG0ORLJBM/aN/JQyVrEyIrW+POzU/Hz6aW45Kz+ABIjXaxvTjqmjxjA9Rk73m4ZuocR5ogyEBIxM0BU/YqK1XRVu9/rJE7rTXZk0OSSAq4Tzp0k6Wo0IonMqRXJw3+qwsiBPVGY68wDrGs+hsVrradl6eGnnFGCsAPP4ZV6h+ZZyZ2VCb3xN7Z0pW0++n4VAH+me8TSu3s692cSOR2G6EJkXY1Mh26KQFT9iooohwXv9zqNk3qTHRkkU/1tUkc0gC7hcMuEYjy7vkbI9dRF8NG+Jjz0/RLc+ir7uRs8LCrfgzMKelAUgiAsohv6PtHCtah3tu6aEu3tcxuWNIZn19cgM7UbZk88TXjk121+8vp2zJ92Jpeyl6jpMEQ0IlNgEikzQHQLV9EGeSJEWs1glUEjB/aMOqtNnXOyRNmS3tBYXVknzMiI5OsjxzB9xADcOLYILzCEr6xw31sfY/670aeUsyhJgLN55X7PWSeSB6uKgd9PgWZNY3jyr3uw8sMvMH1EIZaur9E9A0h2Dhxu487tVjdqPWeRAv+lwxDaiDQQEiVtTnRET3SqejJEElmMhWnDC3Hh4+t003dlqL9NakND9eo5gboIppQUOGZoHGrtABDdVaD+cFtUtyutfHEn88pZrk2GCCETVhQDvx90yTOu+sPHsHR9DW6ZUIx3d9TZzrP2Aj9EmQhvSRQDQRQshkFeVipzRI9Fab5j8uk4JT8TC1btQlNLO0USYRxxmza8ywFkVqzvdZQtqQ0NEcVJscQuApbQV15WKgAFTa3iO7XETjiRXSRiYbk2AI3i07QTxaf+ymElkhe/5+9bGde7O+rw93smYsnf9tpq3e0VvFEmM0cUGS5EImMW0QO6nJ1rquqZdQZWD3tmWoqQlJ9EcWpqGQsjB/bEhY+vY07f9dKITmpDQ7S3UWsRsFjxj142DEc7QuFe0SKJnHCThvRzLK+cJWf9vrc+RnNrR9x7GlvaMXv5Vvzoy2L87JKShBEOROLi9/x91j7rKqqS/mFtI1Z++IWzg3MYVrnv9/Q4glCxuqdOKSlAXlbqieyJeKzoDCwedhEpP3rZFfPKStAzO813+kWssVBR3eAb+ZTUhoZdb2P39BR829YZ/rfeImBZNBXVDbbGYoQ64V6pqHVsYrJsynrCSuXZ9TUIKQre21nvebtQMnYII2QqtLPKdaMH4sm/7uX6jNnm5gdY5b7f0+MIArCXKr2lptFw37aqM7B42O2k/OhlV9Q1H8Ps5dERGlH6hZnOIFqn8JN8SmpDw05xUkFOOtb/dBI+2tfENHHMFo0TZ3rEsq+xlel9ViamqMn83IbauNfqXD6kx+9nIxDuIEuhHS9a85uVkCL+IFI3yc9mzyn3e3ocIR6/OaDspkp7rcxaSfnhPRhQVNq4kc7ghE7hJ/nkK0NDb5FbXfxGXkk91KvOn3Ym0roFhVnxPGMpyEnHseMhzTQkIwbmZzG9z8rEdHoyK3AnH9rJGhYi8ZCh0I4HvfltRgBAblYqVn74pRPDco0ZIwYwPxu/p8cRYvGbA0pEC24/KbMqvLW3dtPGzXSGWyYUMxVs8+In+eQbQ0NvkU8
bXhjXCYVn8et5JfMyUzF+cC98WNuE+sNt4ddzs1JxwwXFmDSkn2bfYiuohlLb8RDumDwYK7Z8HvWdWi1r11TVMxtI6oT7zzFFeH5jjWkXiVBIQWdI4fo9bkRknM439PvZCIQ3eF1oxwqvp09FlTFmqY9+YHJJgebres4qv6fHEWLwowNKRI2Rn5RZFSvRFaspYGY6AwA8tyHeyFD/bken8JN88oWhYZRvp3UGBu/iN/JKdoYULF67By9uqsWhox041NqBReW78dRfdyMUMSCrnZO0DKiCnAzcOfl0FPXO0jVi9AykWCInXFq3oGnU5FBrB65Z9gG3p8Zs0isAuqd3w7dt9jpr1TcfNX2P1QgXFX8SiQyrpy+2SLzfiQiqnw0NI4XIzFPtx/Q4QhwyO6CM9joRaU9+UmZV7ERXeI0UFpkaMvDs2NUp/CKfpDc0rHjhrCx+Pa/kmqp6PFm+J+77YydPbOckFnS9JIePYVH5btw0tkjXAwfEG0i1B1tPREP0JxyrgWLFU2M26UMhxBVi8dLY0m74dzvhba/zUQnCSVjn7bxLz0RBTkZYeQkpCq55/gOHR+ccRgoRq6faT+lxhFjcdkCxOsrM9jpRaU9TSgpwx+TT8eKmGhw6+p2zQTZlVsVOdgWvkSJKF7BzHTvyya2aI+kNDatnXYhY/FaMnGfX12BY/1z06pFh+PBYrr1sUy2WbarlOvBu7qTTTCeOOjE3f9aAOb/fGiU8VKx6aswm/Y++LLZ1Ent+9/S419T7saaqXvNwRFajyY/5qATBCuu8LcjJiJKZ//Onfzk1JFcIBICbxxfHrX1eTzVFMZMTNx1QrI4yFgN5SkmB7bQnrfHkZabihrFFmDtpsJTGttXaWyspYKJ0AbvXsSKf3Kw5kt7QsLt41c9bsdysGjn/vXJ71OTWeng81zY78C7y+qwTLiUYQDAQ0DQyVJxoXfezS0ow/KQ8PPhOZVR6Rq/sNDSYRCuALiUoEpYOOqxGkx/zURMZJ70tfuseIwLW+R0KKXhn+1fhQ6H+uH2/20MVSkgBlq6vwdmn9OSSwZQqSQDuOaBYo2s8BrKdtCe98TQf7cCT5XtwRkEP6aIZKqyZG4C9FDCW6EkwACiKtsHjlU7hds2R9IaG3cW758C3eKp8d1yBNYvlZtXIYXl4PNdWr/eztz5Gk0aetNXJwTqGP1fWAYAwZeySs/rjotJCzVMujYRCYcyC5Omgw6I0+DEfNVFx0tvit+4xomCpozra0Ylrln2XJsVzqJ/MaHWto1RJggU3HFA8xgOPgWw1h1/muhRWtLIrmlrasGDVLmH1DCw6w83ju7pOyaJTePFspTc07HYzWrxO+0AqFuVcVFhM6+FZubaWkaF3fRZYx/ByxT68XLFPqDKmFfVQFyxgviCtdtAxUxr8UlyVyDjpbfFj9xiR6HbZy0pFU2tHXMG3TEZG9/RuuOb8ky2nXtY1H8PitXtw++TTAVj3VCdjNCyZSQkGMG14oeG8s6ss8hgPvAaylRz+RIn2aekZsU5Ou+uXRWc4+5SenukUsfIqpCiuP1vpDQ0r+XYssCjno4rzkZeVKqTbSuzDE90O1srk4B2D08oYj5JvNa2NRbmg4k/vcNLbkgheOhHEzu/e3dPxk9e3ez0sUxQlhNIBebausSgi5cOKpzpZo2HJzOrKOiw1MDJumRBf/8MLj/FgxUDmzeFP5GifE/VWZjqDVzqFXo0NCyKfbVDYlRxEVUALcqMXWGFuBn40oRiFudYiD5HKuVuoD081oIDvPPYir29EZ0hBRXUD3tu5HzPPOzmsZJmhbsYP/6kKnUY922wwtbQQG++dhBU3j8ZTM0dgxc2j8fd7JiI3Mw3vbP8KFdUN6Awp3IsggPjUKyNUYTR9xACMGdQroRVPmeDxpMl0bb8ROb+DgUBUWqmstLSH8N8rttm+jiq/jGSwVhRVjYbFziHVAbP6RIopkTiwRM7f3VFnez/kMR5UA1lvR+Ld6+y
ORwtVx4jcsxMdM53BbZ1CT14Z1eVGIrLpjfQRDRUji/CnU4diS00jNu39BovXVXNfW09p3VLTKLx3fOTD4ylYsnJ9LTQt3KwuC5fltzoVMtVLR1hdWRdXu1GYm4GZ553CfG2qr/APTnrSEtlLZ4dk+72R8os1ikrRsOSEJXIuYj/kia65UUtopy7FyagfpS2yYTW1HHCmQN03hgagH/JSX7e6Yeop57zXCwb0D2fRe3iRBpRee1YWjCaHWfvX5hMGxp2TT0dDSxterthn+n0ilROjU9+Xro8/VbO++RieLN+NvKxUNLd2mC4mqq/wD052eKH2xdok2+8FouUXS1pDouSsE3y45ZzgNR6criW0aswYHa5866tb8Vub9XWUtsiG1dRyp5yyvjI0zODdMM0sN9brzZ04CGNP64O1nxzAcxv4C8ZUQ2nMoF7IzUzDovLdTN+rYrbwWdu/rvzwc/zyiuFMhoYo5YT31HfgO6HXcTwUHruWsaEeeEheD//gZIcXal+sjeh6MT8QK7/M8rYpGpacOOmciPXOTykp4DIenM775zVmWLzo9731saWoX7I38eCFVQ7lZaa6cghjQhkaPBsmi+XGqpjcOeUMrKmqx/MGRoZRwVikwDm3qCf69UjDgSP6Z0rERk70JoeV9q8IwDVlzE54DwBa2ju7xnSiT7UKeTn8i5NpAdS+WBu7DTdENulwmgCAfjnpCCnfnRXCopxRNCw5cco5YeSd33jvJGbjwemDJHmMGRYv+qHWDixeuxe3Tx7MPAZKW+SHVQ49ffU5CAYDdDI4DzwbJovlxqqYADBUmAPoKhj76dShTBEHtWZC7zsXzzoHPbPTbJ88rsXBb9tcU8ashvdiUY0uP0cwKPf0O5xMC6D2xdrYqRdT7x2gfZioWWtQp9A7K+TY8RCuef67s0JYHBMUDUtOnHBO+M07z2rMsHrRX/xHDeZOOo35nrmVtphIezCrvBrtUqObhDI0AP0NUy0gLuqdxTWJWBSTiuoGSwtB9+TNEzUTuTGtdXmUIatK/MEjbbh+bLErypjINIMAgPcr63F/mf880pR7Go+TaQHUvlgb9b68tKkGC1btMn2/mjIaee/07uvZp/TEfW99LLy5RiyFBkaPKk9jx8Ci4LkVDUskZSdREOmcSGTvPKsX/VBrB5dR4EbaYqLtwbJF7xPO0ADEKxJm17OyEFgETmZqCp6+6RwcbGnj/g1WF92CVbvw/MYa7hBuLJ0hBZs/a0BFdQMABecX9UIwJYCD3373W0SmGfi1GNNv3i03cTItwOmUA7+SEgygd490pvcO7tcDYwb1CreyjJUTsUrzlvsn48OaRvzhoy/wx+37hY579r8NwvjB+kZP7+x0/OQPOwDEGzqsCp7T0bBEU3YSCVE6RSI3FRhVnB+X868Hj37idNqiTHuwSEeDTNH7hDQ0APGKhNH1rCwEVoETDAYwfcQArrHyjEkLuwtsdWVdnPdyMaLbDhfmZmBeWQlTTQ1PDrifijET2btF+BceeWbUMe7dHXWaSvMTV43ABzWNpmH9eWVDccfrO9B+PGQ6ljMKesTJ50iZXVHdgPrD9hU8p6JhMik7yY6esidCp0jkpgIpwQBuGFuEReV7TN/Lo584mbYo0x7shKNBlui9Lw7skx0rB+g4LXBGFeejIIfNMxmLnYP5VlfW4dZXt5qmSNQ1H8Ps5VsxbXjXAtI6MCsA4EcTipGbxXaSJdCV+uWXw4HoADlCRljlWVNLu+aBUGrHOL2D7dZU1TMdlBcMBpiMDMBccREpb0UfvGWm7ADOHpJKfMfqyjqMW7gWs57bjNtXbses5zZj3MK1wg5jlLGpgMjD9eZOGhyuMdVCSxcyg/dgTR5k2YOdPAxUhsOHydAQgJWF4LTAWVNVj2OMm7QWsQuMRRh1hhTMf7eK63te++eXePrqs+NOfS/IzcCSa8/B2af05MrrXrBql9CNwUkS2btF+BcWeTavbCgWrOJrNhGpNKu
tPPXW/ZSSAjz8JzZZwqK4yKjgqcii7CQ7bpz87sap3jyINqxSggE8dtkwzd/HYhTo6RlqGpCevLDq8ZdhD04GR0PCpk65DW8+nJPhQLO2tnlZqbj87AFYxnA44NdHjjGF9DpDCl7aVGOYnqDFodYO7Pm6RbMeBADGLVzLdT3AXrqBm8WYMis/iQAV1lrHTJ7lZqZZajYRqTRPKSlAj/RUVHx2EECX1230qV0eN7MGG5GweDNl7holg7KT7LiVQiNTka5T6XpWawPM9Awn0oBk2IMTuW5HhQwNgfAsBKcEDktb28zUFEwa0o/J0Kg92Iony3cbCiMgvsMLDy9u6mp3py4iVUHctPegZWXGysbgdjGmzMqP3xH9LJPRaDGSZ+9s/8rWtcur6nHX69ujns+bW78MP5/yqnqm69w0tojpecqk4MUig7KT7Lip7FlRxEXLH6cNK16jwOjg3kijR3TtrQx7cDI4GsjQEIzWQtATEk50BWBpa8t6MF+/nHSs2PK5oTD62Vsfo8lmy8pDRzuweO0e3D75dKaTzFng3Ri8KMaUWfmRBSsbrOhnmczdgPQ2drtKr5aTQ30+T199Nt5mNGQmlxQwf6dMXVgikUHZSXbcVvZ4FHEn5I8bhpWZUaDK9vrmo1iwapeuc1RBl57hREG2DHtwMjgayNBwGLfDgayC8K+7DpgusFmjTjHsIKEAto0MlUXle9DafhxL19cIPWWY5X542XlCVuVHBqxssKKfJXUD0sZMOTZCr4uc+nwefKcSjS3mcqVXdhq38i1LF5ZIZFB2kh0vlD0W77xT8sdrLzqvQ7Gp9TtnpGi83oOTwdFAhoaDsAoJkeFAVkH4zvb9eKCsxHCBtdkoJrfC0g1ijQyA7X6I8O7YCW3LqPx4jdUNVqSnTqbWh7JhpBybYfReBWAyMgBg+oj+lu67jGeoeK3sJDsyKntOyh8vvehmNaR6vLipFnMnDXZE1nq5ByeDo4EMDYfwSkkZVZyP/OxU0826oaUdW2oaDRdY12F77qE40FShqaXN9D12vTsiQtsyKj9eYWftiPTUJUORnh30lGO3mMKRNuUHyOHgHTIqe07KH68MK5YaUj0OHeU7UZwXL/fgRHc0kKHhEF4pKSnBAGaMYO8opX5Gawx20iOcpjA3A5eeVYjnNtQYvm/Bql246ETUSA873h1KrRGPnbUj0lPndXqBH4hUjjftPYjF6/YKuW5+dhqaWtp15Y6bLUDdhBwO3iGbslfffJTpfVbkj1eGFUsNqRGJLGsT2dFAhoZDeKmkTC4pYDI09hw4gorqBtPOWLe+ulX4GK0yd+IgjD2tD0YV52NLTaOpoVHXfAwvbapB7x7pugvXqneHUmucwc7aEempS9QiPdEdbFTleFRxPt7c+qXpvVcUBQcOt5mcCl6COcvl8S4TyYEsyt7qyjosWLWL6b1W5Y8XhpVdfcdvspaXRHU0kKHhEF4qKayRiMXrqrF4XbVhms/U0kLcOLYILzAYLpGoCkL39G74tu0412f1rleQm4E7p5wRFvqsHp9Iga31W616dyi1xhnsrB2RnjoZ87bt4mQHLdZ7D8D0PVNLC7Ek6L53ORnbGBPReK3ssdYwiJA/bhtWVvUdu7810de17L+PDA2H8FJJ4S3UNEvzmVJSwG1oFORmYOZ5Jxt2rWJFS0Hk8fhEovdbrXh3KLXGGeyuHVGeOhnztu3gRpof671neY/bSlAytzFOVmRT0HhrGETIHzcNKyvp2HZlbaKvaz/8voCimJfgHj58GLm5uWhubkZOTo4b40oI1I0d0FZSnM7f52khpypvG++dFLeYO0MKxi1ca3idwtwM/PKK4TjY0hYW2O/t3I/bV263+SviF43VrhUqZr+VdeOpqG7ArOc2m37fiptHCxXkfl2PPOMWsXZEKRF+EORmmK1hozVh9fvM7r1MSp6eTHFLVrtNMsgQM2Rc16x7Sn52Kh6ZMcyXc9JItisA8rJScSiibb6dZ5L
o69rr38e6Himi4SBeF5fxFGoapfmkBAOmhdfThhdi7ODeUa/ZTQvLy0zF09ecg9Gn9gorIHa6VqiY/VZWoyARU2tkQcTaEeWpkyVv2w5up/mx3HuvU1RUqNYq+ZC1iQdr9LtsWH/kZqahM6T4bk6ayXZRsjbR17Wffh8ZGg7jtZKibuZ20nze37kfyzYaF12/u6MOP506NOp3We1apV7hscuHYexp0caL3a4VkdhNaUq01BrZ8HrtRCKLUmwVSvPTh2qtkguZFTRW59wrm/fhlc37PI/AWMVMtotYZ4m+rv30+4KefnuSoCop00cMwJhBvTxRlKwW2K6urMPs5dsQMrEU1AkdiaqIA98p3rGUDStEz6zUqNcKcjN0PUoiFSERhfiqd6YgN/paRr+BYEeGtZMIJGoHLRGQEZZc8ChobqM651ilnBqBWV1Z5+i47NAZUlBR3YB3tn+FiuoGdJ5QJpyW7Ym+rv30+yiikSRYSfNRPT+saE1ovTBpYW4Gpg0vxDvb69AUkY+Zn52GeWX6HhpWRSg/OxVNLR2upDTJ5Hkn/I1TdQuU5qcPGWHJhcwKGm8jF68jMGZ4WQeT6OvaT7+PDI0kwUqaD2+akjqhY5WlKSUFmDSkH16pqMW+xlYMzM9Cvx4ZmLtyW9w1GlvaMXv5Vvw2qB0NYFWY5pUNxZzl21xLafJ7ag3hPTK0npVNUXEDMsKSC9kVND3nnB4ypchEYlQHc+urW3Hj2CJMKSlwzCnnh3Vtx7Hkh9+nQoZGEqBO5rbjIdwx+XSs2PI56g+bF9jyeHTUk3q1lKW8E6lRkZ0kAiZr6WdvfazpoWFVmLr68AfixtIvJx2zRp2CtuMhw8MKCcJNZGo9m2yQEZZc+EFBi4yS/7myDi9X7DP9jAwpMiqdIQX3vfWxbh0MALywqRYvbKp1LMIh+7q261iS/fdFQu1tExytyVxwQtku6p1taEWzttoDgN9eew4A2Go7G8vv/+v8uGJwFdZFGukxqD3YGmdk+bGYzq/r0alxy9Qm1Qoytp5NRuzISr+R7DLE69bzPHjVRt0OT5XvZj5Di+WeW5VZnSEFi9fuxYubanDoqJiWuSIQ2ZbWy/Q01vVIhkYCY3cyqwqQUdeoYABYPOscXFRaYHrWBi9zJ56Guy86w3B8rMLH637TIvHrenRi3DL2wufFj4pEopKIjgktSIb4R3aY7cOiHREs4zHadztDCkYuWBOl2Jth9BusPifN7IrMVNwwtghzJw125F6xnh8k2rHklfOIztFIIrQmGQCuFn56E9WsMG3xrLNxyVmFqKhuEGpkfDdSfVjrImRuZ0hYR9Ze+LzIXJzqR+xsuqpMWV1ZhyfLd/t+bhH6eNHEw8rclClFhkXp31LTyGVkAPp1JlZlvN7nmo924MnyPTijoIfw9ctqEDnRllb2GlEyNHyO3uSeed4pzJO5+Wi74QLR6xoVuYCcUILGnKqdNsWLn/pNE2wkkvEoe3GqnxDhpU6kuUUY46aCZmduylBfxar029EFIj9rdR16sX55DKJkdCyRoeFjjCb3ovLdTNdYU1WPFzfVmi4QM8+PaCUoLysVowVtAMm4sBOdRDIe/VCc6gW83l9REa5EmluEHIiYm162UedR3u3oApGftboO3V6/vIZNMjqWyNDwKWaTm5U/bt9vukAmDemHj/Y1GQo3q6eA6/HYZcMAdOWvq987cmBP03FokYwLO9FJJONRptQIWeD1/or0YibS3CK8R+Tc9CpFhkd5t6ILaDlTrK5D1s/937/qPDmBPBkdS2Ro+BTeMy5iCQDomZ2KxpZ23feoC2T0o+VobDHu2MB70JD6ntzMbmg+ejz8ekFOOuZPOxMA4gqmggFEnVDOGnZOxoWd6CSa8ShDaoQsWPH+ivRiJtrcIrwlESJkPEq/FV0AiHemWF2HrJ976R/7kN4tiJ9dUsL0fj14DaJkdCwFvR4AYQ0eb1rsdFX/PWPEAKbPRxoZwHcb/urKuqj
XVWWpIDd6offMSg2fpaFSkJuB3157DrbO+3esuHk0npo5AituHo1N930PQFeb3FjhHIqRWHrjiEVd2ID+vUi0hZ3oqMaj3hML4LuzXfzC1NJCbLx3UtR62HjvJE+NjM6QgorqBryz/StUVDegM3YR2ny/1ufNIrUP/6kq7roioxCJOLcI7/AiQmZ3HcbCq/Tz6gJazgN1Heqhtw7NPhfJs+tr8P5OY/3BDCsGkd790bsXfociGj6FdXLfOXkwVn74haaXNDczDcs21XJ/t1G4Vy+PFIBubmmkF8dI0eAZRyzkMU4sEtUrJFP3EN70JRGF2Fa9vyKjEH6cW3Q2iry4HSFzom2vlawAK7pAJCnBAKYNL8Sz62t0x6W1DtX1e+uJc1LMmPdOJS4qtV4YznJv+uWkI6QoeGf7V+Hf7GXNjduQoeFTWBf+3EmDMXfSYM3J3BlSLNdVGIV79ZQlFgWKNyWMJ+ycTAs7GSDj0Tl405dEFWJb9f6KTo/009zyy3kQyYqbqbtOtfy2anzb0QVWV9ZhqYGRccuEYt3fMrW0EDeNLWJypDa0tNtKWzO7NwqAY8dDuOb5D8KvR65PUY4lmZ0NZGj4FN6FrzWZeXMptRBdEGn1eqyfk8ljTNiHjEfx8Baviix2ter9dSIK4Ye5lShnySQybkXInG7r6qbxbZbZEADw7o46/HTqUN3fMrmkgDljw64eo3dvcrNScai1A4datdPPRa1P2Z0NVKPhY0Tk+eldo1d2GtMYRBdEWr1e7+7pQsdB+AfVeJw+YgDGDOollSLIiuicajvwpC9Zeb8RduojnMh7lnluWa1nIdzHjZx8ketQj6mlhfj7PRMxr2worhszEPPKhuLv90wUrsyK+C2jivORn52q+/dIROgxsTV2v7/pfGR0S9F8r3LifyLWp+psiL1frDWsbkARDZ8jwuumXmNzdQMqPjsIIIDzi/Nxzxs7cOBwm65XoWdWqvCCyFHF+cg74QXggvZSwgWcCE/L5o3iTV8SWexq1/vrhyiEKBKhm1EioicjnJ6bbhSda8mq5zfWCJdVIn5LSjCAn08vxezl2wyvIbKxQ2TGREV1A+oPG/8Ou+vTL4eLkqGRAIhIB1pTVR8lQBav6zo0z0h/b2rtwJqqeilCcwdb2rweApHgOGEQyJj6wpu+JLrY1W6KRrKkR9J5H/KgGhflVfV4e/tXuu3gnZybThedG8mqW1/dijsnD0ZR72whBpSo33LJWf3xoy8PcReUi4B13a2pqrc8J/zibCBDg9AVIM0mUQUnrOUtNY380QxQT3vCWZwwCGT1RvEWrzpR7JpMkQmr0HkfcqDlgIjELaeBk0XnLGl6i8r3hF/zosuVHmef0hOAvqEhAq0oFuu6e2f7fjxQZs3Y8YuzgWo0khw7J4zz5nyy5KHzLgg/97SXKS+f0MepXHg3cqqtwHvujFPn1MhcHyEDdN6H9+jlx0fiVr2Mk+dF8XaDtFsfIOq3qLJbD9WZY+e5rK6sw7iFazHruc24feV2zHpuM8YtXIumljamGhG165UVRDobnNRHKKKR5Ng9YRxgMw5Y0056Z7MXdcva054F2fLyCX2cCk/L7I3iTV/yUzvYRMGP530kErxnPrmRwuLUOuSVQbJ0uXI6tcgo0j1n+TZMGtIHf/3kG9PrWJXxIiI/nSEFi9fuwYubanHoqHbKn13I0EhyRCgxZtYyV9oJhzzyqxIjY14+oY9TBgGrN6r2YAvXdUXBm75E6U724W02QAaed1hx0rnhNHBiHVpJvxNhXNn9LU46c1hSX7d9cYjpWlbTG+06G1ZX1uG+tz7WTFcXqY+QoZHk2MnfZbWWefLQD37LVtQ9d+Ig3DnlDN8pMbLm5RP6OJULb+aNUllUvgeD+3ZHz+x01xV43uLVZCnEdgKrUU4y8LzBinLqVr2M6HXIKqu0sGtc2fktTtYxsURLGls6kJ+dhqaWdscOa7TqbNBzeEaOX5Q+QoZGkmNHgAD
moXne0CXrgh97Wh9fbqR+6RJBfIdTRZaR3igz5q7YhsiUWUqzSyx4o5xakQ+SF/bhiSjxKKciT//2AjuH+/bOTkdFdYMnRrCTBfKsBtQPRvTHi5tqHU1v5HU2sKb9idJHyNBIcqwKkGAAWDzrbFNFhzd06aRgkAGZ8/IJbZzMhZ9aWog7Jp+OReW7Dd8XW5eXrGl2Tpxj4jW8UU6q73IG3vvK66Tze72MnudcjwC6Tsb+yR92RJ0n4eZcFSG79WQOq6E5paQAo4rzHU9v5In88Kb92dVHyNAguAUI0KX49GQo3OYNXaYEA5hXNlTzkJ1EKHCklpT+xMlc+KLeWdyfUTfMB96uxKQh/ZDWLfEbCCaqgs0T5Ww+2k71XQ5gpW6O1UmXCHNUJdZzXnuwFU+ecJLEKvEKcCL3Pzr/3+25akd2G8mcKSUFzE7RlGBAqvRGp+oJ9SBDgwAQLUD+XFmHlyv2mX6GZbKqXh+jjbQwNwOhkIJ3tn+F2oOtWLHlc833JUKBY6JHbBIZp3Lh7QjxhpZ2jH60HI/MGObrdWFGIjdQYN306w8fw/+u/oTquwRjp25OT4nNyeiGs0/Jw4TBffCfY4oSyhEQ6zk/o6B73O/vl5OOY8dDmkXGXsxVK7KbRebwREtkql/j2XNEtMgmQ4MIE7kQWAyNPQe+RUV1g+GCTQkGMG14oeHJnM1HO3DNsg9Mv29emb+NDIBaUvodJzYLu3VSjS0dvle2jUj0Bgqsm37jt21U3+UAduvmIpXYNVX1+OP2/Whsacffdx/E33cfxPMba3zvIDNCS4kPKQqueV5/T/dirvLIblaZs/HeSUzREtlSPnn2HBH6CBkaRBysk3Dxur1YvG6vYWi4M6Tg3R3Gh/a0tneajikAYMGqKlxU6k9lIhJqSUlEYqfQMhI/K9tGJHoDBdYoZ352GtP1qL6LDxF1cynBAJqPtuPFTbUJGXUzI1aJf2f7V0yfk3Wu8sgcs2iJjCmfLHtOXlYqHrtMTKQ8ceJ5hDCMTuXUwugUUBEHAgLenZLsFFNLC7Hx3klYcfNoPDVzBFbcPBob752UsBsRYYxqfBbkWkuj8sv6sHL6bKI3UGA9BbkgN5PpelTfxYeIujkzDzjg/MngMuH3WkRemaMaWtNHDMCYQb2ijAytk+PtnpwuAr09Jy8rFXdOPh0fPThFmD5CEQ1CE54CcaP0BdGbv1+VCS1kytkkrCMqLB6bgvHCplrua8i8Pqx69vyutLDAEuXsDClU3+UAIurmEj3qxovfaxHdMD5lSPl06wweMjQIXSIn4aa932Dxumrd9+oJUtGbvxPKhGz5k4R/EB0WTwkGMKo4H3e9vt3SeGRVtu0Uc/tdaWHFbNOn+i5nEHFfEz3qxovf56rsxqdIncUNhycZGoQh6iS0KkjtFrqqOKVMyJg/SfgDpzohWUk3lFnZtuvZ87vSwoPZpk/1Xc5g9b6qCt+eA98yfY+sjgAn8PNcddP4rG8+ynWgoR91FjI0CCashhJFFLo6pUwkcstMwlmcDIvzej1lV7ZFePb8rLSIxq10h2SD975qKXx6yOwIcBI/z1W7ModVZ1qwahcaW9rD/zYyGvyqs5ChQTBhJ5Sot2B7ZqWiqbXD1ABxQpnwQ/4kYY5XaW9OhsV5vZ6yK9ui0kr8rLSIhuq7nIH1vuopfFrI7ghwGj/PVTsyhzWbI9LIAPSNBj/rLGRoEEzYDSXqLdg1VfXxHoOcdMwadQqKemc7pkxQ8Z7/8TKE7GRONotRn5+dhgfLhqIgN1N6ZVtkMbeflRYrUP2YfBgpfFrI7Ahwc375dS6zyhyt32clm0PPaPBLzYcWZGgQzNgNJWotWK+8lFS852+8DiE72QmJxaj/xYxSKRUXLZKlmFs0fszFTgZYa6jmThyEsaf1kVahdnN+JfpcNvp9WjpTfnYqGlviT01X0TIanNJZ3Hg2ZGgQXDhhGHjhpUyGlpmJRKTHpXf3dMx/91+ehpCdVp4
TqSYhmYq5ReG1IU3ow6rIDe7Xw7F9za4H2s35lehzmeX3bbx3UtTzqj98DHe+tt302pFzzQmdxa1nQ4YGwU0ipC+Ql9U/8BRdAu6EkN1QnhOpJiGRDCenYTn87YG3KzFpSD+kdaMzd93GayeVXQ+0m7n+rN81aUg/fLSvyXdyjudeRu5FFdUNTNePnEOidRY35wEZGgQTfs2v1IO8rP6Ap+gyFqdDyG4oz4lg1KskkuHEglWZyZKa09DSjtGPluORGcPISHMZL51UIjzQTtcnRs77g0famL5r9KN/Ze68JBNW76WVOSRaZ3GzTpUMDcKURM2vJC+r3PAWXcbiRgg52ZRnuySS4WSEHZnJaiA3tnQkROqJ3/DKSSXKA+1kfSJv9FmFtfOSbFi9l1bnkEidxc06VTI0CEMSPb+SFEV5sXJwHeB+CDlZlGeCDbsykzflRtaWlomMF04qUR5op1K/7ESfY5G9XauKnXtpdQ6J0lncTAEkQ4PQxc99m3kgRVFOrHhSZA8hE4mNCJnJ2n9fvSbNTW9w20klygPtROqX3eizFn6Y23bvpdU5JEJncTMFkCrJCF14FDCCEI0VT0pBbgZ3lI1aHROiECEz1bQKHmhueoOq8E0fMQBjBvVy1OEmygMdOb9iR2s19ctq9JkFmee2iHvp5hyK/V7R80APMjQIXUgBI7xE9bjoibkAuvLef3/T+Xhq5gisuHk0Nt47iTttwesuMkTiIPIU9CXXnoP87DSm69HcTHxY5SGLB1qdXwW50fPGiqMGsKYD5GenMr1P9rkt+l66iVtjp9QpQhdSwAgvYS2YGzu4t63voVbHhChEysyppYWYNKQfRj9arnu4F83N5EF0EbrI1C/WeT+vbCh690hH3x4ZGDmwJy58fF1CyF0/13q6MXaKaBC6iPSgEIQV3PC4uBlCJhIb0TIzrVsQj8wYhgBobhLi5aGotB3WeX/92OLwd6V1CyaU3PUqBUoETo89oCiKaf3O4cOHkZubi+bmZuTk5AgdACE3aicJQNuDIntoMBHx63q0M243znFJ1DbOhLs4ITNFz81klCGJhIznWlmd9yR3/QvreiRDgzCFBIFc+HU9+mHcMm7ghP9wQmaKnJt+WIta+HXcyYLVeU9y15+QoUEIhQSBPPh1Pfp13ARhBZllpl/Xol/HnUzIPO8JsbCuRyoGJ5igsyYIgiDYIZlJJCM074lYqBicIAiCIAiCIAjhkKFBEARBEARBEIRwmFKn1DKOw4cPOzoYgiDMUdchQ3mVVJAcIQg5IBlCEIRdWOUIk6Fx5MgRAMDJJ59sc1gEQYjiyJEjyM3N9XoYzJAcIQi5IBlCEIRdzOQIU9epUCiE/fv3o0ePHggEqHsAQXiJoig4cuQI+vfvj2DQP9mPJEcIQg5IhhAEYRdWOcJkaBAEQRAEQRAEQfDgH1cGQRAEQRAEQRC+gQwNgiAIgiAIgiCEQ4YGQRAEQRAEQRDCIUODIAiCIAiCIAjhkKFBEARBEARBEIRwyNAgCIIgCIIgCEI4ZGgQBEEQBEEQBCGc/w82VOYo4Q7JCwAAAABJRU5ErkJggg==", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "loc_sampler = Mix_Distribution(n_cluster=3)\n", + "generator = TSPGenerator(num_loc=200, loc_sampler=loc_sampler)\n", + "env.generator = generator\n", + "\n", + "fig, axs = plt.subplots(1, 3, figsize=(10, 3))\n", + "td = env.generator(3) # generate 3 instances\n", + "for i in range(3):\n", + " axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n", + " axs[i].set_xticks([]); axs[i].set_yticks([])\n", + "fig.suptitle(\"TSP with 200 locations, mixed distribution\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Generating different distributions for MCP\n", + "\n", + "In here we visualize the different weight and size distributions for MCP by passing the distribution name, which is automatically parsed:" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from rl4co.envs.graph import MCPEnv, MCPGenerator\n", + "from matplotlib import pyplot as plt\n", + "import torch\n", + "from collections import Counter\n", + "\n", + "generator = MCPGenerator(size_distribution=\"uniform\", weight_distribution=\"uniform\")\n", + "env = MCPEnv(generator=generator)\n", + "data = env.generator(100)\n", + "\n", + "sizes = torch.count_nonzero(data[\"membership\"], dim=-1).flatten().tolist()\n", + "size2cnt = Counter(sizes)\n", + "weights = data[\"weights\"].flatten().tolist()\n", + "weight2cnt = Counter(weights)\n", + "\n", + "# plot the size distributions and the weight distributions\n", + "plt.figure()\n", + "plt.bar(size2cnt.keys(), size2cnt.values())\n", + "plt.title(\"Size distribution\")\n", + "plt.xlabel(\"Size\")\n", + "plt.ylabel(\"Probability\")\n", + "plt.show()\n", + "\n", + "# Note: the size distributions are not perfectly uniform since there might be repeated items and are removed in post-processing\n", + "\n", + "plt.figure()\n", + "plt.bar(weight2cnt.keys(), weight2cnt.values())\n", + "plt.title(\"Weight distribution\")\n", + "plt.xlabel(\"Weight\")\n", + "plt.ylabel(\"Probability\")\n", + "plt.show()\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We can also pass a custom `sampler` to generate data:" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from collections import Counter\n", + "from torch.distributions import Normal\n", + "\n", + "size_sampler = Normal(10, 2)\n", + "weight_sampler = Normal(5, 1)\n", + "\n", + "generator = MCPGenerator(size_sampler=size_sampler, weight_sampler=weight_sampler)\n", + "env = MCPEnv(generator=generator)\n", + "data = env.generator(100)\n", + "\n", + "sizes = torch.count_nonzero(data[\"membership\"], dim=-1).flatten().tolist()\n", + "size2cnt = Counter(sizes)\n", + "weights = data[\"weights\"].flatten().tolist()\n", + "weight2cnt = Counter(weights)\n", + "\n", + "# plot the size distributions and the weight distributions\n", + "plt.figure()\n", + "plt.bar(size2cnt.keys(), size2cnt.values())\n", + "plt.title(\"Size distribution\")\n", + "plt.xlabel(\"Size\")\n", + "plt.ylabel(\"Probability\")\n", + "plt.show()\n", + "\n", + "plt.figure()\n", + "plt.bar(weight2cnt.keys(), weight2cnt.values())\n", + "plt.title(\"Weight distribution\")\n", + "plt.xlabel(\"Weight\")\n", + "plt.ylabel(\"Probability\")\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Tl;dr: RL4CO allows for easily generating data for CO problems! 
🚀" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "nipsreb", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.7" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/other/3-data-generator-distributions/index.html b/examples/other/3-data-generator-distributions/index.html new file mode 100644 index 00000000..83c1d5ff --- /dev/null +++ b/examples/other/3-data-generator-distributions/index.html @@ -0,0 +1,3483 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + Generating data in RL4CO - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/examples/other/index.html b/examples/other/index.html new file mode 100644 index 00000000..a98c4e1d --- /dev/null +++ b/examples/other/index.html @@ -0,0 +1,2386 @@ + + + + + + + + + + + + + + + + + + + + + + + Miscellaneous Examples - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + +

Miscellaneous Examples

+

Collection of examples on other topics.

+

Index

+
    +
  • 1-mtvrp.ipynb: here we show how to use the Multi-Task Vehicle Routing Problem (MTVRP) environment, which includes 16 tasks that can be solved simultaneously.
  • +
  • 2-scheduling.ipynb: provides a brief introduction to scheduling problems in RL4CO, using the Flexible Job Shop Scheduling Problem (FJSP) environment.
  • +
  • 3-data-generator-distributions.ipynb: here we show how to use the data generators and how to generate data from custom distributions.
  • +
+ + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/index.html b/index.html new file mode 100644 index 00000000..9c78ee80 --- /dev/null +++ b/index.html @@ -0,0 +1,3069 @@ + + + + + + + + + + + + + + + + + + + + + + + + + RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + + + + + + + + + + + + + +
+
+ + + + + + + + + +

Home

+ +
+ +
+ +
+
+
+ + +
+
Loading...
+
+
+ AI4CO Logo +
+
+ + +
+
+
+ +

An extensive Reinforcement Learning (RL) for Combinatorial Optimization (CO) benchmark. Our goal is to provide a unified framework for RL-based CO algorithms, and to facilitate reproducible research in this field, decoupling the science from the engineering.

+

RL4CO is built upon:

+
    +
  • TorchRL: official PyTorch framework for RL algorithms and vectorized environments on GPUs
  • +
  • TensorDict: a library to easily handle heterogeneous data such as states, actions and rewards
  • +
  • PyTorch Lightning: a lightweight PyTorch wrapper for high-performance AI research
  • +
  • Hydra: a framework for elegantly configuring complex applications
  • +
+
+ RL4CO-Overview +
+ +

We offer flexible and efficient implementations of the following policies:

+
    +
  • Constructive: learn to construct a solution from scratch
      +
    • Autoregressive (AR): construct solutions one step at a time via a decoder
    • +
    • NonAutoregressive (NAR): learn to predict a heuristic, such as a heatmap, to then construct a solution
    • +
    +
  • +
  • Improvement: learn to improve a pre-existing solution
  • +
+
+ RL4CO-Policy-Overview +
+ +

We provide several utilities and modularization. For example, we modularize reusable components such as environment embeddings that can easily be swapped to solve new problems.

+
+ RL4CO-Env-Embedding +
+ +

Getting started

+

Open In Colab

+

RL4CO is now available for installation on pip! +

pip install rl4co
+

+

To get started, we recommend checking out our quickstart notebook or the minimalistic example below.

+

Install from source

+

This command installs the bleeding edge main version, useful for staying up-to-date with the latest developments - for instance, if a bug has been fixed since the last official release but a new release hasn’t been rolled out yet:

+
pip install -U git+https://github.com/ai4co/rl4co.git
+
+

Local install and development

+

If you want to develop RL4CO, we recommend installing it locally with pip in editable mode:

+
git clone https://github.com/ai4co/rl4co && cd rl4co
+pip install -e .
+
+

We recommend using a virtual environment such as conda to install rl4co locally.

+

Usage

+

Train model with default configuration (AM on TSP environment): +

python run.py
+

+
+

Tip

+

You may check out this notebook to get started with Hydra!

+
+
+ Change experiment settings + +Train model with chosen experiment configuration from [configs/experiment/](configs/experiment/) +
python run.py experiment=routing/am env=tsp env.num_loc=50 model.optimizer_kwargs.lr=2e-4
+
+Here you may change the environment, e.g. with `env=cvrp` by command line or by modifying the corresponding experiment e.g. [configs/experiment/routing/am.yaml](configs/experiment/routing/am.yaml). + +
+ +
+ Disable logging + +
python run.py experiment=routing/am logger=none '~callbacks.learning_rate_monitor'
+
+Note that `~` is used to disable a callback that would need a logger. + +
+ +
+ Create a sweep over hyperparameters (-m for multirun) + +
python run.py -m experiment=routing/am model.optimizer_kwargs.lr=1e-3,1e-4,1e-5
+
+
+ +

Minimalistic Example

+

Here is a minimalistic example training an Attention Model policy with POMO on TSP in less than 30 lines of code:

+
from rl4co.envs.routing import TSPEnv, TSPGenerator
+from rl4co.models import AttentionModelPolicy, POMO
+from rl4co.utils import RL4COTrainer
+
+# Instantiate generator and environment
+generator = TSPGenerator(num_loc=50, loc_distribution="uniform")
+env = TSPEnv(generator)
+
+# Create policy and RL model
+policy = AttentionModelPolicy(env_name=env.name, num_encoder_layers=6)
+model = POMO(env, policy, batch_size=64, optimizer_kwargs={"lr": 1e-4})
+
+# Instantiate Trainer and fit
+trainer = RL4COTrainer(max_epochs=10, accelerator="gpu", precision="16-mixed")
+trainer.fit(model)
+
+

Other examples can be found on our documentation!

+

Testing

+

Run tests with pytest from the root directory:

+
pytest tests
+
+

Known Bugs

+

Bugs installing PyTorch Geometric (PyG)

+

Installing PyG via Conda seems to update Torch itself. We have found that this update introduces some bugs with torchrl. At this moment, we recommend installing PyG with Pip: +

pip install torch_geometric
+

+

Contributing

+

Have a suggestion, request, or found a bug? Feel free to open an issue or submit a pull request. +If you would like to contribute, please check out our contribution guidelines here. We welcome and look forward to all contributions to RL4CO!

+

We are also on Slack if you have any questions or would like to discuss RL4CO with us. We are open to collaborations and would love to hear from you 🚀

+

Contributors

+

+ +

+

Citation

+

If you find RL4CO valuable for your research or applied projects:

+
@article{berto2024rl4co,
+    title={{RL4CO: an Extensive Reinforcement Learning for Combinatorial Optimization Benchmark}},
+    author={Federico Berto and Chuanbo Hua and Junyoung Park and Laurin Luttmann and Yining Ma and Fanchen Bu and Jiarui Wang and Haoran Ye and Minsu Kim and Sanghyeok Choi and Nayeli Gast Zepeda and Andr\'e Hottung and Jianan Zhou and Jieyi Bi and Yu Hu and Fei Liu and Hyeonah Kim and Jiwoo Son and Haeyeon Kim and Davide Angioni and Wouter Kool and Zhiguang Cao and Jie Zhang and Kijung Shin and Cathy Wu and Sungsoo Ahn and Guojie Song and Changhyun Kwon and Lin Xie and Jinkyoo Park},
+    year={2024},
+    journal={arXiv preprint arXiv:2306.17100},
+    note={\url{https://github.com/ai4co/rl4co}}
+}
+
+

Note that a previous version of RL4CO has been accepted as an oral presentation at the NeurIPS 2023 GLFrontiers Workshop. Since then, the library has greatly evolved and improved!

+
+

Join us

+

Slack

+

We invite you to join our AI4CO community, an open research group in Artificial Intelligence (AI) for Combinatorial Optimization (CO)!

+
+ AI4CO Logo +
+ + + + + + + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/objects.inv b/objects.inv new file mode 100644 index 0000000000000000000000000000000000000000..5618cfe3a7328df8b0a67310ba68c1f607a37143 GIT binary patch literal 3291 zcmV<13?%a-AX9K?X>NERX>N99Zgg*Qc_4OWa&u{KZXhxWBOp+6Z)#;@bUGkXOf*AJ z3L_v^WpZMd?av*PJAarPHb0B7EY-J#6b0A}H zZE$jBb8}^6Aa!$TZf78RY-wUH3V7PholSG2Iu?fa^DDY)W;=9EY8F$o^R=CH_r#7X zPTgKo3djx}kSIxZ+WqTCLV&@>AfY4rF8apin&&+_I{KC%Mgj$~{13+>SpF0Y{STiO z`unH+^xr5&oPYY)r2M0`eh@>$*U`S1Vu^v}P=J%}KpX^I36cSO;42NH>d zl23QHfGyYyCY-WG5{VAnh44M%;w5&lyal*rw>j?0_Axf~IsnKnmF@>jFhd0i!pb&s zyv=*fz~S|`(xCt_yhDdnR8S5>#pGCAfuUt_o{z!FqDc6TvWy2?AwjdlK9fJS&gcdw zPTp|LP#XRxL>IJihTQ;$9}ML=X5+#9lx0}3Bmy$@%&RY2!VV%yc@Vwf=smVxn$k=i*B_#v8cj$A8bCph0C|RE`UeC{5x-oQ9HZ zrD0fgS~2%ngs4D;8RGBYY=%D&i$SqPsG3x$meferV;mzEy@7%mCh>4pXo<{I6k%y? ziX(yJG6y-Z2z0E;(s9JFM1gZqprEig)5fNUs%zD31h9=nuNN{c1>}6|aTY2X# z*4aQsw6O3tH##zHq!{sndvP4WIszw%`pkpO?V4#^3^24j{<%T(S2 zlb1V$V12Cx&h9Q`U_2g|hA*7G-69nZAcsshovtPBf(_m(D}KYf3mD(>xN7US3-=D& zHO*5r^K&?FA&OxIgC==O{)LFAflRwRyOw4yT@fEr1>WsS`|s}!{e8ZzS=8Hu=t?tUC(5OIZcx&!Q56K zlP>)wnM%L7?{p!*DK7d@FDAz4jVm5KeM>9YQD(9f1udI1HLxu{hi{a=Po?iMm~LrJ z?cxaoR!dEhz%})qbG3r!S94F;yN>dl z93M@gRm`2}?Vn@S2nmo-zfc>GSBF$2UoeVi)g`lPgAg00b=6>mpVKTy0?=L!^kgif zoC7*}Llb!i^GF2s!x>IibO~v!;&qyOH-NVC!7VG&(;5rVOlT89GeK=f!*Li>p;p*b zy%N^{GvtX{dUMcG8~SnfisM+;g{o4Mcl{J zPYoTP2+ER3ue~nxmt|8DIEl5MIy^OrQgLujfA;N6Ijkw#*01uf&!iPPx*?iKYN|BJ zs$v=;BxJX75~-(YQdBg5(8$D;ghCY`tF4OB-vlrHWy8+k^F)c99ehQYa4a zd$2yGdw+14^^1OuoT}vnwQgaw#l&7<^qPnPR;{t`y+kE{Lk!2GS0no2>Jb;F4>Ref zM@-h9Q7|w5xU}s3NY^@9(({}a|2CVap=wJ0tmp1=rJ{q$a6)9dBE2e=CIs^`)qj-V zhYYO=_UHf~QEFhfi-c*(v(i}p%qdZwFqC?6QwQIRuT~flF9}#v&sZ<+cwT;8-#yhv1~u=)M%R0gYXjuZMN?qxK#5I0v8%gfA=lp zC(bTJd`8)}=w5jVvNqaFu75`?JLF!hZ=*ezkV`S|uJRMO7aBg}RzH@iydJ(bBEVhc z{Hd<-0Ya;T8pwEx4yis<&bc@1^%EC%jAmhRRxVfDQ2eQl8W)VzlA%?e%m~FP$6=;s zC{4FCj?@H+>tB=xsMvW|KCdh&|ICVu+xi)1H^WX6J~#LD+2cp-J%txF$}C7( zHL7L-bgcG>4(nw>@hzyQ`Gq@e0vl{7H^Zx$iPG}b(ENr8F_xaM 
zkD4rI^B0pt4GP@Ydu|Lho!c?uSBFp(-(;!62&!GHknXH95ERTX`|Xin9>q9Ekqj^* z_(_(qESM3oEk4tt(%dn1 zlr7yRUI&FR;&m-kazlB|xpC;?=6YYV+U`q~NSLA%h!7#ca<(lNnb!jka38_5@%JFQ zY?dY7-OMw~M;EPM0j588O9QU+b)f*$)4G7dcB|U(W%ddgC=xdmD|aR$R*`6D&vj(M zTBP}=Hg!iLltpLyfIZi7>u7=o4yfJ^Y)ADrxW|e|bb<_jiTg{1e}_H4J^WiX{RP5b z*)x6kE7ji-{%>;hdp;}m1t-D5%zeD!7KJW}nYkM39A5Yip)S_DfK;F*HA^Hf2P z4A8tmhJ@POSaoWPO^#cE_E?>eG9B?7id5rry`g$|_oN#dGUGc{AVT*R*r)NyPaJO} z$}rz9HtuNlow;DD_t&-Q{BirT^38|r zjFnRL5-ZRMt{dyo@NMzP6tkzlxZ^z}q;5G0XbxOpizA%jTN1~Z02*JGExod3a-ze8 z%}<#$I#8W>tj?b5m+VAv-TJmb`J#)kesgLfPM)Od$FKX;(s{ByW$XD9R9=*Iw1&Ej zR|Mkkyx6-LG+*<(EH`uB1Qz#QA=GVyZ#V6}^?_j=pGNBHo2$`36J=6>Xd^LO_1+eB z=yu%g#Y;F2viG2#p;672%bvtgWM0vV>0Oik3ynMVI~I#dR~@ST1Eb7fb6@rQ0Y+lVR4?^$$$()& 3x more CPU. We may generally recommend using the :class:`TensorDictDatasetList` + + Note: + Check out the issue on tensordict for more details: + https://github.com/pytorch-labs/tensordict/issues/374. + """ + + def __init__(self, td: TensorDict): + self.data = td + + def __len__(self): + return len(self.data) + + def __getitems__(self, index): + # Tricks: + # - batched data loading with `__getitems__` for faster loading + # - avoid directly indexing TensorDicts for faster loading + return TensorDict( + {key: item[index] for key, item in self.data.items()}, + batch_size=torch.Size([len(index)]), + **td_kwargs, + ) + + def add_key(self, key, value): + self.data.update({key: value}) # native method + return self + + @staticmethod + def collate_fn(batch: Union[dict, TensorDict]): + """Equivalent to collating with `lambda x: x`""" + return batch diff --git a/rl4co/data/generate_data.py b/rl4co/data/generate_data.py new file mode 100644 index 00000000..5d837ba1 --- /dev/null +++ b/rl4co/data/generate_data.py @@ -0,0 +1,397 @@ +import argparse +import logging +import os +import sys + +from typing import List, Union + +import numpy as np + +from rl4co.data.utils import check_extension +from rl4co.utils.pylogger import get_pylogger + +log = 
get_pylogger(__name__) + + +DISTRIBUTIONS_PER_PROBLEM = { + "tsp": [None], + "vrp": [None], + "pctsp": [None], + "op": ["const", "unif", "dist"], + "mdpp": [None], + "pdp": [None], + "atsp": [None] +} + + +def generate_env_data(env_type, *args, **kwargs): + """Generate data for a given environment type in the form of a dictionary""" + try: + # breakpoint() + # remove all None values from args + args = [arg for arg in args if arg is not None] + + return getattr(sys.modules[__name__], f"generate_{env_type}_data")( + *args, **kwargs + ) + except AttributeError: + raise NotImplementedError(f"Environment type {env_type} not implemented") + + +def generate_tsp_data(dataset_size, tsp_size): + return { + "locs": np.random.uniform(size=(dataset_size, tsp_size, 2)).astype(np.float32) + } + + +def generate_vrp_data(dataset_size, vrp_size, capacities=None): + # From Kool et al. 2019, Hottung et al. 2022, Kim et al. 2023 + CAPACITIES = { + 10: 20.0, + 15: 25.0, + 20: 30.0, + 30: 33.0, + 40: 37.0, + 50: 40.0, + 60: 43.0, + 75: 45.0, + 100: 50.0, + 125: 55.0, + 150: 60.0, + 200: 70.0, + 500: 100.0, + 1000: 150.0, + } + + # If capacities are provided, replace keys in CAPACITIES with provided values if they exist + if capacities is not None: + for k, v in capacities.items(): + if k in CAPACITIES: + print(f"Replacing capacity for {k} with {v}") + CAPACITIES[k] = v + + return { + "depot": np.random.uniform(size=(dataset_size, 2)).astype( + np.float32 + ), # Depot location + "locs": np.random.uniform(size=(dataset_size, vrp_size, 2)).astype( + np.float32 + ), # Node locations + "demand": np.random.randint(1, 10, size=(dataset_size, vrp_size)).astype( + np.float32 + ), # Demand, uniform integer 1 ... 
9 + "capacity": np.full(dataset_size, CAPACITIES[vrp_size]).astype(np.float32), + } # Capacity, same for whole dataset + + +def generate_pdp_data(dataset_size, pdp_size): + depot = np.random.uniform(size=(dataset_size, 2)) + loc = np.random.uniform(size=(dataset_size, pdp_size, 2)) + return { + "locs": loc.astype(np.float32), + "depot": depot.astype(np.float32), + } + + +def generate_op_data(dataset_size, op_size, prize_type="const", max_lengths=None): + depot = np.random.uniform(size=(dataset_size, 2)) + loc = np.random.uniform(size=(dataset_size, op_size, 2)) + + # Methods taken from Fischetti et al. 1998 + if prize_type == "const": + prize = np.ones((dataset_size, op_size)) + elif prize_type == "unif": + prize = (1 + np.random.randint(0, 100, size=(dataset_size, op_size))) / 100.0 + else: # Based on distance to depot + assert prize_type == "dist" + prize_ = np.linalg.norm(depot[:, None, :] - loc, axis=-1) + prize = ( + 1 + (prize_ / prize_.max(axis=-1, keepdims=True) * 99).astype(int) + ) / 100.0 + + # Max length is approximately half of optimal TSP tour, such that half (a bit more) of the nodes can be visited + # which is maximally difficult as this has the largest number of possibilities + MAX_LENGTHS = {20: 2.0, 50: 3.0, 100: 4.0} + max_lengths = MAX_LENGTHS if max_lengths is None else max_lengths + + return { + "depot": depot.astype(np.float32), + "locs": loc.astype(np.float32), + "prize": prize.astype(np.float32), + "max_length": np.full(dataset_size, max_lengths[op_size]).astype(np.float32), + } + + +def generate_pctsp_data(dataset_size, pctsp_size, penalty_factor=3, max_lengths=None): + depot = np.random.uniform(size=(dataset_size, 2)) + loc = np.random.uniform(size=(dataset_size, pctsp_size, 2)) + + # For the penalty to make sense it should be not too large (in which case all nodes will be visited) nor too small + # so we want the objective term to be approximately equal to the length of the tour, which we estimate with half + # of the nodes by half of 
the tour length (which is very rough but similar to op) + # This means that the sum of penalties for all nodes will be approximately equal to the tour length (on average) + # The expected total (uniform) penalty of half of the nodes (since approx half will be visited by the constraint) + # is (n / 2) / 2 = n / 4 so divide by this means multiply by 4 / n, + # However instead of 4 we use penalty_factor (3 works well) so we can make them larger or smaller + MAX_LENGTHS = {20: 2.0, 50: 3.0, 100: 4.0} + max_lengths = MAX_LENGTHS if max_lengths is None else max_lengths + penalty_max = max_lengths[pctsp_size] * (penalty_factor) / float(pctsp_size) + penalty = np.random.uniform(size=(dataset_size, pctsp_size)) * penalty_max + + # Take uniform prizes + # Now expectation is 0.5 so expected total prize is n / 2, we want to force to visit approximately half of the nodes + # so the constraint will be that total prize >= (n / 2) / 2 = n / 4 + # equivalently, we divide all prizes by n / 4 and the total prize should be >= 1 + deterministic_prize = ( + np.random.uniform(size=(dataset_size, pctsp_size)) * 4 / float(pctsp_size) + ) + + # In the deterministic setting, the stochastic_prize is not used and the deterministic prize is known + # In the stochastic setting, the deterministic prize is the expected prize and is known up front but the + # stochastic prize is only revealed once the node is visited + # Stochastic prize is between (0, 2 * expected_prize) such that E(stochastic prize) = E(deterministic_prize) + stochastic_prize = ( + np.random.uniform(size=(dataset_size, pctsp_size)) * deterministic_prize * 2 + ) + + return { + "locs": loc.astype(np.float32), + "depot": depot.astype(np.float32), + "penalty": penalty.astype(np.float32), + "deterministic_prize": deterministic_prize.astype(np.float32), + "stochastic_prize": stochastic_prize.astype(np.float32), + } + + +def generate_mdpp_data( + dataset_size, + size=10, + num_probes_min=2, + num_probes_max=5, + num_keepout_min=1, + 
num_keepout_max=50, + lock_size=True, +): + """Generate data for the nDPP problem. + If `lock_size` is True, then the size if fixed and we skip the `size` argument if it is not 10. + This is because the RL environment is based on a real-world PCB (parametrized with data) + """ + if lock_size and size != 10: + # log.info("Locking size to 10, skipping generate_mdpp_data with size {}".format(size)) + return None + + bs = dataset_size # bs = batch_size to generate data in batch + m = n = size + if isinstance(bs, int): + bs = [bs] + + locs = np.stack(np.meshgrid(np.arange(m), np.arange(n)), axis=-1).reshape(-1, 2) + locs = locs / np.array([m, n], dtype=np.float32) + locs = np.expand_dims(locs, axis=0) + locs = np.repeat(locs, bs[0], axis=0) + + available = np.ones((bs[0], m * n), dtype=bool) + + probe = np.random.randint(0, high=m * n, size=(bs[0], 1)) + np.put_along_axis(available, probe, False, axis=1) + + num_probe = np.random.randint(num_probes_min, num_probes_max + 1, size=(bs[0], 1)) + probes = np.zeros((bs[0], m * n), dtype=bool) + for i in range(bs[0]): + p = np.random.choice(m * n, num_probe[i], replace=False) + np.put_along_axis(available[i], p, False, axis=0) + np.put_along_axis(probes[i], p, True, axis=0) + + num_keepout = np.random.randint(num_keepout_min, num_keepout_max + 1, size=(bs[0], 1)) + for i in range(bs[0]): + k = np.random.choice(m * n, num_keepout[i], replace=False) + np.put_along_axis(available[i], k, False, axis=0) + + return { + "locs": locs.astype(np.float32), + "probe": probes.astype(bool), + "action_mask": available.astype(bool), + } + +def generate_atsp_data(dataset_size, atsp_size, tmat_class: bool = True): + cost_matrix = np.random.uniform(size=(dataset_size, atsp_size, atsp_size)) + cost_matrix[..., np.arange(atsp_size), np.arange(atsp_size)] = 0 + if tmat_class: + for i in range(atsp_size): + cost_matrix = np.minimum(cost_matrix, cost_matrix[..., :, [i]] + cost_matrix[..., [i], :]) + return { + "cost_matrix": 
cost_matrix.astype(np.float32) + } + + +def generate_dataset( + filename: Union[str, List[str]] = None, + data_dir: str = "data", + name: str = None, + problem: Union[str, List[str]] = "all", + data_distribution: str = "all", + dataset_size: int = 10000, + graph_sizes: Union[int, List[int]] = [20, 50, 100], + overwrite: bool = False, + seed: int = 1234, + disable_warning: bool = True, + distributions_per_problem: Union[int, dict] = None, +): + """We keep a similar structure as in Kool et al. 2019 but save and load the data as npz + This is way faster and more memory efficient than pickle and also allows for easy transfer to TensorDict + + Args: + filename: Filename to save the data to. If None, the data is saved to data_dir/problem/problem_graph_size_seed.npz. Defaults to None. + data_dir: Directory to save the data to. Defaults to "data". + name: Name of the dataset. Defaults to None. + problem: Problem to generate data for. Defaults to "all". + data_distribution: Data distribution to generate data for. Defaults to "all". + dataset_size: Number of datasets to generate. Defaults to 10000. + graph_sizes: Graph size to generate data for. Defaults to [20, 50, 100]. + overwrite: Whether to overwrite existing files. Defaults to False. + seed: Random seed. Defaults to 1234. + disable_warning: Whether to disable warnings. Defaults to True. + distributions_per_problem: Number of distributions to generate per problem. Defaults to None. 
+ """ + + if isinstance(problem, list) and len(problem) == 1: + problem = problem[0] + + graph_sizes = [graph_sizes] if isinstance(graph_sizes, int) else graph_sizes + + if distributions_per_problem is None: + distributions_per_problem = DISTRIBUTIONS_PER_PROBLEM + + if problem == "all": + problems = distributions_per_problem + else: + problems = { + problem: distributions_per_problem[problem] + if data_distribution == "all" + else [data_distribution] + } + + # Support multiple filenames if necessary + filenames = [filename] if isinstance(filename, str) else filename + iter = 0 + + # Main loop for data generation. We loop over all problems, distributions and sizes + for problem, distributions in problems.items(): + for distribution in distributions or [None]: + for graph_size in graph_sizes: + if filename is None: + datadir = os.path.join(data_dir, problem) + os.makedirs(datadir, exist_ok=True) + fname = os.path.join( + datadir, + "{}{}{}_{}_seed{}.npz".format( + problem, + "_{}".format(distribution) + if distribution is not None + else "", + graph_size, + name, + seed, + ), + ) + else: + try: + fname = filenames[iter] + # make directory if necessary + os.makedirs(os.path.dirname(fname), exist_ok=True) + iter += 1 + except Exception: + raise ValueError( + "Number of filenames does not match number of problems" + ) + fname = check_extension(filename, extension=".npz") + + if not overwrite and os.path.isfile( + check_extension(fname, extension=".npz") + ): + if not disable_warning: + log.info( + "File {} already exists! Run with -f option to overwrite. 
Skipping...".format( + fname + ) + ) + continue + + # Set seed + np.random.seed(seed) + + # Automatically generate dataset + dataset = generate_env_data( + problem, dataset_size, graph_size, distribution + ) + + # A function can return None in case of an error or a skip + if dataset is not None: + # Save to disk as dict + log.info("Saving {} dataset to {}".format(problem, fname)) + np.savez(fname, **dataset) + + +def generate_default_datasets(data_dir, generate_eda=False): + """Generate the default datasets used in the paper and save them to data_dir/problem""" + generate_dataset(data_dir=data_dir, name="val", problem="all", seed=4321) + generate_dataset(data_dir=data_dir, name="test", problem="all", seed=1234) + + # By default, we skip the EDA datasets since they can easily be generated on the fly when needed + if generate_eda: + generate_dataset( + data_dir=data_dir, + name="test", + problem="mdpp", + seed=1234, + graph_sizes=[10], + dataset_size=100, + ) # EDA (mDPP) + + +if __name__ == "__main__": + parser = argparse.ArgumentParser() + parser.add_argument( + "--filename", help="Filename of the dataset to create (ignores datadir)" + ) + parser.add_argument( + "--data_dir", + default="data", + help="Create datasets in data_dir/problem (default 'data')", + ) + parser.add_argument( + "--name", type=str, required=True, help="Name to identify dataset" + ) + parser.add_argument( + "--problem", + type=str, + default="all", + help="Problem, 'tsp', 'vrp', 'pctsp' or 'op_const', 'op_unif' or 'op_dist'" + " or 'all' to generate all", + ) + parser.add_argument( + "--data_distribution", + type=str, + default="all", + help="Distributions to generate for problem, default 'all'.", + ) + parser.add_argument( + "--dataset_size", type=int, default=10000, help="Size of the dataset" + ) + parser.add_argument( + "--graph_sizes", + type=int, + nargs="+", + default=[20, 50, 100], + help="Sizes of problem instances (default 20, 50, 100)", + ) + parser.add_argument("-f", 
action="store_true", help="Set true to overwrite") + parser.add_argument("--seed", type=int, default=1234, help="Random seed") + parser.add_argument("--disable_warning", action="store_true", help="Disable warning") + args = parser.parse_args() + + logging.basicConfig(level=logging.INFO) + + args.overwrite = args.f + delattr(args, "f") + generate_dataset(**vars(args)) diff --git a/rl4co/data/transforms.py b/rl4co/data/transforms.py new file mode 100644 index 00000000..6fb8807e --- /dev/null +++ b/rl4co/data/transforms.py @@ -0,0 +1,150 @@ +import math +from typing import Union +import torch + +from tensordict.tensordict import TensorDict +from torch import Tensor + +from rl4co.utils.ops import batchify +from rl4co.utils.pylogger import get_pylogger + + +log = get_pylogger(__name__) + + +def dihedral_8_augmentation(xy: Tensor) -> Tensor: + """ + Augmentation (x8) for grid-based data (x, y) as done in POMO. + This is a Dihedral group of order 8 (rotations and reflections) + https://en.wikipedia.org/wiki/Examples_of_groups#dihedral_group_of_order_8 + + Args: + xy: [batch, graph, 2] tensor of x and y coordinates + """ + # [batch, graph, 2] + x, y = xy.split(1, dim=2) + # augmnetations [batch, graph, 2] + z0 = torch.cat((x, y), dim=2) + z1 = torch.cat((1 - x, y), dim=2) + z2 = torch.cat((x, 1 - y), dim=2) + z3 = torch.cat((1 - x, 1 - y), dim=2) + z4 = torch.cat((y, x), dim=2) + z5 = torch.cat((1 - y, x), dim=2) + z6 = torch.cat((y, 1 - x), dim=2) + z7 = torch.cat((1 - y, 1 - x), dim=2) + # [batch*8, graph, 2] + aug_xy = torch.cat((z0, z1, z2, z3, z4, z5, z6, z7), dim=0) + return aug_xy + + +def dihedral_8_augmentation_wrapper( + xy: Tensor, reduce: bool = True, *args, **kw +) -> Tensor: + """Wrapper for dihedral_8_augmentation. If reduce, only return the first 1/8 of the augmented data + since the augmentation augments the data 8 times. + """ + xy = xy[: xy.shape[0] // 8, ...] 
if reduce else xy + return dihedral_8_augmentation(xy) + + +def symmetric_transform(x: Tensor, y: Tensor, phi: Tensor, offset: float = 0.5): + """SR group transform with rotation and reflection + Like the one in SymNCO, but a vectorized version + + Args: + x: [batch, graph, 1] tensor of x coordinates + y: [batch, graph, 1] tensor of y coordinates + phi: [batch, 1] tensor of random rotation angles + offset: offset for x and y coordinates + """ + x, y = x - offset, y - offset + # random rotation + x_prime = torch.cos(phi) * x - torch.sin(phi) * y + y_prime = torch.sin(phi) * x + torch.cos(phi) * y + # make random reflection if phi > 2*pi (i.e. 50% of the time) + mask = phi > 2 * math.pi + # vectorized random reflection: swap axes x and y if mask + xy = torch.cat((x_prime, y_prime), dim=-1) + xy = torch.where(mask, xy.flip(-1), xy) + return xy + offset + + +def symmetric_augmentation(xy: Tensor, num_augment: int = 8, first_augment: bool = False): + """Augment xy data by `num_augment` times via symmetric rotation transform and concatenate to original data + + Args: + xy: [batch, graph, 2] tensor of x and y coordinates + num_augment: number of augmentations + first_augment: whether to augment the first data point + """ + # create random rotation angles (4*pi for reflection, 2*pi for rotation) + phi = torch.rand(xy.shape[0], device=xy.device) * 4 * math.pi + + # set phi to 0 for first , i.e. no augmentation as in SymNCO + if not first_augment: + phi[: xy.shape[0] // num_augment] = 0.0 + x, y = xy[..., [0]], xy[..., [1]] + return symmetric_transform(x, y, phi[:, None, None]) + + +def min_max_normalize(x): + return (x - x.min()) / (x.max() - x.min()) + + +def get_augment_function(augment_fn: Union[str, callable]): + if callable(augment_fn): + return augment_fn + if augment_fn == "dihedral8": + return dihedral_8_augmentation_wrapper + if augment_fn == "symmetric": + return symmetric_augmentation + raise ValueError(f"Unknown augment_fn: {augment_fn}. 
Available options: 'symmetric', 'dihedral8' or a custom callable") + + +class StateAugmentation(object): + """Augment state by N times via symmetric rotation/reflection transform + + Args: + num_augment: number of augmentations + augment_fn: augmentation function to use, e.g. 'symmetric' (default) or 'dihedral8', if callable, + then use the function directly. If 'dihedral8', then num_augment must be 8 + first_aug_identity: whether to augment the first data point too + normalize: whether to normalize the augmented data + feats: list of features to augment + """ + + def __init__( + self, + num_augment: int = 8, + augment_fn: Union[str, callable] = 'symmetric', + first_aug_identity: bool = True, + normalize: bool = False, + feats: list = None, + ): + self.augmentation = get_augment_function(augment_fn) + assert not ( + self.augmentation == dihedral_8_augmentation_wrapper and num_augment != 8 + ), "When using the `dihedral8` augmentation function, then num_augment must be 8" + + if feats is None: + log.info("Features not passed, defaulting to 'locs'") + self.feats = ["locs"] + else: + self.feats = feats + self.num_augment = num_augment + self.normalize = normalize + self.first_aug_identity = first_aug_identity + + def __call__(self, td: TensorDict) -> TensorDict: + td_aug = batchify(td, self.num_augment) + for feat in self.feats: + if not self.first_aug_identity: + init_aug_feat = td_aug[feat][list(td.size()), 0].clone() + aug_feat = self.augmentation(td_aug[feat], self.num_augment) + if self.normalize: + aug_feat = min_max_normalize(aug_feat) + if not self.first_aug_identity: + aug_feat[list(td.size()), 0] = init_aug_feat + td_aug[feat] = aug_feat + + return td_aug diff --git a/rl4co/data/utils.py b/rl4co/data/utils.py new file mode 100644 index 00000000..f8a1e288 --- /dev/null +++ b/rl4co/data/utils.py @@ -0,0 +1,71 @@ +import os + +import numpy as np + +from tensordict.tensordict import TensorDict + +CURR_DIR = os.path.dirname(os.path.abspath(__file__)) +ROOT_PATH = 
os.path.dirname(os.path.dirname(CURR_DIR)) + + +def load_npz_to_tensordict(filename): + """Load a npz file directly into a TensorDict + We assume that the npz file contains a dictionary of numpy arrays + This is at least an order of magnitude faster than pickle + """ + x = np.load(filename) + x_dict = dict(x) + batch_size = x_dict[list(x_dict.keys())[0]].shape[0] + return TensorDict(x_dict, batch_size=batch_size) + + +def save_tensordict_to_npz(tensordict, filename, compress: bool = False): + """Save a TensorDict to a npz file + We assume that the TensorDict contains a dictionary of tensors + """ + x_dict = {k: v.numpy() for k, v in tensordict.items()} + if compress: + np.savez_compressed(filename, **x_dict) + else: + np.savez(filename, **x_dict) + + +def check_extension(filename, extension=".npz"): + """Check that filename has extension, otherwise add it""" + if os.path.splitext(filename)[1] != extension: + return filename + extension + return filename + + +def load_solomon_instance(name, path=None, edge_weights=False): + """Load solomon instance from a file""" + import vrplib + + if not path: + path = "data/solomon/instances/" + path = os.path.join(ROOT_PATH, path) + if not os.path.isdir(path): + os.makedirs(path) + file_path = f"{path}{name}.txt" + if not os.path.isfile(file_path): + vrplib.download_instance(name=name, path=path) + return vrplib.read_instance( + path=file_path, + instance_format="solomon", + compute_edge_weights=edge_weights, + ) + + +def load_solomon_solution(name, path=None): + """Load solomon solution from a file""" + import vrplib + + if not path: + path = "data/solomon/solutions/" + path = os.path.join(ROOT_PATH, path) + if not os.path.isdir(path): + os.makedirs(path) + file_path = f"{path}{name}.sol" + if not os.path.isfile(file_path): + vrplib.download_solution(name=name, path=path) + return vrplib.read_solution(path=file_path) diff --git a/rl4co/envs/__init__.py b/rl4co/envs/__init__.py new file mode 100644 index 00000000..1c43a7d1 --- 
/dev/null +++ b/rl4co/envs/__init__.py @@ -0,0 +1,77 @@ +# Base environment +from rl4co.envs.common.base import RL4COEnvBase + +# EDA +from rl4co.envs.eda import DPPEnv, MDPPEnv + +# Graph +from rl4co.envs.graph import FLPEnv, MCPEnv + +# Routing +from rl4co.envs.routing import ( + ATSPEnv, + CVRPEnv, + CVRPTWEnv, + DenseRewardTSPEnv, + MDCPDPEnv, + MTSPEnv, + MTVRPEnv, + OPEnv, + PCTSPEnv, + PDPEnv, + PDPRuinRepairEnv, + SDVRPEnv, + SPCTSPEnv, + SVRPEnv, + TSPEnv, + TSPkoptEnv, +) + +# Scheduling +from rl4co.envs.scheduling import FFSPEnv, FJSPEnv, JSSPEnv, SMTWTPEnv + +# Register environments +ENV_REGISTRY = { + "atsp": ATSPEnv, + "cvrp": CVRPEnv, + "cvrptw": CVRPTWEnv, + "dpp": DPPEnv, + "ffsp": FFSPEnv, + "jssp": JSSPEnv, + "fjsp": FJSPEnv, + "mdpp": MDPPEnv, + "mtsp": MTSPEnv, + "op": OPEnv, + "pctsp": PCTSPEnv, + "pdp": PDPEnv, + "pdp_ruin_repair": PDPRuinRepairEnv, + "sdvrp": SDVRPEnv, + "svrp": SVRPEnv, + "spctsp": SPCTSPEnv, + "tsp": TSPEnv, + "smtwtp": SMTWTPEnv, + "mdcpdp": MDCPDPEnv, + "mtvrp": MTVRPEnv, + "tsp_kopt": TSPkoptEnv, + "mcp": MCPEnv, + "flp": FLPEnv, +} + + +def get_env(env_name: str, *args, **kwargs) -> RL4COEnvBase: + """Get environment by name. + + Args: + env_name: Environment name + *args: Positional arguments for environment + **kwargs: Keyword arguments for environment + + Returns: + Environment + """ + env_cls = ENV_REGISTRY.get(env_name, None) + if env_cls is None: + raise ValueError( + f"Unknown environment {env_name}. 
Available environments: {ENV_REGISTRY.keys()}" + ) + return env_cls(*args, **kwargs) diff --git a/rl4co/envs/common/__init__.py b/rl4co/envs/common/__init__.py new file mode 100644 index 00000000..20b8afba --- /dev/null +++ b/rl4co/envs/common/__init__.py @@ -0,0 +1,2 @@ +from .base import RL4COEnvBase +from .utils import Generator, get_sampler diff --git a/rl4co/envs/common/base.py b/rl4co/envs/common/base.py new file mode 100644 index 00000000..d2f4aa55 --- /dev/null +++ b/rl4co/envs/common/base.py @@ -0,0 +1,403 @@ +import abc + +from os.path import join as pjoin +from typing import Iterable, Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.envs import EnvBase + +from rl4co.data.dataset import TensorDictDataset +from rl4co.data.utils import load_npz_to_tensordict +from rl4co.utils.ops import get_num_starts, select_start_nodes +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class RL4COEnvBase(EnvBase, metaclass=abc.ABCMeta): + """Base class for RL4CO environments based on TorchRL EnvBase. + The environment has the usual methods for stepping, resetting, and getting the specifications of the environment + that shoud be implemented by the subclasses of this class. + It also has methods for getting the reward, action mask, and checking the validity of the solution, and + for generating and loading the datasets (supporting multiple dataloaders as well for validation and testing). 
+ + Args: + data_dir: Root directory for the dataset + train_file: Name of the training file + val_file: Name of the validation file + test_file: Name of the test file + val_dataloader_names: Names of the dataloaders to use for validation + test_dataloader_names: Names of the dataloaders to use for testing + check_solution: Whether to check the validity of the solution at the end of the episode + dataset_cls: Dataset class to use for the environment (which can influence performance) + seed: Seed for the environment + device: Device to use. Generally, no need to set as tensors are updated on the fly + batch_size: Batch size to use for the environment. Generally, no need to set as tensors are updated on the fly + run_type_checks: If True, run type checks on the TensorDicts at each step + allow_done_after_reset: If True, an environment can be done after a reset + _torchrl_mode: Whether to use the TorchRL mode (see :meth:`step` for more details) + """ + + batch_locked = False + + def __init__( + self, + *, + data_dir: str = "data/", + train_file: str = None, + val_file: str = None, + test_file: str = None, + val_dataloader_names: list = None, + test_dataloader_names: list = None, + check_solution: bool = True, + dataset_cls: callable = TensorDictDataset, + seed: int = None, + device: str = "cpu", + batch_size: torch.Size = None, + run_type_checks: bool = False, + allow_done_after_reset: bool = False, + _torchrl_mode: bool = False, + **kwargs, + ): + super().__init__( + device=device, + batch_size=batch_size, + run_type_checks=run_type_checks, + allow_done_after_reset=allow_done_after_reset, + ) + # if any kwargs are left, we want to warn the user + kwargs.pop("name", None) # we remove the name for checking + if kwargs: + log.error( + f"Unused keyword arguments: {', '.join(kwargs.keys())}. " + "Please check the base class documentation at https://rl4co.readthedocs.io/en/latest/_content/api/envs/base.html. 
" + "In case you would like to pass data generation arguments, please pass a `generator` method instead " + "or for example: `generator_kwargs=dict(num_loc=50)` to the constructor." + ) + self.data_dir = data_dir + self.train_file = pjoin(data_dir, train_file) if train_file is not None else None + self._torchrl_mode = _torchrl_mode + self.dataset_cls = dataset_cls + + def get_files(f): + if f is not None: + if isinstance(f, Iterable) and not isinstance(f, str): + return [pjoin(data_dir, _f) for _f in f] + else: + return pjoin(data_dir, f) + return None + + def get_multiple_dataloader_names(f, names): + if f is not None: + if isinstance(f, Iterable) and not isinstance(f, str): + if names is None: + names = [f"{i}" for i in range(len(f))] + else: + assert len(names) == len( + f + ), "Number of dataloader names must match number of files" + else: + if names is not None: + log.warning( + "Ignoring dataloader names since only one dataloader is provided" + ) + return names + + self.val_file = get_files(val_file) + self.test_file = get_files(test_file) + self.val_dataloader_names = get_multiple_dataloader_names( + self.val_file, val_dataloader_names + ) + self.test_dataloader_names = get_multiple_dataloader_names( + self.test_file, test_dataloader_names + ) + self.check_solution = check_solution + if seed is None: + seed = torch.empty((), dtype=torch.int64).random_().item() + self.set_seed(seed) + + def step(self, td: TensorDict) -> TensorDict: + """Step function to call at each step of the episode containing an action. 
+ If `_torchrl_mode` is True, we call `_torchrl_step` instead which set the + `next` key of the TensorDict to the next state - this is the usual way to do it in TorchRL, + but inefficient in our case + """ + if not self._torchrl_mode: + # Default: just return the TensorDict without farther checks etc is faster + td = self._step(td) + return {"next": td} + else: + # Since we simplify the syntax + return self._torchrl_step(td) + + def reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + """Reset function to call at the beginning of each episode""" + if batch_size is None: + batch_size = self.batch_size if td is None else td.batch_size + if td is None or td.is_empty(): + td = self.generator(batch_size=batch_size) + batch_size = [batch_size] if isinstance(batch_size, int) else batch_size + self.to(td.device) + return super().reset(td, batch_size=batch_size) + + def _torchrl_step(self, td: TensorDict) -> TensorDict: + """See :meth:`super().step` for more details. + This is the usual way to do it in TorchRL, but inefficient in our case + + Note: + Here we clone the TensorDict to avoid recursion error, since we allow + for directly updating the TensorDict in the step function + """ + # sanity check + self._assert_tensordict_shape(td) + next_preset = td.get("next", None) + + next_tensordict = self._step( + td.clone() + ) # NOTE: we clone to avoid recursion error + next_tensordict = self._step_proc_data(next_tensordict) + if next_preset is not None: + next_tensordict.update(next_preset.exclude(*next_tensordict.keys(True, True))) + td.set("next", next_tensordict) + return td + + @abc.abstractmethod + def _step(self, td: TensorDict) -> TensorDict: + """Step function to call at each step of the episode containing an action. 
+ Gives the next observation, reward, done + """ + raise NotImplementedError + + @abc.abstractmethod + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + """Reset function to call at the beginning of each episode""" + raise NotImplementedError + + def _make_spec(self, td_params: TensorDict = None): + """Make the specifications of the environment (observation, action, reward, done)""" + raise NotImplementedError + + def get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor: + """Function to compute the reward. Can be called by the agent to compute the reward of the current state + This is faster than calling step() and getting the reward from the returned TensorDict at each time for CO tasks + """ + if self.check_solution: + self.check_solution_validity(td, actions) + return self._get_reward(td, actions) + + @abc.abstractmethod + def _get_reward(self, td, actions) -> TensorDict: + """Function to compute the reward. Can be called by the agent to compute the reward of the current state + This is faster than calling step() and getting the reward from the returned TensorDict at each time for CO tasks + """ + raise NotImplementedError + + def get_action_mask(self, td: TensorDict) -> torch.Tensor: + """Function to compute the action mask (feasible actions) for the current state + Action mask is 1 if the action is feasible, 0 otherwise + """ + raise NotImplementedError + + def get_num_starts(self, td): + return get_num_starts(td, self.name) + + def select_start_nodes(self, td, num_starts): + return select_start_nodes(td, self, num_starts) + + def check_solution_validity(self, td: TensorDict, actions: torch.Tensor) -> None: + """Function to check whether the solution is valid. Can be called by the agent to check the validity of the current state + This is called with the full solution (i.e. 
all actions) at the end of the episode + """ + raise NotImplementedError + + def replace_selected_actions( + self, + cur_actions: torch.Tensor, + new_actions: torch.Tensor, + selection_mask: torch.Tensor, + ) -> torch.Tensor: + """ + Replace selected current actions with updated actions based on `selection_mask`. + """ + raise NotImplementedError + + def local_search( + self, td: TensorDict, actions: torch.Tensor, **kwargs + ) -> torch.Tensor: + """Function to improve the solution. Can be called by the agent to improve the current state + This is called with the full solution (i.e. all actions) at the end of the episode + """ + raise NotImplementedError( + f"Local is not implemented yet for {self.name} environment" + ) + + def dataset(self, batch_size=[], phase="train", filename=None): + """Return a dataset of observations + Generates the dataset if it does not exist, otherwise loads it from file + """ + if filename is not None: + log.info(f"Overriding dataset filename from {filename}") + f = getattr(self, f"{phase}_file") if filename is None else filename + if f is None: + if phase != "train": + log.warning(f"{phase}_file not set. Generating dataset instead") + td = self.generator(batch_size) + else: + log.info(f"Loading {phase} dataset from {f}") + if phase == "train": + log.warning( + "Loading training dataset from file. This may not be desired in RL since " + "the dataset is fixed and the agent will not be able to explore new states" + ) + try: + if isinstance(f, Iterable) and not isinstance(f, str): + names = getattr(self, f"{phase}_dataloader_names") + return { + name: self.dataset_cls(self.load_data(_f, batch_size)) + for name, _f in zip(names, f) + } + else: + td = self.load_data(f, batch_size) + except FileNotFoundError: + log.error( + f"Provided file name {f} not found. 
Make sure to provide a file in the right path first or " + f"unset {phase}_file to generate data automatically instead" + ) + td = self.generator(batch_size) + + return self.dataset_cls(td) + + def transform(self): + """Used for converting TensorDict variables (such as with torch.cat) efficiently + https://pytorch.org/rl/reference/generated/torchrl.envs.transforms.Transform.html + By default, we do not need to transform the environment since we use specific embeddings + """ + return self + + def render(self, *args, **kwargs): + """Render the environment""" + raise NotImplementedError + + @staticmethod + def load_data(fpath, batch_size=[]): + """Dataset loading from file""" + return load_npz_to_tensordict(fpath) + + def _set_seed(self, seed: Optional[int]): + """Set the seed for the environment""" + rng = torch.manual_seed(seed) + self.rng = rng + + def to(self, device): + """Override `to` device method for safety against `None` device (may be found in `TensorDict`)""" + if device is None: + return self + else: + return super().to(device) + + @staticmethod + def solve( + instances: TensorDict, + max_runtime: float, + num_procs: int = 1, + **kwargs, + ) -> tuple[torch.Tensor, torch.Tensor]: + """Classical solver for the environment. This is a wrapper for the baselines solver. + + Args: + instances: The instances to solve + max_runtime: The maximum runtime for the solver + num_procs: The number of processes to use + + Returns: + A tuple containing the action and the cost, respectively + """ + raise NotImplementedError + + def __getstate__(self): + """Return the state of the environment. By default, we want to avoid pickling + the random number generator directly as it is not allowed by `deepcopy` + """ + state = self.__dict__.copy() + state["rng"] = state["rng"].get_state() + return state + + def __setstate__(self, state): + """Set the state of the environment. 
By default, we want to avoid pickling + the random number generator directly as it is not allowed by `deepcopy` + """ + self.__dict__.update(state) + self.rng = torch.manual_seed(0) + self.rng.set_state(state["rng"]) + + +class ImprovementEnvBase(RL4COEnvBase, metaclass=abc.ABCMeta): + """Base class for Improvement environments based on RL4CO EnvBase. + Note that this class assumes that the solution is stored in a linked list format. + Here, if `rec[i] = j`, it means the node `i` is connected to node `j`, i.e., edge `i-j` is in the solution. + For example, if edge `0-1`, edge `1-5`, edge `2-10` are in the solution, so we have `rec[0]=1`, `rec[1]=5` and `rec[2]=10`. + Kindly see https://github.com/yining043/VRP-DACT/blob/new_version/Play_with_DACT.ipynb for an example at the end for TSP. + """ + + def __init__( + self, + **kwargs, + ): + super().__init__(**kwargs) + + @abc.abstractmethod + def _step(self, td: TensorDict, solution_to=None) -> TensorDict: + raise NotImplementedError + + def step_to_solution(self, td, solution) -> TensorDict: + return self._step(td, solution_to=solution) + + @staticmethod + def _get_reward(td, actions) -> TensorDict: + raise NotImplementedError( + "This function is not used for improvement tasks since the reward is computed per step" + ) + + @staticmethod + def get_costs(coordinates, rec): + batch_size, size = rec.size() + + # calculate the route length value + d1 = coordinates.gather(1, rec.long().unsqueeze(-1).expand(batch_size, size, 2)) + d2 = coordinates + length = (d1 - d2).norm(p=2, dim=2).sum(1) + + return length + + @staticmethod + def _get_real_solution(rec): + batch_size, seq_length = rec.size() + visited_time = torch.zeros((batch_size, seq_length)).to(rec.device) + pre = torch.zeros((batch_size), device=rec.device).long() + for i in range(seq_length): + visited_time[torch.arange(batch_size), rec[torch.arange(batch_size), pre]] = ( + i + 1 + ) + pre = rec[torch.arange(batch_size), pre] + + visited_time = visited_time % 
seq_length + return visited_time.argsort() + + @staticmethod + def _get_linked_list_solution(solution): + solution_pre = solution + solution_post = torch.cat((solution[:, 1:], solution[:, :1]), 1) + + rec = solution.clone() + rec.scatter_(1, solution_pre, solution_post) + return rec + + @classmethod + def get_best_solution(cls, td): + return cls._get_real_solution(td["rec_best"]) + + @classmethod + def get_current_solution(cls, td): + return cls._get_real_solution(td["rec_current"]) diff --git a/rl4co/envs/common/distribution_utils.py b/rl4co/envs/common/distribution_utils.py new file mode 100644 index 00000000..ab8e1449 --- /dev/null +++ b/rl4co/envs/common/distribution_utils.py @@ -0,0 +1,292 @@ +import random + +import torch + + +class Cluster: + """ + Multiple gaussian distributed clusters, as in the Solomon benchmark dataset + Following the setting in Bi et al. 2022 (https://arxiv.org/abs/2210.07686) + + Args: + n_cluster: Number of the gaussian distributed clusters + """ + + def __init__(self, n_cluster: int = 3): + super().__init__() + self.lower, self.upper = 0.2, 0.8 + self.std = 0.07 + self.n_cluster = n_cluster + + def sample(self, size): + + batch_size, num_loc, _ = size + + # Generate the centers of the clusters + center = self.lower + (self.upper - self.lower) * torch.rand( + batch_size, self.n_cluster * 2 + ) + + # Pre-define the coordinates + coords = torch.zeros(batch_size, num_loc, 2) + + # Calculate the size of each cluster + cluster_sizes = [num_loc // self.n_cluster] * self.n_cluster + for i in range(num_loc % self.n_cluster): + cluster_sizes[i] += 1 + + # Generate the coordinates + current_index = 0 + for i in range(self.n_cluster): + means = center[:, i * 2 : (i + 1) * 2] + stds = torch.full((batch_size, 2), self.std) + points = torch.normal( + means.unsqueeze(1).expand(-1, cluster_sizes[i], -1), + stds.unsqueeze(1).expand(-1, cluster_sizes[i], -1), + ) + coords[:, current_index : current_index + cluster_sizes[i], :] = points + current_index 
+= cluster_sizes[i] + + # Confine the coordinates to range [0, 1] + coords.clamp_(0, 1) + + return coords + + +class Mixed: + """ + 50% nodes sampled from uniform distribution, 50% nodes sampled from gaussian distribution, as in the Solomon benchmark dataset + Following the setting in Bi et al. 2022 (https://arxiv.org/abs/2210.07686) + + Args: + n_cluster_mix: Number of the gaussian distributed clusters + """ + + def __init__(self, n_cluster_mix=1): + super().__init__() + self.lower, self.upper = 0.2, 0.8 + self.std = 0.07 + self.n_cluster_mix = n_cluster_mix + + def sample(self, size): + + batch_size, num_loc, _ = size + + # Generate the centers of the clusters + center = self.lower + (self.upper - self.lower) * torch.rand( + batch_size, self.n_cluster_mix * 2 + ) + + # Pre-define the coordinates sampled under uniform distribution + coords = torch.FloatTensor(batch_size, num_loc, 2).uniform_(0, 1) + + # Sample mutated index (default setting: 50% mutation) + mutate_idx = torch.stack( + [torch.randperm(num_loc)[: num_loc // 2] for _ in range(batch_size)] + ) + + # Generate the coordinates + segment_size = num_loc // (2 * self.n_cluster_mix) + remaining_indices = num_loc // 2 - segment_size * (self.n_cluster_mix - 1) + sizes = [segment_size] * (self.n_cluster_mix - 1) + [remaining_indices] + for i in range(self.n_cluster_mix): + indices = mutate_idx[:, sum(sizes[:i]) : sum(sizes[: i + 1])] + means_x = center[:, 2 * i].unsqueeze(1).expand(-1, sizes[i]) + means_y = center[:, 2 * i + 1].unsqueeze(1).expand(-1, sizes[i]) + coords.scatter_( + 1, + indices.unsqueeze(-1).expand(-1, -1, 2), + torch.stack( + [ + torch.normal(means_x.expand(-1, sizes[i]), self.std), + torch.normal(means_y.expand(-1, sizes[i]), self.std), + ], + dim=2, + ), + ) + + # Confine the coordinates to range [0, 1] + coords.clamp_(0, 1) + + return coords + + +class Gaussian_Mixture: + """ + Following Zhou et al. 
(2023): https://arxiv.org/abs/2305.19587 + + Args: + num_modes: the number of clusters/modes in the Gaussian Mixture. + cdist: scale of the uniform distribution for center generation. + """ + + def __init__(self, num_modes: int = 0, cdist: int = 0): + super().__init__() + self.num_modes = num_modes + self.cdist = cdist + + def sample(self, size): + + batch_size, num_loc, _ = size + + if self.num_modes == 0: # (0, 0) - uniform + return torch.rand((batch_size, num_loc, 2)) + elif self.num_modes == 1 and self.cdist == 1: # (1, 1) - gaussian + return self.generate_gaussian(batch_size, num_loc) + else: + res = [self.generate_gaussian_mixture(num_loc) for _ in range(batch_size)] + return torch.stack(res) + + def generate_gaussian_mixture(self, num_loc): + """Following the setting in Zhang et al. 2022 (https://arxiv.org/abs/2204.03236)""" + + # Randomly decide how many points each mode gets + nums = torch.multinomial( + input=torch.ones(self.num_modes) / self.num_modes, + num_samples=num_loc, + replacement=True, + ) + + # Prepare to collect points + coords = torch.empty((0, 2)) + + # Generate points for each mode + for i in range(self.num_modes): + num = (nums == i).sum() # Number of points in this mode + if num > 0: + center = torch.rand((1, 2)) * self.cdist + cov = torch.eye(2) # Covariance matrix + nxy = torch.distributions.MultivariateNormal( + center.squeeze(), covariance_matrix=cov + ).sample((num,)) + coords = torch.cat((coords, nxy), dim=0) + + return self._global_min_max_scaling(coords) + + def generate_gaussian(self, batch_size, num_loc): + """Following the setting in Xin et al. 
2022 (https://openreview.net/pdf?id=nJuzV-izmPJ)""" + + # Mean and random covariances + mean = torch.full((batch_size, num_loc, 2), 0.5) + covs = torch.rand(batch_size) # Random covariances between 0 and 1 + + # Generate the coordinates + coords = torch.zeros((batch_size, num_loc, 2)) + for i in range(batch_size): + # Construct covariance matrix for each sample + cov_matrix = torch.tensor([[1.0, covs[i]], [covs[i], 1.0]]) + m = torch.distributions.MultivariateNormal( + mean[i], covariance_matrix=cov_matrix + ) + coords[i] = m.sample() + + # Shuffle the coordinates + indices = torch.randperm(coords.size(0)) + coords = coords[indices] + + return self._batch_normalize_and_center(coords) + + def _global_min_max_scaling(self, coords): + + # Scale the points to [0, 1] using min-max scaling + coords_min = coords.min(0, keepdim=True).values + coords_max = coords.max(0, keepdim=True).values + coords = (coords - coords_min) / (coords_max - coords_min) + + return coords + + def _batch_normalize_and_center(self, coords): + # Step 1: Compute min and max along each batch + coords_min = coords.min(dim=1, keepdim=True).values + coords_max = coords.max(dim=1, keepdim=True).values + + # Step 2: Normalize coordinates to range [0, 1] + coords = ( + coords - coords_min + ) # Broadcasting subtracts min value on each coordinate + range_max = ( + (coords_max - coords_min).max(dim=-1, keepdim=True).values + ) # The maximum range among both coordinates + coords = coords / range_max # Divide by the max range to normalize + + # Step 3: Center the batch in the middle of the [0, 1] range + coords = ( + coords + (1 - coords.max(dim=1, keepdim=True).values) / 2 + ) # Centering the batch + + return coords + + +class Mix_Distribution: + """ + Mixture of three exemplar distributions in batch-level, i.e. Uniform, Cluster, Mixed + Following the setting in Bi et al. 
2022 (https://arxiv.org/abs/2210.07686) + + Args: + n_cluster: Number of the gaussian distributed clusters in Cluster distribution + n_cluster_mix: Number of the gaussian distributed clusters in Mixed distribution + """ + + def __init__(self, n_cluster=3, n_cluster_mix=1): + super().__init__() + self.lower, self.upper = 0.2, 0.8 + self.std = 0.07 + self.Mixed = Mixed(n_cluster_mix=n_cluster_mix) + self.Cluster = Cluster(n_cluster=n_cluster) + + def sample(self, size): + + batch_size, num_loc, _ = size + + # Pre-define the coordinates sampled under uniform distribution + coords = torch.FloatTensor(batch_size, num_loc, 2).uniform_(0, 1) + + # Random sample probability for the distribution of each sample + p = torch.rand(batch_size) + + # Mixed + mask = p <= 0.33 + n_mixed = mask.sum().item() + if n_mixed > 0: + coords[mask] = self.Mixed.sample((n_mixed, num_loc, 2)) + + # Cluster + mask = (p > 0.33) & (p <= 0.66) + n_cluster = mask.sum().item() + if n_cluster > 0: + coords[mask] = self.Cluster.sample((n_cluster, num_loc, 2)) + + # The remaining ones are uniformly distributed + return coords + + +class Mix_Multi_Distributions: + """ + Mixture of 11 Gaussian-like distributions in batch-level + Following the setting in Zhou et al. 
(2023): https://arxiv.org/abs/2305.19587 + """ + + def __init__(self): + super().__init__() + self.dist_set = [(0, 0), (1, 1)] + [ + (m, c) for m in [3, 5, 7] for c in [10, 30, 50] + ] + + def sample(self, size): + batch_size, num_loc, _ = size + coords = torch.zeros(batch_size, num_loc, 2) + + # Pre-select distributions for the entire batch + dists = [random.choice(self.dist_set) for _ in range(batch_size)] + unique_dists = list( + set(dists) + ) # Unique distributions to minimize re-instantiation + + # Instantiate Gaussian_Mixture only once per unique distribution + gm_instances = {dist: Gaussian_Mixture(*dist) for dist in unique_dists} + + # Batch process where possible + for i, dist in enumerate(dists): + coords[i] = gm_instances[dist].sample((1, num_loc, 2)).squeeze(0) + + return coords diff --git a/rl4co/envs/common/utils.py b/rl4co/envs/common/utils.py new file mode 100644 index 00000000..413742d0 --- /dev/null +++ b/rl4co/envs/common/utils.py @@ -0,0 +1,109 @@ +import abc + +from typing import Callable, Union + +import torch + +from tensordict.tensordict import TensorDict +from torch.distributions import Exponential, Normal, Poisson, Uniform + +from rl4co.envs.common.distribution_utils import ( + Cluster, + Gaussian_Mixture, + Mix_Distribution, + Mix_Multi_Distributions, + Mixed, +) + + +class Generator(metaclass=abc.ABCMeta): + """Base data generator class, to be called with `env.generator(batch_size)`""" + + def __init__(self, **kwargs): + self.kwargs = kwargs + + def __call__(self, batch_size) -> TensorDict: + batch_size = [batch_size] if isinstance(batch_size, int) else batch_size + return self._generate(batch_size) + + @abc.abstractmethod + def _generate(self, batch_size, **kwargs) -> TensorDict: + raise NotImplementedError + + +def get_sampler( + val_name: str, + distribution: Union[int, float, str, type, Callable], + low: float = 0, + high: float = 1.0, + **kwargs, +): + """Get the sampler for the variable with the given distribution. 
+ If kwargs are passed, they will be parsed e.g. with `val_name` + `_dist_arg` (e.g. `loc_std` for Normal distribution). + + Args: + val_name: Name of the variable + distribution: int/float value (as constant distribution), or string with the distribution name (supporting + uniform, normal, exponential, and poisson) or PyTorch Distribution type or a callable function that + returns a PyTorch Distribution + low: Minimum value for the variable, used for Uniform distribution + high: Maximum value for the variable, used for Uniform distribution + kwargs: Additional arguments for the distribution + + Example: + ```python + sampler_uniform = get_sampler("loc", "uniform", 0, 1) + sampler_normal = get_sampler("loc", "normal", loc_mean=0.5, loc_std=.2) + ``` + """ + if isinstance(distribution, (int, float)): + return Uniform(low=distribution, high=distribution) + elif distribution == Uniform or distribution == "uniform": + return Uniform(low=low, high=high) + elif distribution == Normal or distribution == "normal" or distribution == "gaussian": + assert ( + kwargs.get(val_name + "_mean", None) is not None + ), "mean is required for Normal distribution" + assert ( + kwargs.get(val_name + "_std", None) is not None + ), "std is required for Normal distribution" + return Normal(loc=kwargs[val_name + "_mean"], scale=kwargs[val_name + "_std"]) + elif distribution == Exponential or distribution == "exponential": + assert ( + kwargs.get(val_name + "_rate", None) is not None + ), "rate is required for Exponential/Poisson distribution" + return Exponential(rate=kwargs[val_name + "_rate"]) + elif distribution == Poisson or distribution == "poisson": + assert ( + kwargs.get(val_name + "_rate", None) is not None + ), "rate is required for Exponential/Poisson distribution" + return Poisson(rate=kwargs[val_name + "_rate"]) + elif distribution == "center": + return Uniform(low=(high - low) / 2, high=(high - low) / 2) + elif distribution == "corner": + return Uniform( + low=low, high=low + 
) # todo: should be also `low, high` and any other corner + elif isinstance(distribution, Callable): + return distribution(**kwargs) + elif distribution == "gaussian_mixture": + return Gaussian_Mixture(num_modes=kwargs["num_modes"], cdist=kwargs["cdist"]) + elif distribution == "cluster": + return Cluster(kwargs["n_cluster"]) + elif distribution == "mixed": + return Mixed(kwargs["n_cluster_mix"]) + elif distribution == "mix_distribution": + return Mix_Distribution(kwargs["n_cluster"], kwargs["n_cluster_mix"]) + elif distribution == "mix_multi_distributions": + return Mix_Multi_Distributions() + else: + raise ValueError(f"Invalid distribution type of {distribution}") + + +def batch_to_scalar(param): + """Return first element if in batch. Used for batched parameters that are the same for all elements in the batch.""" + if len(param.shape) > 0: + return param[0].item() + if isinstance(param, torch.Tensor): + return param.item() + return param diff --git a/rl4co/envs/eda/__init__.py b/rl4co/envs/eda/__init__.py new file mode 100644 index 00000000..ce8f2f8c --- /dev/null +++ b/rl4co/envs/eda/__init__.py @@ -0,0 +1,2 @@ +from rl4co.envs.eda.dpp.env import DPPEnv +from rl4co.envs.eda.mdpp.env import MDPPEnv diff --git a/rl4co/envs/eda/dpp/__init__.py b/rl4co/envs/eda/dpp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/eda/dpp/env.py b/rl4co/envs/eda/dpp/env.py new file mode 100644 index 00000000..10def833 --- /dev/null +++ b/rl4co/envs/eda/dpp/env.py @@ -0,0 +1,251 @@ +import os + +from typing import Optional + +import numpy as np +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.utils.pylogger import get_pylogger + +from .generator import DPPGenerator + +log = get_pylogger(__name__) + + +class DPPEnv(RL4COEnvBase): + """Decap Placement Problem (DPP) as done in DevFormer paper: https://arxiv.org/abs/2205.13225 
+ + The environment is a 10x10 grid with 100 locations containing either a probing port or a keepout region. + The goal is to place decaps (decoupling capacitors) to maximize the impedance suppression at the probing port. + Decaps cannot be placed in keepout regions or at the probing port and the number of decaps is limited. + + Observations: + - locations of the probing port and keepout regions + - current decap placement + - remaining decaps + + Constraints: + - decaps cannot be placed at the probing port or keepout regions + - the number of decaps is limited + + Finish Condition: + - the number of decaps exceeds the limit + + Reward: + - the impedance suppression at the probing port + + Args: + generator: DPPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "dpp" + + def __init__( + self, + generator: DPPGenerator = None, + generator_params: dict = {}, + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = DPPGenerator(**generator_params) + self.generator = generator + + self.max_decaps = self.generator.max_decaps + self.size = self.generator.size + self.raw_pdn = self.generator.raw_pdn + self.decap = self.generator.decap + self.freq = self.generator.freq + self.num_freq = self.generator.num_freq + self.data_dir = self.generator.data_dir + + self._make_spec(self.generator) + + def _step(self, td: TensorDict) -> TensorDict: + current_node = td["action"] + + # Set available to 0 (i.e., already placed) if the current node is the first node + available = td["action_mask"].scatter( + -1, current_node.unsqueeze(-1).expand_as(td["action_mask"]), 0 + ) + + # Set done if i is greater than max_decaps + done = td["i"] >= self.max_decaps - 1 + + # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here + reward = torch.zeros_like(done) + + td.update( + { + "i": td["i"] + 1, + "action_mask": available, + "reward": reward, + "done": done, + } + ) + return td + 
+ def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + device = td.device + + # Other variables + i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) + + return TensorDict( + { + "locs": td["locs"], + "probe": td["probe"], + "i": i, + "action_mask": td["action_mask"], + "keepout": ~td["action_mask"], + }, + batch_size=batch_size, + ) + + def _make_spec(self, generator: DPPGenerator): + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.size**2, 2), + dtype=torch.float32, + ), + probe=Unbounded( + shape=(1), + dtype=torch.int64, + ), + keepout=Unbounded( + shape=(generator.size**2), + dtype=torch.bool, + ), + i=Unbounded( + shape=(1), + dtype=torch.int64, + ), + action_mask=Unbounded( + shape=(generator.size**2), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.size**2, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + def _get_reward(self, td, actions): + """ + We call the reward function with the final sequence of actions to get the reward + Calling per-step would be very time consuming due to decap simulation + """ + # We do the operation in a batch + if len(td.batch_size) == 0: + td = td.unsqueeze(0) + actions = actions.unsqueeze(0) + probes = td["probe"] + reward = torch.stack( + [self._decap_simulator(p, a) for p, a in zip(probes, actions)] + ) + return reward + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor): + assert True, "Not implemented" + + def _decap_placement(self, pi, probe): + device = pi.device + + n = m = self.size # columns and rows + num_decap = torch.numel(pi) + z1 = self.raw_pdn.to(device) + + decap = self.decap.reshape(-1).to(device) + z2 = torch.zeros( + (self.num_freq, num_decap, num_decap), dtype=torch.float32, device=device + ) + + qIndx = 
torch.arange(num_decap, device=device) + + z2[:, qIndx, qIndx] = torch.abs(decap)[:, None].repeat_interleave( + z2[:, qIndx, qIndx].shape[-1], dim=-1 + ) + pIndx = pi.long() + + aIndx = torch.arange(len(z1[0]), device=device) + aIndx = torch.tensor( + list(set(aIndx.tolist()) - set(pIndx.tolist())), device=device + ) + + z1aa = z1[:, aIndx, :][:, :, aIndx] + z1ap = z1[:, aIndx, :][:, :, pIndx] + z1pa = z1[:, pIndx, :][:, :, aIndx] + z1pp = z1[:, pIndx, :][:, :, pIndx] + z2qq = z2[:, qIndx, :][:, :, qIndx] + + zout = z1aa - torch.matmul(torch.matmul(z1ap, torch.inverse(z1pp + z2qq)), z1pa) + + idx = torch.arange(n * m, device=device) + mask = torch.zeros(n * m, device=device).bool() + mask[pi] = True + mask = mask & (idx < probe) + probe -= mask.sum().item() + + zout = zout[:, probe, probe] + return zout + + def _decap_model(self, z_initial, z_final): + impedance_gap = torch.zeros(self.num_freq, device=self.device) + + impedance_gap = z_initial - z_final + reward = torch.sum(impedance_gap * 1000000000 / self.freq.to(self.device)) + + reward = reward / 10 + return reward + + def _initial_impedance(self, probe): + zout = self.raw_pdn.to(self.device)[:, probe, probe] + return zout + + def _decap_simulator(self, probe, solution, keepout=None): + self.to(self.device) + + probe = probe.item() + + assert len(solution) == len( + torch.unique(solution) + ), "An Element of Decap Sequence must be Unique" + + if keepout is not None: + keepout = torch.tensor(keepout) + intersect = torch.tensor(list(set(solution.tolist()) & set(keepout.tolist()))) + assert len(intersect) == 0, "Decap must be not placed at the keepout region" + + z_initial = self._initial_impedance(probe) + z_initial = torch.abs(z_initial) + z_final = self._decap_placement(solution, probe) + z_final = torch.abs(z_final) + reward = self._decap_model(z_initial, z_final) + return reward + + def _load_dpp_data(self, chip_file, decap_file, freq_file): + def _load_file(fpath): + f = os.path.join(self.generator.data_dir, 
fpath) + if not os.path.isfile(f): + self._download_data() + with open(f, "rb") as f_: + return torch.from_numpy(np.load(f_)).to(self.device) + + self.raw_pdn = _load_file(chip_file) # [num_freq, size^2, size^2] + self.decap = _load_file(decap_file).to(torch.complex64) # [num_freq, 1, 1] + self.freq = _load_file(freq_file) # [num_freq] + self.size = int(np.sqrt(self.raw_pdn.shape[-1])) + self.num_freq = self.freq.shape[0] diff --git a/rl4co/envs/eda/dpp/generator.py b/rl4co/envs/eda/dpp/generator.py new file mode 100644 index 00000000..d34b8e7c --- /dev/null +++ b/rl4co/envs/eda/dpp/generator.py @@ -0,0 +1,169 @@ +import os +import zipfile +from typing import Union, Callable + +import torch +import numpy as np + +from robust_downloader import download +from torch.distributions import Uniform +from tensordict.tensordict import TensorDict + +from rl4co.data.utils import load_npz_to_tensordict +from rl4co.utils.pylogger import get_pylogger +from rl4co.envs.common.utils import get_sampler, Generator + +log = get_pylogger(__name__) + + + +class DPPGenerator(Generator): + """Data generator for the Decap Placement Problem (DPP). + + Args: + min_loc: Minimum location value. Defaults to 0. + max_loc: Maximum location value. Defaults to 1. + num_keepout_min: Minimum number of keepout regions. Defaults to 1. + num_keepout_max: Maximum number of keepout regions. Defaults to 50. + max_decaps: Maximum number of decaps. Defaults to 20. + data_dir: Directory to store data. Defaults to "data/dpp/". + This can be downloaded from this [url](https://drive.google.com/uc?id=1IEuR2v8Le-mtHWHxwTAbTOPIkkQszI95). + chip_file: Name of the chip file. Defaults to "10x10_pkg_chip.npy". + decap_file: Name of the decap file. Defaults to "01nF_decap.npy". + freq_file: Name of the frequency file. Defaults to "freq_201.npy". + url: URL to download data from. Defaults to None. 
+ + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each customer + depot [batch_size, 2]: location of the depot + demand [batch_size, num_loc]: demand of each customer + capacity [batch_size]: capacity of the vehicle + """ + def __init__( + self, + min_loc: float = 0.0, + max_loc: float = 1.0, + num_keepout_min: int = 1, + num_keepout_max: int = 50, + max_decaps: int = 20, + data_dir: str = "data/dpp/", + chip_file: str = "10x10_pkg_chip.npy", + decap_file: str = "01nF_decap.npy", + freq_file: str = "freq_201.npy", + url: str = None, + **unused_kwargs + ): + self.min_loc = min_loc + self.max_loc = max_loc + self.num_keepout_min = num_keepout_min + self.num_keepout_max = num_keepout_max + self.max_decaps = max_decaps + self.data_dir = data_dir + + # DPP environment doen't have any other kwargs + if len(unused_kwargs) > 0: + log.error(f"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}") + + + # Download and load the data from online dataset + self.url = ( + "https://github.com/kaist-silab/devformer/raw/main/data/data.zip" + if url is None + else url + ) + self.backup_url = ( + "https://drive.google.com/uc?id=1IEuR2v8Le-mtHWHxwTAbTOPIkkQszI95" + ) + self._load_dpp_data(chip_file, decap_file, freq_file) + + # Check the validity of the keepout parameters + assert ( + num_keepout_min <= num_keepout_max + ), "num_keepout_min must be <= num_keepout_max" + assert ( + num_keepout_max <= self.size**2 + ), "num_keepout_max must be <= size * size (total number of locations)" + + def _generate(self, batch_size) -> TensorDict: + """ + Generate initial observations for the environment with locations, probe, and action mask + Action_mask eliminates the keepout regions and the probe location, and is updated to eliminate placed decaps + """ + m = n = self.size + # if int, convert to list and make it a batch for easier generation + batch_size = [batch_size] if isinstance(batch_size, int) else batch_size + batched = 
len(batch_size) > 0 + bs = [1] if not batched else batch_size + + # Create a list of locs on a grid + locs = torch.meshgrid( + torch.arange(m), torch.arange(n) + ) + locs = torch.stack(locs, dim=-1).reshape(-1, 2) + # normalize the locations by the number of rows and columns + locs = locs / torch.tensor([m, n], dtype=torch.float) + locs = locs[None].expand(*bs, -1, -1) + + # Create available mask + available = torch.ones((*bs, m * n), dtype=torch.bool) + + # Sample probe location from m*n + probe = torch.randint(m * n, size=(*bs, 1)) + available.scatter_(1, probe, False) + + # Sample keepout locations from m*n except probe + num_keepout = torch.randint( + self.num_keepout_min, + self.num_keepout_max, + size=(*bs, 1), + ) + keepouts = [torch.randperm(m * n)[:k] for k in num_keepout] + for i, (a, k) in enumerate(zip(available, keepouts)): + available[i] = a.scatter(0, k, False) + + return TensorDict( + { + "locs": locs if batched else locs.squeeze(0), + "probe": probe if batched else probe.squeeze(0), + "action_mask": available if batched else available.squeeze(0), + }, + batch_size=batch_size, + ) + + def _load_dpp_data(self, chip_file, decap_file, freq_file): + def _load_file(fpath): + f = os.path.join(self.data_dir, fpath) + if not os.path.isfile(f): + self._download_data() + with open(f, "rb") as f_: + return torch.from_numpy(np.load(f_)) + + self.raw_pdn = _load_file(chip_file) # [num_freq, size^2, size^2] + self.decap = _load_file(decap_file).to(torch.complex64) # [num_freq, 1, 1] + self.freq = _load_file(freq_file) # [num_freq] + self.size = int(np.sqrt(self.raw_pdn.shape[-1])) + self.num_freq = self.freq.shape[0] + + def _download_data(self): + log.info("Downloading data...") + try: + download(self.url, self.data_dir, "data.zip") + except Exception: + log.error( + f"Download from main url {self.url} failed. Trying backup url {self.backup_url}..." + ) + download(self.backup_url, self.data_dir, "data.zip") + log.info("Download complete. 
Unzipping...") + zipfile.ZipFile(os.path.join(self.data_dir, "data.zip"), "r").extractall( + self.data_dir + ) + log.info("Unzip complete. Removing zip file") + os.remove(os.path.join(self.data_dir, "data.zip")) + + def load_data(self, fpath, batch_size=[]): + data = load_npz_to_tensordict(fpath) + # rename key if necessary (old dpp version) + if "observation" in data.keys(): + data["locs"] = data.pop("observation") + return data diff --git a/rl4co/envs/eda/dpp/render.py b/rl4co/envs/eda/dpp/render.py new file mode 100644 index 00000000..fec5ecba --- /dev/null +++ b/rl4co/envs/eda/dpp/render.py @@ -0,0 +1,84 @@ +import torch +import numpy as np +import matplotlib.pyplot as plt + +from matplotlib import cm, colormaps + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(self, decaps, probe, action_mask, ax=None, legend=True): + """ + Plot a grid of 1x1 squares representing the environment. + The keepout regions are the action_mask - decaps - probe + """ + import matplotlib.pyplot as plt + + settings = { + 0: {"color": "white", "label": "available"}, + 1: {"color": "grey", "label": "keepout"}, + 2: {"color": "tab:red", "label": "probe"}, + 3: {"color": "tab:blue", "label": "decap"}, + } + + nonzero_indices = torch.nonzero(~action_mask, as_tuple=True)[0] + keepout = torch.cat([nonzero_indices, probe, decaps.squeeze(-1)]) + unique_elements, counts = torch.unique(keepout, return_counts=True) + keepout = unique_elements[counts == 1] + + if ax is None: + fig, ax = plt.subplots(1, 1, figsize=(6, 6)) + + grid = np.meshgrid(np.arange(0, self.size), np.arange(0, self.size)) + grid = np.stack(grid, axis=-1) + + # Add new dimension to grid filled up with 0s + grid = np.concatenate([grid, np.zeros((self.size, self.size, 1))], axis=-1) + + # Add keepout = 1 + grid[keepout // self.size, keepout % self.size, 2] = 1 + # Add probe = 2 + grid[probe // self.size, probe % self.size, 2] = 2 + # Add 
decaps = 3 + grid[decaps // self.size, decaps % self.size, 2] = 3 + + xdim, ydim = grid.shape[0], grid.shape[1] + ax.imshow(np.zeros((xdim, ydim)), cmap="gray") + + ax.set_xlim(0, xdim) + ax.set_ylim(0, ydim) + + for i in range(xdim): + for j in range(ydim): + color = settings[grid[i, j, 2]]["color"] + x, y = grid[i, j, 0], grid[i, j, 1] + ax.add_patch(plt.Rectangle((x, y), 1, 1, color=color, linestyle="-")) + + # Add grid with 1x1 squares + ax.grid( + which="major", axis="both", linestyle="-", color="k", linewidth=1, alpha=0.5 + ) + # set 10 ticks + ax.set_xticks(np.arange(0, xdim, 1)) + ax.set_yticks(np.arange(0, ydim, 1)) + + # Invert y axis + ax.invert_yaxis() + + # Add legend + if legend: + num_unique = 4 + handles = [ + plt.Rectangle((0, 0), 1, 1, color=settings[i]["color"]) + for i in range(num_unique) + ] + ax.legend( + handles, + [settings[i]["label"] for i in range(num_unique)], + ncol=num_unique, + loc="upper center", + bbox_to_anchor=(0.5, 1.1), + ) diff --git a/rl4co/envs/eda/mdpp/__init__.py b/rl4co/envs/eda/mdpp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/eda/mdpp/env.py b/rl4co/envs/eda/mdpp/env.py new file mode 100644 index 00000000..5c4400d8 --- /dev/null +++ b/rl4co/envs/eda/mdpp/env.py @@ -0,0 +1,154 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.eda.dpp.env import DPPEnv +from rl4co.utils.pylogger import get_pylogger + +from .generator import MDPPGenerator + +log = get_pylogger(__name__) + + +class MDPPEnv(DPPEnv): + """Multiple decap placement problem (mDPP) environment + This is a modified version of the DPP environment where we allow multiple probing ports + + Observations: + - locations of the probing ports and keepout regions + - current decap placement + - remaining decaps + + Constraints: + - decaps cannot be placed at the probing ports or keepout regions + - the number of 
decaps is limited + + Finish Condition: + - the number of decaps exceeds the limit + + Reward: + - the impedance suppression at the probing ports + + Args: + generator: DPPGenerator instance as the data generator + generator_params: parameters for the generator + reward_type: reward type, either minmax or meansum + - minmax: min of the max of the decap scores + - meansum: mean of the sum of the decap scores + + Note: + The minmax is more challenging as it requires to find the best decap location + for the worst case + """ + + name = "mdpp" + + def __init__( + self, + generator: MDPPGenerator = None, + generator_params: dict = {}, + reward_type: str = "minmax", + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = MDPPGenerator(**generator_params) + self.generator = generator + + assert reward_type in [ + "minmax", + "meansum", + ], "reward_type must be minmax or meansum" + self.reward_type = reward_type + + self._make_spec(self.generator) + + def _step(self, td: TensorDict) -> TensorDict: + # Step function is the same as DPPEnv, only masking changes + return super()._step(td) + + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + # Reset function is the same as DPPEnv, only masking changes due to probes + td_reset = super()._reset(td, batch_size=batch_size) + + # Action mask is 0 if both action_mask (e.g. 
keepout) and probe are 0 + action_mask = torch.logical_and(td_reset["action_mask"], ~td_reset["probe"]) + # Keepout regions are the inverse of action_mask + td_reset.update( + { + "keepout": ~td_reset["action_mask"], + "action_mask": action_mask, + } + ) + return td_reset + + def _make_spec(self, generator: MDPPGenerator): + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.size**2, 2), + dtype=torch.float32, + ), + probe=Unbounded( + shape=(1), + dtype=torch.int64, + ), + keepout=Unbounded( + shape=(generator.size**2), + dtype=torch.bool, + ), + i=Unbounded( + shape=(1), + dtype=torch.int64, + ), + action_mask=Unbounded( + shape=(generator.size**2), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.size**2, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + def _get_reward(self, td, actions): + """We call the reward function with the final sequence of actions to get the reward + Calling per-step would be very time consuming due to decap simulation + """ + # We do the operation in a batch + if len(td.batch_size) == 0: + td = td.unsqueeze(0) + actions = actions.unsqueeze(0) + + # Reward calculation is expensive since we need to run decap simulation (not vectorizable) + reward = torch.stack( + [ + self._single_env_reward(td_single, action) + for td_single, action in zip(td, actions) + ] + ) + return reward + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor): + assert True, "Not implemented" + + def _single_env_reward(self, td, actions): + """Get reward for single environment. 
We""" + + list_probe = torch.nonzero(td["probe"]).squeeze() + scores = torch.zeros_like(list_probe, dtype=torch.float32) + for i, probe in enumerate(list_probe): + # Get the decap scores for the probe location + scores[i] = self._decap_simulator(probe, actions) + # If minmax, return min of max decap scores else mean + return scores.min() if self.reward_type == "minmax" else scores.mean() diff --git a/rl4co/envs/eda/mdpp/generator.py b/rl4co/envs/eda/mdpp/generator.py new file mode 100644 index 00000000..75767150 --- /dev/null +++ b/rl4co/envs/eda/mdpp/generator.py @@ -0,0 +1,178 @@ +import os +import zipfile +from typing import Union, Callable + +import torch +import numpy as np + +from robust_downloader import download +from torch.distributions import Uniform +from tensordict.tensordict import TensorDict + +from rl4co.data.utils import load_npz_to_tensordict +from rl4co.utils.pylogger import get_pylogger +from rl4co.envs.common.utils import get_sampler, Generator + +log = get_pylogger(__name__) + + +class MDPPGenerator(Generator): + """Data generator for the Multi Decap Placement Problem (MDPP). + + Args: + min_loc: Minimum location value. Defaults to 0. + max_loc: Maximum location value. Defaults to 1. + num_keepout_min: Minimum number of keepout regions. Defaults to 1. + num_keepout_max: Maximum number of keepout regions. Defaults to 50. + max_decaps: Maximum number of decaps. Defaults to 20. + data_dir: Directory to store data. Defaults to "data/dpp/". + This can be downloaded from this [url](https://drive.google.com/uc?id=1IEuR2v8Le-mtHWHxwTAbTOPIkkQszI95). + chip_file: Name of the chip file. Defaults to "10x10_pkg_chip.npy". + decap_file: Name of the decap file. Defaults to "01nF_decap.npy". + freq_file: Name of the frequency file. Defaults to "freq_201.npy". + url: URL to download data from. Defaults to None. 
+ + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each customer + depot [batch_size, 2]: location of the depot + demand [batch_size, num_loc]: demand of each customer + capacity [batch_size]: capacity of the vehicle + """ + def __init__( + self, + min_loc: float = 0.0, + max_loc: float = 1.0, + num_keepout_min: int = 1, + num_keepout_max: int = 50, + num_probes_min: int = 2, + num_probes_max: int = 5, + max_decaps: int = 20, + data_dir: str = "data/dpp/", + chip_file: str = "10x10_pkg_chip.npy", + decap_file: str = "01nF_decap.npy", + freq_file: str = "freq_201.npy", + url: str = None, + **unused_kwargs + ): + self.min_loc = min_loc + self.max_loc = max_loc + self.num_keepout_min = num_keepout_min + self.num_keepout_max = num_keepout_max + self.num_probes_min = num_probes_min + self.num_probes_max = num_probes_max + self.max_decaps = max_decaps + self.data_dir = data_dir + + # DPP environment doen't have any other kwargs + if len(unused_kwargs) > 0: + log.error(f"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}") + + + # Download and load the data from online dataset + self.url = ( + "https://github.com/kaist-silab/devformer/raw/main/data/data.zip" + if url is None + else url + ) + self.backup_url = ( + "https://drive.google.com/uc?id=1IEuR2v8Le-mtHWHxwTAbTOPIkkQszI95" + ) + self._load_dpp_data(chip_file, decap_file, freq_file) + + # Check the validity of the keepout parameters + assert ( + num_keepout_min <= num_keepout_max + ), "num_keepout_min must be <= num_keepout_max" + assert ( + num_keepout_max <= self.size**2 + ), "num_keepout_max must be <= size * size (total number of locations)" + + def _generate(self, batch_size) -> TensorDict: + m = n = self.size + # if int, convert to list and make it a batch for easier generation + batch_size = [batch_size] if isinstance(batch_size, int) else batch_size + batched = len(batch_size) > 0 + bs = [1] if not batched else batch_size + + # Create a list of locs on a 
grid + locs = torch.meshgrid(torch.arange(m), torch.arange(n)) + locs = torch.stack(locs, dim=-1).reshape(-1, 2) + # normalize the locations by the number of rows and columns + locs = locs / torch.tensor([m, n], dtype=torch.float) + locs = locs[None].expand(*bs, -1, -1) + + # Create available mask + available = torch.ones((*bs, m * n), dtype=torch.bool) + + # Sample probe location from m*n + probe = torch.randint(m * n, size=(*bs, 1)) + available.scatter_(1, probe, False) + + # Sample probe locatins + num_probe = torch.randint( + self.num_probes_min, + self.num_probes_max, + size=(*bs, 1), + ) + probe = [torch.randperm(m * n)[:p] for p in num_probe] + probes = torch.zeros((*bs, m * n), dtype=torch.bool) + for i, (a, p) in enumerate(zip(available, probe)): + available[i] = a.scatter(0, p, False) + probes[i] = probes[i].scatter(0, p, True) + + # Sample keepout locations from m*n except probe + num_keepout = torch.randint( + self.num_keepout_min, + self.num_keepout_max, + size=(*bs, 1), + ) + keepouts = [torch.randperm(m * n)[:k] for k in num_keepout] + for i, (a, k) in enumerate(zip(available, keepouts)): + available[i] = a.scatter(0, k, False) + + return TensorDict( + { + "locs": locs if batched else locs.squeeze(0), + "probe": probes if batched else probes.squeeze(0), + "action_mask": available if batched else available.squeeze(0), + }, + batch_size=batch_size, + ) + + def _load_dpp_data(self, chip_file, decap_file, freq_file): + def _load_file(fpath): + f = os.path.join(self.data_dir, fpath) + if not os.path.isfile(f): + self._download_data() + with open(f, "rb") as f_: + return torch.from_numpy(np.load(f_)) + + self.raw_pdn = _load_file(chip_file) # [num_freq, size^2, size^2] + self.decap = _load_file(decap_file).to(torch.complex64) # [num_freq, 1, 1] + self.freq = _load_file(freq_file) # [num_freq] + self.size = int(np.sqrt(self.raw_pdn.shape[-1])) + self.num_freq = self.freq.shape[0] + + def _download_data(self): + log.info("Downloading data...") + try: + 
download(self.url, self.data_dir, "data.zip") + except Exception: + log.error( + f"Download from main url {self.url} failed. Trying backup url {self.backup_url}..." + ) + download(self.backup_url, self.data_dir, "data.zip") + log.info("Download complete. Unzipping...") + zipfile.ZipFile(os.path.join(self.data_dir, "data.zip"), "r").extractall( + self.data_dir + ) + log.info("Unzip complete. Removing zip file") + os.remove(os.path.join(self.data_dir, "data.zip")) + + def load_data(self, fpath, batch_size=[]): + data = load_npz_to_tensordict(fpath) + # rename key if necessary (old dpp version) + if "observation" in data.keys(): + data["locs"] = data.pop("observation") + return data diff --git a/rl4co/envs/eda/mdpp/render.py b/rl4co/envs/eda/mdpp/render.py new file mode 100644 index 00000000..fbd4cd00 --- /dev/null +++ b/rl4co/envs/eda/mdpp/render.py @@ -0,0 +1,161 @@ +import torch +import numpy as np +import matplotlib.pyplot as plt + +from matplotlib import cm, colormaps + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(self, td, actions=None, ax=None, legend=True, settings=None): + """Plot a grid of squares representing the environment. 
+ The keepout regions are the action_mask - decaps - probe + """ + + import matplotlib.pyplot as plt + + from matplotlib.lines import Line2D + from matplotlib.patches import Annulus, Rectangle, RegularPolygon + + if settings is None: + settings = { + "available": {"color": "white", "label": "available"}, + "keepout": {"color": "grey", "label": "keepout"}, + "probe": {"color": "tab:red", "label": "probe"}, + "decap": {"color": "tab:blue", "label": "decap"}, + } + + def draw_capacitor(ax, x, y, color="black"): + # Backgrund rectangle: same as color but with alpha=0.5 + ax.add_patch(Rectangle((x, y), 1, 1, color=color, alpha=0.5)) + + # Create the plates of the capacitor + plate_width, plate_height = ( + 0.3, + 0.1, + ) # Width and height switched to make vertical + plate_gap = 0.2 + plate1 = Rectangle( + (x + 0.5 - plate_width / 2, y + 0.5 - plate_height - plate_gap / 2), + plate_width, + plate_height, + color=color, + ) + plate2 = Rectangle( + (x + 0.5 - plate_width / 2, y + 0.5 + plate_gap / 2), + plate_width, + plate_height, + color=color, + ) + + # Add the plates to the axes + ax.add_patch(plate1) + ax.add_patch(plate2) + + # Add connection lines (wires) + line_length = 0.2 + line1 = Line2D( + [x + 0.5, x + 0.5], + [ + y + 0.5 - plate_height - plate_gap / 2 - line_length, + y + 0.5 - plate_height - plate_gap / 2, + ], + color=color, + ) + line2 = Line2D( + [x + 0.5, x + 0.5], + [ + y + 0.5 + plate_height + plate_gap / 2, + y + 0.5 + plate_height + plate_gap / 2 + line_length, + ], + color=color, + ) + + # Add the lines to the axes + ax.add_line(line1) + ax.add_line(line2) + + def draw_probe(ax, x, y, color="black"): + # Backgrund rectangle: same as color but with alpha=0.5 + ax.add_patch(Rectangle((x, y), 1, 1, color=color, alpha=0.5)) + ax.add_patch(Annulus((x + 0.5, y + 0.5), (0.2, 0.2), 0.1, color=color)) + + def draw_keepout(ax, x, y, color="black"): + # Backgrund rectangle: same as color but with alpha=0.5 + ax.add_patch(Rectangle((x, y), 1, 1, color=color, 
alpha=0.5)) + ax.add_patch( + RegularPolygon( + (x + 0.5, y + 0.5), numVertices=6, radius=0.45, color=color + ) + ) + + size = self.size + td = td.detach().cpu() + # if batch_size greater than 0 , we need to select the first batch element + if td.batch_size != torch.Size([]): + td = td[0] + + if actions is None: + actions = td.get("action", None) + + # Transform actions from idx to one-hot + decaps = torch.zeros(size**2) + decaps.scatter_(0, actions, 1) + decaps = decaps.reshape(size, size) + + keepout = ~td["action_mask"].reshape(size, size) + probes = td["probe"].reshape(size, size) + + if ax is None: + _, ax = plt.subplots(1, 1, figsize=(6, 6)) + + grid = np.meshgrid(np.arange(0, size), np.arange(0, size)) + grid = np.stack(grid, axis=-1) + + xdim, ydim = grid.shape[0], grid.shape[1] + # ax.imshow(np.zeros((xdim, ydim)), cmap="gray") + + ax.set_xlim(0, xdim) + ax.set_ylim(0, ydim) + + for i in range(xdim): + for j in range(ydim): + x, y = grid[i, j, 0], grid[i, j, 1] + + if decaps[i, j] == 1: + draw_capacitor(ax, x, y, color=settings["decap"]["color"]) + elif probes[i, j] == 1: + draw_probe(ax, x, y, color=settings["probe"]["color"]) + elif keepout[i, j] == 1: + draw_keepout(ax, x, y, color=settings["keepout"]["color"]) + + ax.grid( + which="major", axis="both", linestyle="-", color="k", linewidth=1, alpha=0.5 + ) + # set 10 ticks + ax.set_xticks(np.arange(0, xdim, 1)) + ax.set_yticks(np.arange(0, ydim, 1)) + + # Invert y axis + ax.invert_yaxis() + + # # Add legend + if legend: + colors = [settings[k]["color"] for k in settings.keys()] + labels = [settings[k]["label"] for k in settings.keys()] + handles = [ + plt.Rectangle( + (0, 0), 1, 1, color=c, edgecolor="k", linestyle="-", linewidth=1 + ) + for c in colors + ] + ax.legend( + handles, + [label for label in labels], + ncol=len(colors), + loc="upper center", + bbox_to_anchor=(0.5, 1.1), + ) diff --git a/rl4co/envs/graph/__init__.py b/rl4co/envs/graph/__init__.py new file mode 100644 index 00000000..355a55c6 
--- /dev/null +++ b/rl4co/envs/graph/__init__.py @@ -0,0 +1,4 @@ +from rl4co.envs.graph.flp.env import FLPEnv +from rl4co.envs.graph.flp.generator import FLPGenerator +from rl4co.envs.graph.mcp.env import MCPEnv +from rl4co.envs.graph.mcp.generator import MCPGenerator diff --git a/rl4co/envs/graph/flp/__init__.py b/rl4co/envs/graph/flp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/graph/flp/env.py b/rl4co/envs/graph/flp/env.py new file mode 100644 index 00000000..aa73b3f9 --- /dev/null +++ b/rl4co/envs/graph/flp/env.py @@ -0,0 +1,169 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +from .generator import FLPGenerator + +log = get_pylogger(__name__) + + +class FLPEnv(RL4COEnvBase): + """Facility Location Problem (FLP) environment + At each step, the agent chooses a location. The reward is 0 unless enough number of locations are chosen. + The reward is (-) the total distance of each location to its closest chosen location. 
+ + Observations: + - the locations + - the number of locations to choose + + Constraints: + - the given number of locations must be chosen + + Finish condition: + - the given number of locations are chosen + + Reward: + - (minus) the total distance of each location to its closest chosen location + + Args: + generator: FLPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "flp" + + def __init__( + self, + generator: FLPGenerator = None, + generator_params: dict = {}, + check_solution=False, + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = FLPGenerator(**generator_params) + self.generator = generator + self.check_solution = check_solution + self._make_spec(self.generator) + + def _step(self, td: TensorDict) -> TensorDict: + # action: [batch_size, 1]; the location to be chosen in each instance + selected = td["action"] + batch_size = selected.shape[0] + + # Update location selection status + chosen = td["chosen"].clone() # (batch_size, n_locations) + n_points_ = chosen.shape[-1] + + chosen[torch.arange(batch_size).to(td.device), selected] = True + + # We are done if we choose enough locations + done = td["i"] >= (td["to_choose"] - 1) + + # The reward is calculated outside via get_reward for efficiency, so we set it to zero here + reward = torch.zeros_like(done) + + # Update distances + orig_distances = td["orig_distances"] # (batch_size, n_points, n_points) + + cur_min_dist = ( + gather_by_index( + orig_distances, chosen.nonzero(as_tuple=True)[1].view(batch_size, -1) + ) + .view(batch_size, -1, n_points_) + .min(dim=1) + .values + ) + + # We cannot choose the already-chosen locations + action_mask = ~chosen + + td.update( + { + "distances": cur_min_dist, # (batch_size, n_points) + # states changed by actions + "chosen": chosen, # each entry is binary; 1 iff the corresponding facility is chosen + "i": td["i"] + 1, # the number of sets we have chosen + "action_mask": action_mask, 
+ "reward": reward, + "done": done, + } + ) + return td + + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + self.to(td.device) + + return TensorDict( + { + # given information + "locs": td["locs"], # (batch_size, n_points, dim_loc) + "orig_distances": td[ + "orig_distances" + ], # (batch_size, n_points, n_points) + "distances": td["distances"], # (batch_size, n_points, n_points) + # states changed by actions + "chosen": torch.zeros( + *td["locs"].shape[:-1], dtype=torch.bool, device=td.device + ), # each entry is binary; 1 iff the corresponding facility is chosen + "to_choose": td["to_choose"], # the number of sets to choose + "i": torch.zeros( + *batch_size, dtype=torch.int64, device=td.device + ), # the number of sets we have chosen + "action_mask": torch.ones( + *td["locs"].shape[:-1], dtype=torch.bool, device=td.device + ), + }, + batch_size=batch_size, + ) + + def _make_spec(self, generator: FLPGenerator): + # TODO: make spec + pass + + def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor: + if self.check_solution: + self.check_solution_validity(td, actions) + + # The reward is (minus) the total distance from each location to the closest chosen location + chosen = td["chosen"] # (batch_size, n_points) + batch_size_ = td["chosen"].shape[0] + n_points_ = td["chosen"].shape[-1] + orig_distances = td["orig_distances"] + cur_min_dist = ( + gather_by_index( + orig_distances, chosen.nonzero(as_tuple=True)[1].view(batch_size_, -1) + ) + .view(batch_size_, -1, n_points_) + .min(1) + .values.sum(-1) + ) + return -cur_min_dist + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None: + # TODO: check solution validity + pass + + @staticmethod + def local_search(td: TensorDict, actions: torch.Tensor, **kwargs) -> torch.Tensor: + # TODO: local search + pass + + @staticmethod + def get_num_starts(td): + return td["action_mask"].shape[-1] + + @staticmethod + def 
select_start_nodes(td, num_starts): + num_loc = td["action_mask"].shape[-1] + return ( + torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0]) + % num_loc + ) diff --git a/rl4co/envs/graph/flp/generator.py b/rl4co/envs/graph/flp/generator.py new file mode 100644 index 00000000..adbc7de6 --- /dev/null +++ b/rl4co/envs/graph/flp/generator.py @@ -0,0 +1,74 @@ +import math + +from typing import Callable, Union + +import torch + +from tensordict.tensordict import TensorDict +from torch.distributions import Uniform + +from rl4co.envs.common.utils import Generator, get_sampler +from rl4co.utils.ops import get_distance_matrix +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class FLPGenerator(Generator): + """Data generator for the Facility Location Problem (FLP). + + Args: + num_loc: number of locations in the FLP + min_loc: minimum value for the location coordinates + max_loc: maximum value for the location coordinates + loc_distribution: distribution for the location coordinates + + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations + orig_distances [batch_size, num_loc, num_loc]: original distances between locations + distances [batch_size, num_loc]: the current minimum distance rom each location to the chosen locations + chosen [batch_size, num_loc]: indicators of chosen locations + to_choose [batch_size, 1]: number of locations to choose in the FLP + """ + + def __init__( + self, + num_loc: int = 100, + min_loc: float = 0.0, + max_loc: float = 1.0, + loc_distribution: Union[int, float, str, type, Callable] = Uniform, + to_choose: int = 10, + **kwargs, + ): + self.num_loc = num_loc + self.min_loc = min_loc + self.max_loc = max_loc + self.to_choose = to_choose + + # Location distribution + if kwargs.get("loc_sampler", None) is not None: + self.loc_sampler = kwargs["loc_sampler"] + else: + self.loc_sampler = get_sampler( + "loc", loc_distribution, min_loc, max_loc, **kwargs + 
) + + def _generate(self, batch_size) -> TensorDict: + # Sample locations + locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2)) + distances = get_distance_matrix(locs) + max_dist = math.sqrt(2) * (self.max_loc - self.min_loc) + + return TensorDict( + { + "locs": locs, + "orig_distances": distances, + "distances": torch.full( + (*batch_size, self.num_loc), max_dist, dtype=torch.float + ), + "chosen": torch.zeros(*batch_size, self.num_loc, dtype=torch.bool), + "to_choose": torch.ones(*batch_size, dtype=torch.long) * self.to_choose, + }, + batch_size=batch_size, + ) diff --git a/rl4co/envs/graph/mcp/__init__.py b/rl4co/envs/graph/mcp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/graph/mcp/env.py b/rl4co/envs/graph/mcp/env.py new file mode 100644 index 00000000..3f0275e0 --- /dev/null +++ b/rl4co/envs/graph/mcp/env.py @@ -0,0 +1,193 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.utils.pylogger import get_pylogger + +from .generator import MCPGenerator + +log = get_pylogger(__name__) + + +class MCPEnv(RL4COEnvBase): + """Maximum Coverage Problem (MCP) environment + At each step, the agent chooses a set. The reward is 0 unless enough number of sets are chosen. + The reward is the total weights of the covered items (i.e., items in any chosen set). 
+ + Observations: + - the weights of items + - the membership of items in sets + - the number of sets to choose + + Constraints: + - the given number of sets must be chosen + + Finish condition: + - the given number of sets are chosen + + Reward: + - the total weights of the covered items (i.e., items in any chosen set) + + Args: + generator: MCPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "mcp" + + def __init__( + self, + generator: MCPGenerator = None, + generator_params: dict = {}, + check_solution=False, + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = MCPGenerator(**generator_params) + self.generator = generator + self.check_solution = check_solution + self._make_spec(self.generator) + + def _step(self, td: TensorDict) -> TensorDict: + # action: [batch_size, 1]; the set to be chosen in each instance + batch_size = td["action"].shape[0] + selected = td["action"] + + # Update set selection status + chosen = td["chosen"].clone() # (batch_size, n_sets) + chosen[torch.arange(batch_size).to(td.device), selected] = True + + # We are done if we choose enough sets + done = td["i"] >= (td["n_sets_to_choose"] - 1) + + # The reward is calculated outside via get_reward for efficiency, so we set it to -inf here + reward = torch.ones_like(done) * float("-inf") + + remaining_sets = ~chosen # (batch_size, n_sets) + + chosen_membership = chosen.unsqueeze(-1) * td["membership"] + chosen_membership_nonzero = chosen_membership.nonzero() + remaining_membership = remaining_sets.unsqueeze(-1) * td["membership"] + + batch_indices, set_indices, item_indices = chosen_membership_nonzero.T + chosen_items_indices = chosen_membership[ + batch_indices, set_indices, item_indices + ].long() + + batch_size, n_items = td["weights"].shape + + # We have batch_indices and chosen_items_indices + # chosen_items: (batch_size, n_items) + # for each i, chosen_items[batch_size[i], chosen_items_indices[i]] += 
1 + chosen_items = torch.zeros(batch_size, n_items + 1, device=td.device) + chosen_items[batch_indices, chosen_items_indices] += 1 + chosen_items = chosen_items[:, 1:] # Remove the first column (invalid zeros) + + # chosen_item[i, j] > 0 means item j is chosen in batch i + covered_items = (chosen_items > 0).float() # (batch_size, n_items) + remaining_items = 1.0 - covered_items # (batch_size, n_items) + + # We cannot choose the already-chosen sets + action_mask = ~chosen + + td.update( + { + "membership": remaining_membership, # (batch_size, n_sets, max_size) + "weights": td["weights"] * remaining_items, # (batch_size, n_items) + "chosen": chosen, + "i": td["i"] + 1, + "action_mask": action_mask, + "reward": reward, + "done": done, + } + ) + return td + + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + self.to(td.device) + + return TensorDict( + { + # given information; constant for each given instance + "orig_membership": td["membership"], # (batch_size, n_sets, max_size) + "membership": td["membership"], # (batch_size, n_sets, max_size) + "orig_weights": td["weights"], # (batch_size, n_items) + "weights": td["weights"], # (batch_size, n_items) + "n_sets_to_choose": td["n_sets_to_choose"], # (batch_size, 1) + # states changed by actions + "chosen": torch.zeros( + *td["membership"].shape[:-1], dtype=torch.bool, device=td.device + ), # each entry is binary; 1 iff the corresponding set is chosen + "i": torch.zeros( + *batch_size, dtype=torch.int64, device=td.device + ), # the number of sets we have chosen + "action_mask": torch.ones( + *td["membership"].shape[:-1], dtype=torch.bool, device=td.device + ), + }, + batch_size=batch_size, + ) + + def _make_spec(self, generator: MCPGenerator): + # TODO: make spec + pass + + def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor: + if self.check_solution: + self.check_solution_validity(td, actions) + + membership = td[ + "orig_membership" + ] # (batch_size, n_sets, 
max_size); membership[i, j] = the items in set j in batch i (with 0 padding) + weights = td["orig_weights"] # (batch_size, n_items) + chosen_sets = td["chosen"] # (batch_size, n_set); 1 if chosen, 0 otherwise + + chosen_membership = chosen_sets.unsqueeze(-1) * membership + chosen_membership_nonzero = chosen_membership.nonzero() + + batch_indices, set_indices, item_indices = chosen_membership_nonzero.T + chosen_items_indices = chosen_membership[ + batch_indices, set_indices, item_indices + ].long() + + batch_size, n_items = weights.shape + + # We have batch_indices and chosen_items_indices + # chosen_items: (batch_size, n_items) + # For each i, chosen_items[batch_size[i], chosen_items_indices[i]] += 1 + chosen_items = torch.zeros(batch_size, n_items + 1, device=td.device) + chosen_items[batch_indices, chosen_items_indices] += 1 + chosen_items = chosen_items[:, 1:] # remove the first column + + # chosen_item[i, j] > 0 means item j is chosen in batch i + chosen_items = (chosen_items > 0).float() + # Compute the total weights of chosen items + chosen_weights = torch.sum(chosen_items * weights, dim=-1) + + return chosen_weights + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None: + # TODO: check solution validity + pass + + @staticmethod + def local_search(td: TensorDict, actions: torch.Tensor, **kwargs) -> torch.Tensor: + # TODO: local search + pass + + @staticmethod + def get_num_starts(td): + return td["action_mask"].shape[-1] + + @staticmethod + def select_start_nodes(td, num_starts): + num_sets = td["action_mask"].shape[-1] + return ( + torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0]) + % num_sets + ) diff --git a/rl4co/envs/graph/mcp/generator.py b/rl4co/envs/graph/mcp/generator.py new file mode 100644 index 00000000..99d5463f --- /dev/null +++ b/rl4co/envs/graph/mcp/generator.py @@ -0,0 +1,138 @@ +from typing import Callable, Union + +import torch + +from tensordict.tensordict import TensorDict 
+from torch.distributions import Uniform + +from rl4co.envs.common.utils import Generator, get_sampler +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def remove_repeat(x: torch.Tensor) -> torch.Tensor: + """ + Remove the repeated elements in each row (i.e., the last dimension) of the input tensor x, + and change the repeated elements to 0 + + Ref: https://stackoverflow.com/questions/62300404 + + Args: + x: input tensor + """ + + # sorting the rows so that duplicate values appear together + # e.g., first row: [1, 2, 3, 3, 3, 4, 4] + y, indices = x.sort(dim=-1) + + # subtracting, so duplicate values will become 0 + # e.g., first row: [1, 2, 3, 0, 0, 4, 0] + y[..., 1:] *= ((y[..., 1:] - y[..., :-1]) != 0).long() + + # retrieving the original indices of elements + indices = indices.sort(dim=-1)[1] + + # re-organizing the rows following original order + # e.g., first row: [1, 2, 3, 4, 0, 0, 0] + return torch.gather(y, -1, indices) + + +class MCPGenerator(Generator): + """Data generator for the Maximum Coverage Problem (MCP). 
+ + Args: + num_items: number of items in the MCP + num_sets: number of sets in the MCP + min_weight: minimum value for the item weights + max_weight: maximum value for the item weights + min_size: minimum size for the sets + max_size: maximum size for the sets + n_sets_to_choose: number of sets to choose in the MCP + + Returns: + A TensorDict with the following keys: + membership [batch_size, num_sets, max_size]: membership of items in sets + weights [batch_size, num_items]: weights of the items + n_sets_to_choose [batch_size, 1]: number of sets to choose in the MCP + """ + + def __init__( + self, + num_items: int = 200, + num_sets: int = 100, + min_weight: int = 1, + max_weight: int = 10, + min_size: int = 5, + max_size: int = 15, + n_sets_to_choose: int = 10, + size_distribution: Union[int, float, str, type, Callable] = Uniform, + weight_distribution: Union[int, float, str, type, Callable] = Uniform, + **kwargs, + ): + self.num_items = num_items + self.num_sets = num_sets + self.min_weight = min_weight + self.max_weight = max_weight + self.min_size = min_size + self.max_size = max_size + self.n_sets_to_choose = n_sets_to_choose + + # Set size distribution + if kwargs.get("size_sampler", None) is not None: + self.size_sampler = kwargs["size_sampler"] + else: + self.size_sampler = get_sampler( + "size", size_distribution, min_size, max_size + 1, **kwargs + ) + + # Item weight distribution + if kwargs.get("weight_sampler", None) is not None: + self.weight_sampler = kwargs["weight_sampler"] + else: + self.weight_sampler = get_sampler( + "weight", weight_distribution, min_weight, max_weight + 1, **kwargs + ) + + def _generate(self, batch_size) -> TensorDict: + try: + batch_size = batch_size[0] + except TypeError: + batch_size = batch_size + + # Sample item weights + weights_tensor = self.weight_sampler.sample((batch_size, self.num_items)) + weights_tensor = torch.floor(weights_tensor) + weights_tensor = torch.clamp(weights_tensor, self.min_weight, self.max_weight) + 
+ # Sample set sizes + set_sizes = self.size_sampler.sample((batch_size, self.num_sets)) + set_sizes = torch.floor(set_sizes).long() + set_sizes = torch.clamp(set_sizes, self.min_size, self.max_size) + max_size = set_sizes.max().item() + + # Create membership tensor + membership_tensor_max_size = torch.randint( + 1, self.num_items + 1, (batch_size, self.num_sets, max_size) + ) + + cutoffs_masks = torch.arange(self.max_size).view(1, 1, -1) < set_sizes.unsqueeze( + -1 + ) + # Take the masked elements, 0 means the item is invalid + membership_tensor = ( + membership_tensor_max_size * cutoffs_masks + ) # (batch_size, num_sets, max_size) + + # Remove repeated items in each set + membership_tensor = remove_repeat(membership_tensor) + + return TensorDict( + { + "membership": membership_tensor.float(), # (batch_size, num_sets, max_size) + "weights": weights_tensor.float(), # (batch_size, num_items) + "n_sets_to_choose": torch.ones(batch_size, 1) + * self.n_sets_to_choose, # (batch_size, 1) + }, + batch_size=batch_size, + ) diff --git a/rl4co/envs/routing/__init__.py b/rl4co/envs/routing/__init__.py new file mode 100644 index 00000000..7588b5f4 --- /dev/null +++ b/rl4co/envs/routing/__init__.py @@ -0,0 +1,24 @@ +from rl4co.envs.routing.atsp.env import ATSPEnv +from rl4co.envs.routing.atsp.generator import ATSPGenerator +from rl4co.envs.routing.cvrp.env import CVRPEnv +from rl4co.envs.routing.cvrp.generator import CVRPGenerator +from rl4co.envs.routing.cvrptw.env import CVRPTWEnv +from rl4co.envs.routing.cvrptw.generator import CVRPTWGenerator +from rl4co.envs.routing.mdcpdp.env import MDCPDPEnv +from rl4co.envs.routing.mdcpdp.generator import MDCPDPGenerator +from rl4co.envs.routing.mtsp.env import MTSPEnv +from rl4co.envs.routing.mtsp.generator import MTSPGenerator +from rl4co.envs.routing.mtvrp.env import MTVRPEnv +from rl4co.envs.routing.mtvrp.generator import MTVRPGenerator +from rl4co.envs.routing.op.env import OPEnv +from rl4co.envs.routing.op.generator import 
OPGenerator +from rl4co.envs.routing.pctsp.env import PCTSPEnv +from rl4co.envs.routing.pctsp.generator import PCTSPGenerator +from rl4co.envs.routing.pdp.env import PDPEnv, PDPRuinRepairEnv +from rl4co.envs.routing.pdp.generator import PDPGenerator +from rl4co.envs.routing.sdvrp.env import SDVRPEnv +from rl4co.envs.routing.spctsp.env import SPCTSPEnv +from rl4co.envs.routing.svrp.env import SVRPEnv +from rl4co.envs.routing.svrp.generator import SVRPGenerator +from rl4co.envs.routing.tsp.env import DenseRewardTSPEnv, TSPEnv, TSPkoptEnv +from rl4co.envs.routing.tsp.generator import TSPGenerator diff --git a/rl4co/envs/routing/atsp/__init__.py b/rl4co/envs/routing/atsp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/atsp/env.py b/rl4co/envs/routing/atsp/env.py new file mode 100644 index 00000000..ed944e50 --- /dev/null +++ b/rl4co/envs/routing/atsp/env.py @@ -0,0 +1,168 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.envs.common.utils import batch_to_scalar +from rl4co.utils.pylogger import get_pylogger + +from .generator import ATSPGenerator +from .render import render + +log = get_pylogger(__name__) + + +class ATSPEnv(RL4COEnvBase): + """Asymmetric Traveling Salesman Problem (ATSP) environment + At each step, the agent chooses a customer to visit. The reward is 0 unless the agent visits all the customers. + In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length. + Unlike the TSP, the distance matrix is asymmetric, i.e., the distance from A to B is not necessarily the same as the distance from B to A. 
+ + Observations: + - distance matrix between customers + - the current customer + - the first customer (for calculating the reward) + - the remaining unvisited customers + + Constraints: + - the tour starts and ends at the same customer. + - each customer must be visited exactly once. + + Finish Condition: + - the agent has visited all customers. + + Reward: + - (minus) the negative length of the path. + + Args: + generator: ATSPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "atsp" + + def __init__( + self, + generator: ATSPGenerator = None, + generator_params: dict = {}, + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = ATSPGenerator(**generator_params) + self.generator = generator + self._make_spec(self.generator) + + @staticmethod + def _step(td: TensorDict) -> TensorDict: + current_node = td["action"] + first_node = current_node if batch_to_scalar(td["i"]) == 0 else td["first_node"] + + # Set not visited to 0 (i.e., we visited the node) + available = td["action_mask"].scatter( + -1, current_node.unsqueeze(-1).expand_as(td["action_mask"]), 0 + ) + + # We are done there are no unvisited locations + done = torch.count_nonzero(available, dim=-1) <= 0 + + # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here + reward = torch.zeros_like(done) + + td.update( + { + "first_node": first_node, + "current_node": current_node, + "i": td["i"] + 1, + "action_mask": available, + "reward": reward, + "done": done, + }, + ) + return td + + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + # Initialize distance matrix + cost_matrix = td["cost_matrix"] + device = td.device + + # Other variables + current_node = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) + available = torch.ones( + (*batch_size, self.generator.num_loc), dtype=torch.bool, device=device + ) # 1 means not visited, i.e. 
action is allowed + i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) + + return TensorDict( + { + "cost_matrix": cost_matrix, + "first_node": current_node, + "current_node": current_node, + "i": i, + "action_mask": available, + }, + batch_size=batch_size, + ) + + def _make_spec(self, generator: ATSPGenerator): + self.observation_spec = Composite( + cost_matrix=Bounded( + low=generator.min_dist, + high=generator.max_dist, + shape=(generator.num_loc, generator.num_loc), + dtype=torch.float32, + ), + first_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + i=Unbounded( + shape=(1), + dtype=torch.int64, + ), + action_mask=Unbounded( + shape=(generator.num_loc), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.num_loc, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor: + distance_matrix = td["cost_matrix"] + + # Get indexes of tour edges + nodes_src = actions + nodes_tgt = torch.roll(actions, -1, dims=1) + batch_idx = torch.arange( + distance_matrix.shape[0], device=distance_matrix.device + ).unsqueeze(1) + # return negative tour length + return -distance_matrix[batch_idx, nodes_src, nodes_tgt].sum(-1) + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor): + assert ( + torch.arange(actions.size(1), out=actions.data.new()) + .view(1, -1) + .expand_as(actions) + == actions.data.sort(1)[0] + ).all(), "Invalid tour" + + @staticmethod + def render(td, actions=None, ax=None): + return render(td, actions, ax) diff --git a/rl4co/envs/routing/atsp/generator.py b/rl4co/envs/routing/atsp/generator.py new file mode 100644 index 00000000..31208005 --- /dev/null +++ b/rl4co/envs/routing/atsp/generator.py @@ -0,0 +1,66 @@ +from typing import Union, 
Callable + +import torch + +from torch.distributions import Uniform +from tensordict.tensordict import TensorDict + +from rl4co.utils.pylogger import get_pylogger +from rl4co.envs.common.utils import get_sampler, Generator + +log = get_pylogger(__name__) + + +class ATSPGenerator(Generator): + """Data generator for the Asymmetric Travelling Salesman Problem (ATSP) + Generate distance matrices inspired by the reference MatNet (Kwon et al., 2021) + We satifsy the triangle inequality (TMAT class) in a batch + + Args: + num_loc: number of locations (customers) in the TSP + min_dist: minimum value for the distance between nodes + max_dist: maximum value for the distance between nodes + dist_distribution: distribution for the distance between nodes + tmat_class: whether to generate a class of distance matrix + + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each customer + """ + def __init__( + self, + num_loc: int = 10, + min_dist: float = 0.0, + max_dist: float = 1.0, + dist_distribution: Union[ + int, float, str, type, Callable + ] = Uniform, + tmat_class: bool = True, + **kwargs + ): + self.num_loc = num_loc + self.min_dist = min_dist + self.max_dist = max_dist + self.tmat_class = tmat_class + + # Distance distribution + if kwargs.get("dist_sampler", None) is not None: + self.dist_sampler = kwargs["dist_sampler"] + else: + self.dist_sampler = get_sampler("dist", dist_distribution, 0.0, 1.0, **kwargs) + + def _generate(self, batch_size) -> TensorDict: + # Generate distance matrices inspired by the reference MatNet (Kwon et al., 2021) + # We satifsy the triangle inequality (TMAT class) in a batch + batch_size = [batch_size] if isinstance(batch_size, int) else batch_size + dms = ( + self.dist_sampler.sample((batch_size + [self.num_loc, self.num_loc])) + * (self.max_dist - self.min_dist) + + self.min_dist + ) + dms[..., torch.arange(self.num_loc), torch.arange(self.num_loc)] = 0 + log.info("Using TMAT class (triangle 
inequality): {}".format(self.tmat_class)) + if self.tmat_class: + for i in range(self.num_loc): + dms = torch.minimum(dms, dms[..., :, [i]] + dms[..., [i], :]) + return TensorDict({"cost_matrix": dms}, batch_size=batch_size) diff --git a/rl4co/envs/routing/atsp/render.py b/rl4co/envs/routing/atsp/render.py new file mode 100644 index 00000000..8ad0a903 --- /dev/null +++ b/rl4co/envs/routing/atsp/render.py @@ -0,0 +1,50 @@ +import torch +import numpy as np +import matplotlib.pyplot as plt + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(td, actions=None, ax=None): + if ax is None: + # Create a plot of the nodes + _, ax = plt.subplots() + + td = td.detach().cpu() + + if actions is None: + actions = td.get("action", None) + + # If batch_size greater than 0 , we need to select the first batch element + if td.batch_size != torch.Size([]): + td = td[0] + actions = actions[0] + + locs = td["locs"] + + # Gather locs in order of action if available + if actions is None: + log.warning("No action in TensorDict, rendering unsorted locs") + else: + actions = actions.detach().cpu() + locs = gather_by_index(locs, actions, dim=0) + + # Cat the first node to the end to complete the tour + locs = torch.cat((locs, locs[0:1])) + x, y = locs[:, 0], locs[:, 1] + + # Plot the visited nodes + ax.scatter(x, y, color="tab:blue") + + # Add arrows between visited nodes as a quiver plot + dx, dy = np.diff(x), np.diff(y) + ax.quiver( + x[:-1], y[:-1], dx, dy, scale_units="xy", angles="xy", scale=1, color="k" + ) + + # Setup limits and show + ax.set_xlim(-0.05, 1.05) + ax.set_ylim(-0.05, 1.05) diff --git a/rl4co/envs/routing/cvrp/__init__.py b/rl4co/envs/routing/cvrp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/cvrp/env.py b/rl4co/envs/routing/cvrp/env.py new file mode 100644 index 00000000..b01083f4 --- /dev/null +++ b/rl4co/envs/routing/cvrp/env.py @@ -0,0 
+1,265 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.data.utils import load_npz_to_tensordict +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.utils.ops import gather_by_index, get_tour_length +from rl4co.utils.pylogger import get_pylogger + +from .generator import CVRPGenerator + +try: + from .local_search import local_search +except Exception: + # In case some dependencies are not installed (e.g., pyvrp) + local_search = None +from .render import render + +log = get_pylogger(__name__) + + +class CVRPEnv(RL4COEnvBase): + """Capacitated Vehicle Routing Problem (CVRP) environment. + At each step, the agent chooses a customer to visit depending on the current location and the remaining capacity. + When the agent visits a customer, the remaining capacity is updated. If the remaining capacity is not enough to + visit any customer, the agent must go back to the depot. The reward is 0 unless the agent visits all the cities. + In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length. + + Observations: + - location of the depot. + - locations and demand of each customer. + - current location of the vehicle. + - the remaining customer of the vehicle, + + Constraints: + - the tour starts and ends at the depot. + - each customer must be visited exactly once. + - the vehicle cannot visit customers exceed the remaining capacity. + - the vehicle can return to the depot to refill the capacity. + + Finish Condition: + - the vehicle has visited all customers and returned to the depot. + + Reward: + - (minus) the negative length of the path. 
+ + Args: + generator: CVRPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "cvrp" + + def __init__( + self, + generator: CVRPGenerator = None, + generator_params: dict = {}, + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = CVRPGenerator(**generator_params) + self.generator = generator + self._make_spec(self.generator) + + def _step(self, td: TensorDict) -> TensorDict: + current_node = td["action"][:, None] # Add dimension for step + n_loc = td["demand"].size(-1) # Excludes depot + + # Not selected_demand is demand of first node (by clamp) so incorrect for nodes that visit depot! + selected_demand = gather_by_index( + td["demand"], torch.clamp(current_node - 1, 0, n_loc - 1), squeeze=False + ) + + # Increase capacity if depot is not visited, otherwise set to 0 + used_capacity = (td["used_capacity"] + selected_demand) * ( + current_node != 0 + ).float() + + # Note: here we do not subtract one as we have to scatter so the first column allows scattering depot + # Add one dimension since we write a single value + visited = td["visited"].scatter(-1, current_node, 1) + + # SECTION: get done + done = visited.sum(-1) == visited.size(-1) + reward = torch.zeros_like(done) + + td.update( + { + "current_node": current_node, + "used_capacity": used_capacity, + "visited": visited, + "reward": reward, + "done": done, + } + ) + td.set("action_mask", self.get_action_mask(td)) + return td + + def _reset( + self, + td: Optional[TensorDict] = None, + batch_size: Optional[list] = None, + ) -> TensorDict: + device = td.device + + # Create reset TensorDict + td_reset = TensorDict( + { + "locs": torch.cat((td["depot"][:, None, :], td["locs"]), -2), + "demand": td["demand"], + "current_node": torch.zeros( + *batch_size, 1, dtype=torch.long, device=device + ), + "used_capacity": torch.zeros((*batch_size, 1), device=device), + "vehicle_capacity": torch.full( + (*batch_size, 1), 
self.generator.vehicle_capacity, device=device + ), + "visited": torch.zeros( + (*batch_size, td["locs"].shape[-2] + 1), + dtype=torch.uint8, + device=device, + ), + }, + batch_size=batch_size, + ) + td_reset.set("action_mask", self.get_action_mask(td_reset)) + return td_reset + + @staticmethod + def get_action_mask(td: TensorDict) -> torch.Tensor: + # For demand steps_dim is inserted by indexing with id, for used_capacity insert node dim for broadcasting + exceeds_cap = td["demand"] + td["used_capacity"] > td["vehicle_capacity"] + + # Nodes that cannot be visited are already visited or too much demand to be served now + mask_loc = td["visited"][..., 1:].to(exceeds_cap.dtype) | exceeds_cap + + # Cannot visit the depot if just visited and still unserved nodes + mask_depot = (td["current_node"] == 0) & ((mask_loc == 0).int().sum(-1) > 0)[ + :, None + ] + return ~torch.cat((mask_depot, mask_loc), -1) + + def _get_reward(self, td: TensorDict, actions: TensorDict) -> TensorDict: + # Gather locations in order of tour (add depot since we start and end there) + locs_ordered = torch.cat( + [ + td["locs"][..., 0:1, :], # depot + gather_by_index(td["locs"], actions), # order locations + ], + dim=1, + ) + return -get_tour_length(locs_ordered) + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor): + """Check that solution is valid: nodes are not visited twice except depot and capacity is not exceeded""" + # Check if tour is valid, i.e. 
contain 0 to n-1 + batch_size, graph_size = td["demand"].size() + sorted_pi = actions.data.sort(1)[0] + + # Sorting it should give all zeros at front and then 1...n + assert ( + torch.arange(1, graph_size + 1, out=sorted_pi.data.new()) + .view(1, -1) + .expand(batch_size, graph_size) + == sorted_pi[:, -graph_size:] + ).all() and (sorted_pi[:, :-graph_size] == 0).all(), "Invalid tour" + + # Visiting depot resets capacity so we add demand = -capacity (we make sure it does not become negative) + demand_with_depot = torch.cat((-td["vehicle_capacity"], td["demand"]), 1) + d = demand_with_depot.gather(1, actions) + + used_cap = torch.zeros_like(td["demand"][:, 0]) + for i in range(actions.size(1)): + used_cap += d[ + :, i + ] # This will reset/make capacity negative if i == 0, e.g. depot visited + # Cannot use less than 0 + used_cap[used_cap < 0] = 0 + assert ( + used_cap <= td["vehicle_capacity"] + 1e-5 + ).all(), "Used more than capacity" + + @staticmethod + def load_data(fpath, batch_size=[]): + """Dataset loading from file + Normalize demand by capacity to be in [0, 1] + """ + td_load = load_npz_to_tensordict(fpath) + td_load.set("demand", td_load["demand"] / td_load["capacity"][:, None]) + return td_load + + def _make_spec(self, generator: CVRPGenerator): + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.num_loc + 1, 2), + dtype=torch.float32, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + demand=Bounded( + low=-generator.capacity, + high=generator.max_demand, + shape=(generator.num_loc + 1, 1), + dtype=torch.float32, + ), + action_mask=Unbounded( + shape=(generator.num_loc + 1, 1), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.num_loc + 1, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + def replace_selected_actions( + self, 
class CVRPGenerator(Generator):
    """Data generator for the Capacitated Vehicle Routing Problem (CVRP).

    Args:
        num_loc: number of locations (cities) in the VRP, without the depot. (e.g. 10 means 10 locs + 1 depot)
        min_loc: minimum value for the location coordinates
        max_loc: maximum value for the location coordinates
        loc_distribution: distribution for the location coordinates
        depot_distribution: distribution for the depot location. If None, sample the depot from the locations
        min_demand: minimum value for the demand of each customer
        max_demand: maximum value for the demand of each customer
        demand_distribution: distribution for the demand of each customer
        vehicle_capacity: stored on the generator as `vehicle_capacity`; it is not used
            when sampling instances in this class
        capacity: capacity of the vehicle, used to normalize the demands. If None, it is
            looked up in `CAPACITIES` by `num_loc`, falling back to the entry whose key is
            closest to `num_loc`
        **kwargs: may carry ready-made `loc_sampler`, `depot_sampler` or `demand_sampler`
            objects, which take precedence over the corresponding distribution arguments;
            the remaining entries are forwarded to `get_sampler`

    Returns:
        A TensorDict with the following keys:
            locs [batch_size, num_loc, 2]: locations of each customer
            depot [batch_size, 2]: location of the depot
            demand [batch_size, num_loc]: demand of each customer, divided by `capacity`
            capacity [batch_size, 1]: capacity of the vehicle
    """

    def __init__(
        self,
        num_loc: int = 20,
        min_loc: float = 0.0,
        max_loc: float = 1.0,
        loc_distribution: Union[int, float, str, type, Callable] = Uniform,
        depot_distribution: Union[int, float, str, type, Callable] = None,
        min_demand: int = 1,
        max_demand: int = 10,
        demand_distribution: Union[int, float, type, Callable] = Uniform,
        vehicle_capacity: float = 1.0,
        capacity: float = None,
        **kwargs,
    ):
        self.num_loc = num_loc
        self.min_loc = min_loc
        self.max_loc = max_loc
        self.min_demand = min_demand
        self.max_demand = max_demand
        self.vehicle_capacity = vehicle_capacity

        # Location distribution
        if kwargs.get("loc_sampler", None) is not None:
            self.loc_sampler = kwargs["loc_sampler"]
        else:
            self.loc_sampler = get_sampler(
                "loc", loc_distribution, min_loc, max_loc, **kwargs
            )

        # Depot distribution (None means: take the depot from the sampled locations)
        if kwargs.get("depot_sampler", None) is not None:
            self.depot_sampler = kwargs["depot_sampler"]
        elif depot_distribution is not None:
            self.depot_sampler = get_sampler(
                "depot", depot_distribution, min_loc, max_loc, **kwargs
            )
        else:
            self.depot_sampler = None

        # Demand distribution
        # The sampler range is shifted down by one; `_generate` truncates to int and adds
        # one back, which yields integer demands.
        if kwargs.get("demand_sampler", None) is not None:
            self.demand_sampler = kwargs["demand_sampler"]
        else:
            self.demand_sampler = get_sampler(
                "demand", demand_distribution, min_demand - 1, max_demand - 1, **kwargs
            )

        # Capacity
        if capacity is None:
            # If not provided, use the default capacity from Kool et al. 2019
            capacity = CAPACITIES.get(num_loc, None)
        if capacity is None:
            # If not in the table keys, find the closest number of nodes as the key
            closest_num_loc = min(CAPACITIES.keys(), key=lambda x: abs(x - num_loc))
            capacity = CAPACITIES[closest_num_loc]
            log.warning(
                f"The capacity for {num_loc} locations is not defined. "
                f"Using the closest capacity: {capacity} with {closest_num_loc} locations."
            )
        self.capacity = capacity

    def _generate(self, batch_size) -> TensorDict:
        """Sample one batch of CVRP instances.

        Args:
            batch_size: iterable of batch dimensions (it is unpacked into the sample shapes)

        Returns:
            TensorDict with `locs`, `depot`, `demand` (divided by the capacity) and `capacity`.
        """
        # Sample locations: depot and customers
        if self.depot_sampler is not None:
            depot = self.depot_sampler.sample((*batch_size, 2))
            locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2))
        else:
            # if depot_sampler is None, sample the depot from the locations
            locs = self.loc_sampler.sample((*batch_size, self.num_loc + 1, 2))
            depot = locs[..., 0, :]
            locs = locs[..., 1:, :]

        # Sample demands: truncate to integers and undo the -1 shift of the sampler range
        demand = self.demand_sampler.sample((*batch_size, self.num_loc))
        demand = (demand.int() + 1).float()

        # Capacity is constant across the batch
        capacity = torch.full((*batch_size, 1), self.capacity)

        return TensorDict(
            {
                "locs": locs,
                "depot": depot,
                "demand": demand / self.capacity,
                "capacity": capacity,
            },
            batch_size=batch_size,
        )
def local_search(
    td: TensorDict,
    actions: torch.Tensor,
    max_trials: int = 10,
    neighbourhood_params: Union[dict, None] = None,
    load_penalty: float = 0.2,
    allow_infeasible_solution: bool = False,
    seed: int = 0,
    num_workers: int = 1,
):
    """
    Improve the solution using local search for CVRP, based on PyVRP.

    Args:
        td: TensorDict, td from env with shape [batch_size,]
        actions: torch.Tensor, Tour indices with shape [batch_size, max_seq_len]
        max_trials: int, maximum number of trials for local search
            (forced to 1 when `allow_infeasible_solution` is True)
        neighbourhood_params: dict, parameters for neighbourhood search
        load_penalty: float, penalty for exceeding the vehicle capacity
        allow_infeasible_solution: bool, whether to allow infeasible solutions
        seed: int, random seed for local search
        num_workers: int, number of workers for parallel processing
    Returns:
        torch.Tensor, Improved tour indices on `td.device`, zero-padded to the longest
        improved tour in the batch (with the trailing depot visit removed)
    """

    # Convert tensors to numpy arrays
    # Note: to avoid the overhead of device transfer, we recommend to pass the tensors in cpu
    actions_np = actions.detach().cpu().numpy()
    positions_np = td["locs"].detach().cpu().numpy()  # [batch_size, num_loc + 1, 2]
    demands_np = td["demand"].detach().cpu().numpy()  # [batch_size, num_loc]
    demands_np = np.pad(demands_np, ((0, 0), (1, 0)), mode="constant")  # Add depot demand
    distances = td.get("distances", None)  # [batch_size, num_loc + 1, num_loc + 1]
    if distances is None:
        distances = get_distance_matrix(td["locs"])
    # Same detach/cpu treatment as the other tensors: `.numpy()` alone raises for tensors
    # that live on an accelerator or require grad.
    distances_np = distances.detach().cpu().numpy()

    # A single run is enough when infeasible results are acceptable
    max_trials = 1 if allow_infeasible_solution else max_trials

    partial_func = partial(
        local_search_single,
        neighbourhood_params=neighbourhood_params,
        load_penalty=load_penalty,
        allow_infeasible_solution=allow_infeasible_solution,
        max_trials=max_trials,
        seed=seed,
    )

    instances = zip(actions_np, positions_np, demands_np, distances_np)
    if num_workers > 1:
        with Pool(processes=num_workers) as pool:
            new_actions = pool.starmap(partial_func, instances)
    else:
        new_actions = [partial_func(*args) for args in instances]

    # padding with zero so that all tours in the batch have the same length
    lengths = [len(act) for act in new_actions]
    max_length = max(lengths)
    new_actions = np.array(
        [
            np.pad(act, (0, max_length - length), mode="constant")
            for act, length in zip(new_actions, lengths)
        ]
    )
    # We can remove the last zero
    return torch.from_numpy(new_actions[:, :-1].astype(np.int64)).to(td.device)
def perform_local_search(
    ls_operator: LocalSearch,
    solution: Solution,
    load_penalty: int,
    remaining_trials: int = 5,
) -> Tuple[Solution, bool]:
    """Run the local search, escalating the load penalty until the result is feasible.

    Each trial starts again from `solution` with a fresh `CostEvaluator`. If the improved
    solution is infeasible and trials remain, the load penalty is multiplied by 10 and the
    search is repeated.

    Args:
        ls_operator: callable local-search operator, invoked as `ls_operator(solution, cost_evaluator)`
        solution: the starting solution, reused unchanged for every trial
        load_penalty: initial penalty for exceeding the vehicle capacity
        remaining_trials: maximum number of local-search runs

    Returns:
        Tuple of the solution from the last run and a flag telling whether that solution
        is feasible. The flag is False when all trials were used without finding a
        feasible solution.
    """
    while True:
        cost_evaluator = CostEvaluator(
            load_penalty=load_penalty, tw_penalty=0, dist_penalty=0
        )
        improved_solution = ls_operator(solution, cost_evaluator)
        remaining_trials -= 1

        # Evaluate feasibility on its own: binding it together with the trial counter
        # (`x := a or b`) would report an infeasible last attempt as feasible.
        is_feasible = improved_solution.is_feasible()
        if is_feasible or remaining_trials <= 0:
            return improved_solution, is_feasible

        # If infeasible, run the local search again with a higher penalty
        load_penalty *= 10
facecolors="none", + s=50, + linewidths=2, + marker="o", + alpha=1, + ) + + # plot demand bars + for node_idx in range(1, len(locs)): + ax.add_patch( + plt.Rectangle( + (locs[node_idx, 0] - 0.005, locs[node_idx, 1] + 0.015), + 0.01, + demands[node_idx - 1] / (scale_demand * 10), + edgecolor=cm.Set2(0), + facecolor=cm.Set2(0), + fill=True, + ) + ) + + # text demand + for node_idx in range(1, len(locs)): + demand_text = ( + f"{demands[node_idx-1].int().item()}" + if integer_demands + else f"{demands[node_idx-1].item():.2f}" + ) + ax.text( + locs[node_idx, 0], + locs[node_idx, 1] - 0.025, + f"{demand_text}", + horizontalalignment="center", + verticalalignment="top", + fontsize=10, + color=cm.Set2(0), + ) + + # text depot + ax.text( + locs[0, 0], + locs[0, 1] - 0.025, + "Depot", + horizontalalignment="center", + verticalalignment="top", + fontsize=10, + color=cm.Set2(2), + ) + + # plot actions + color_idx = 0 + for action_idx in range(len(actions) - 1): + if actions[action_idx] == 0: + color_idx += 1 + from_loc = locs[actions[action_idx]] + to_loc = locs[actions[action_idx + 1]] + if skip_depot and (actions[action_idx] == 0 or actions[action_idx + 1] == 0): + continue + ax.plot( + [from_loc[0], to_loc[0]], + [from_loc[1], to_loc[1]], + color=out(color_idx), + lw=1, + ) + ax.annotate( + "", + xy=(to_loc[0], to_loc[1]), + xytext=(from_loc[0], from_loc[1]), + arrowprops=dict(arrowstyle="-|>", color=out(color_idx)), + size=15, + annotation_clip=False, + ) + + ax.set_xlim(-0.05, 1.05) + ax.set_ylim(-0.05, 1.05) diff --git a/rl4co/envs/routing/cvrptw/__init__.py b/rl4co/envs/routing/cvrptw/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/cvrptw/env.py b/rl4co/envs/routing/cvrptw/env.py new file mode 100644 index 00000000..a6a4ea49 --- /dev/null +++ b/rl4co/envs/routing/cvrptw/env.py @@ -0,0 +1,287 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, 
class CVRPTWEnv(CVRPEnv):
    """Capacitated Vehicle Routing Problem with Time Windows (CVRPTW) environment.
    Inherits from the CVRPEnv class in which customers are considered.
    Additionally considers time windows within which a service has to be started.

    Observations:
        - location of the depot.
        - locations and demand of each customer.
        - current location of the vehicle.
        - the remaining capacity of the vehicle.
        - the current time.
        - service durations of each location.
        - time windows of each location.

    Constraints:
        - the tour starts and ends at the depot.
        - each customer must be visited exactly once.
        - the vehicle cannot visit customers whose demand exceeds the remaining capacity.
        - the vehicle can return to the depot to refill its capacity.
        - the vehicle must start the service within the time window of each location.

    Finish Condition:
        - the vehicle has visited all customers and returned to the depot.

    Reward:
        - the negative length of the path.

    Args:
        generator: CVRPTWGenerator instance as the data generator
        generator_params: parameters for the generator
    """

    name = "cvrptw"

    def __init__(
        self,
        generator: CVRPTWGenerator = None,
        generator_params: dict = {},
        **kwargs,
    ):
        # `generator_params` is only unpacked below, never mutated.
        super().__init__(**kwargs)
        if generator is None:
            generator = CVRPTWGenerator(**generator_params)
        self.generator = generator
        self._make_spec(self.generator)

    def _make_spec(self, generator: CVRPTWGenerator):
        """Build the specs; CVRPGenerator instances are delegated to the parent class."""
        if isinstance(generator, CVRPGenerator):
            super()._make_spec(generator)
        else:
            current_time = Unbounded(shape=(1), dtype=torch.float32, device=self.device)
            current_loc = Unbounded(shape=(2), dtype=torch.float32, device=self.device)
            durations = Bounded(
                low=generator.min_time,
                high=generator.max_time,
                shape=(generator.num_loc, 1),
                dtype=torch.int64,
                device=self.device,
            )
            time_windows = Bounded(
                low=generator.min_time,
                high=generator.max_time,
                shape=(
                    generator.num_loc,
                    2,
                ),  # Each location has a 2D time window (start, end)
                dtype=torch.int64,
                device=self.device,
            )
            # Extend observation specs
            self.observation_spec = Composite(
                **self.observation_spec,
                current_time=current_time,
                current_loc=current_loc,
                durations=durations,
                time_windows=time_windows,
            )

    @staticmethod
    def get_action_mask(td: TensorDict) -> torch.Tensor:
        """In addition to the constraints considered in the CVRPEnv, the time windows are considered.
        The vehicle can only visit a location if it can reach it in time, i.e. before its time window ends.

        Side effect: writes `current_loc` and `distances` (distance from the current
        location to every location) into `td`; `_step` reads `distances` back.
        """
        not_masked = CVRPEnv.get_action_mask(td)
        current_loc = gather_by_index(td["locs"], td["current_node"])
        dist = get_distance(current_loc[..., None, :], td["locs"])
        td.update({"current_loc": current_loc, "distances": dist})
        # The service only needs to start before the time window ends, not finish.
        can_reach_in_time = td["current_time"] + dist <= td["time_windows"][..., 1]
        return not_masked & can_reach_in_time

    def _step(self, td: TensorDict) -> TensorDict:
        """In addition to the calculations in the CVRPEnv, the current time is
        updated to keep track of which nodes are still reachable in time.
        The current_node is updated in the parent class' _step() function.
        """
        batch_size = td["locs"].shape[0]
        # update current_time
        distance = gather_by_index(td["distances"], td["action"]).reshape([batch_size, 1])
        duration = gather_by_index(td["durations"], td["action"]).reshape([batch_size, 1])
        start_times = gather_by_index(td["time_windows"], td["action"])[..., 0].reshape(
            [batch_size, 1]
        )
        # Waiting until the window opens is allowed; selecting the depot (action 0)
        # multiplies by zero and therefore resets the clock.
        td["current_time"] = (td["action"][:, None] != 0) * (
            torch.max(td["current_time"] + distance, start_times) + duration
        )
        # current_node is updated to the selected action
        td = super()._step(td)
        return td

    def _reset(
        self, td: Optional[TensorDict] = None, batch_size: Optional[list] = None
    ) -> TensorDict:
        """Build the initial state: depot prepended to `locs`, time and used capacity at zero."""
        device = td.device
        td_reset = TensorDict(
            {
                "locs": torch.cat((td["depot"][..., None, :], td["locs"]), -2),
                "demand": td["demand"],
                "current_node": torch.zeros(
                    *batch_size, 1, dtype=torch.long, device=device
                ),
                "current_time": torch.zeros(
                    *batch_size, 1, dtype=torch.float32, device=device
                ),
                "used_capacity": torch.zeros((*batch_size, 1), device=device),
                "vehicle_capacity": torch.full(
                    (*batch_size, 1), self.generator.vehicle_capacity, device=device
                ),
                "visited": torch.zeros(
                    (*batch_size, td["locs"].shape[-2] + 1),
                    dtype=torch.uint8,
                    device=device,
                ),
                "durations": td["durations"],
                "time_windows": td["time_windows"],
            },
            batch_size=batch_size,
        )
        td_reset.set("action_mask", self.get_action_mask(td_reset))
        return td_reset

    def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor:
        """The reward is the negative tour length. Time windows
        are not considered for the calculation of the reward."""
        return super()._get_reward(td, actions)

    @staticmethod
    def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None:
        """Assert the CVRP constraints and, in addition, that every service starts in its time window."""
        CVRPEnv.check_solution_validity(td, actions)
        batch_size = td["locs"].shape[0]
        # distances to depot
        distances = get_distance(
            td["locs"][..., 0, :], td["locs"].transpose(0, 1)
        ).transpose(0, 1)
        # basic checks on time windows
        assert torch.all(distances >= 0.0), "Distances must be non-negative."
        assert torch.all(td["time_windows"] >= 0.0), "Time windows must be non-negative."
        assert torch.all(
            td["time_windows"][..., :, 0] + distances + td["durations"]
            <= td["time_windows"][..., 0, 1][0]  # max_time is the same for all batches
        ), "vehicle cannot perform service and get back to depot in time."
        assert torch.all(
            td["durations"] >= 0.0
        ), "Service durations must be non-negative."
        assert torch.all(
            td["time_windows"][..., 0] < td["time_windows"][..., 1]
        ), "there are unfeasible time windows"
        # check vehicles can meet deadlines: replay the tour step by step
        curr_time = torch.zeros(batch_size, 1, dtype=torch.float32, device=td.device)
        curr_node = torch.zeros_like(curr_time, dtype=torch.int64, device=td.device)
        for ii in range(actions.size(1)):
            next_node = actions[:, ii]
            dist = get_distance(
                gather_by_index(td["locs"], curr_node).reshape([batch_size, 2]),
                gather_by_index(td["locs"], next_node).reshape([batch_size, 2]),
            ).reshape([batch_size, 1])
            # arrival time, or the window start if the vehicle has to wait
            curr_time = torch.max(
                (curr_time + dist).int(),
                gather_by_index(td["time_windows"], next_node)[..., 0].reshape(
                    [batch_size, 1]
                ),
            )
            assert torch.all(
                curr_time
                <= gather_by_index(td["time_windows"], next_node)[..., 1].reshape(
                    [batch_size, 1]
                )
            ), "vehicle cannot start service before deadline"
            curr_time = curr_time + gather_by_index(td["durations"], next_node).reshape(
                [batch_size, 1]
            )
            curr_node = next_node
            curr_time[curr_node == 0] = 0.0  # reset time for depot

    @staticmethod
    def render(td: TensorDict, actions: torch.Tensor = None, ax=None):
        """Render the instance/tour and hand back whatever the module-level `render` returns."""
        return render(td, actions, ax)

    @staticmethod
    def load_data(
        name: str,
        solomon=False,
        path_instances: str = None,
        type: str = None,
        compute_edge_weights: bool = False,
    ):
        """Load a Solomon instance/solution (`solomon=True`) or an npz file as a TensorDict."""
        if solomon:
            assert type in [
                "instance",
                "solution",
            ], "type must be either 'instance' or 'solution'"
            if type == "instance":
                instance = load_solomon_instance(
                    name=name, path=path_instances, edge_weights=compute_edge_weights
                )
            elif type == "solution":
                instance = load_solomon_solution(name=name, path=path_instances)
            return instance
        return load_npz_to_tensordict(filename=name)

    def extract_from_solomon(self, instance: dict, batch_size: int = 1):
        """Convert a Solomon instance dict into a reset environment state.

        The instance is repeated `batch_size` times along the batch dimension. The value
        ranges found in the instance are also stored as attributes on the environment.
        """
        # extract parameters for the environment from the Solomon instance
        self.min_demand = instance["demand"][1:].min()
        self.max_demand = instance["demand"][1:].max()
        self.vehicle_capacity = instance["capacity"]
        self.min_loc = instance["node_coord"][1:].min()
        self.max_loc = instance["node_coord"][1:].max()
        self.min_time = instance["time_window"][:, 0].min()
        self.max_time = instance["time_window"][:, 1].max()
        # assert the time window of the depot starts at 0 and ends at max_time
        assert self.min_time == 0, "Time window of depot must start at 0."
        assert (
            self.max_time == instance["time_window"][0, 1]
        ), "Depot must have latest end time."
        # convert to format used in CVRPTWEnv
        td = TensorDict(
            {
                "depot": torch.tensor(
                    instance["node_coord"][0],
                    dtype=torch.float32,
                    device=self.device,
                ).repeat(batch_size, 1),
                "locs": torch.tensor(
                    instance["node_coord"][1:],
                    dtype=torch.float32,
                    device=self.device,
                ).repeat(batch_size, 1, 1),
                "demand": torch.tensor(
                    instance["demand"][1:],
                    dtype=torch.float32,
                    device=self.device,
                ).repeat(batch_size, 1),
                "durations": torch.tensor(
                    instance["service_time"],
                    dtype=torch.int64,
                    device=self.device,
                ).repeat(batch_size, 1),
                "time_windows": torch.tensor(
                    instance["time_window"],
                    dtype=torch.int64,
                    device=self.device,
                ).repeat(batch_size, 1, 1),
            },
            # the tensors above are repeated `batch_size` times, so the TensorDict batch
            # dimension has to match (identical to the former fixed value for batch_size=1)
            batch_size=[batch_size],
        )
        return self.reset(td, batch_size=batch_size)
10 means 10 locs + 1 depot) + min_loc: minimum value for the location coordinates + max_loc: maximum value for the location coordinates, default is 150 insted of 1.0, will be scaled + loc_distribution: distribution for the location coordinates + depot_distribution: distribution for the depot location. If None, sample the depot from the locations + min_demand: minimum value for the demand of each customer + max_demand: maximum value for the demand of each customer + demand_distribution: distribution for the demand of each customer + capacity: capacity of the vehicle + max_time: maximum time for the vehicle to complete the tour + scale: if True, the locations, time windows, and service durations will be scaled to [0, 1]. Default to False + + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each city + depot [batch_size, 2]: location of the depot + demand [batch_size, num_loc]: demand of each customer + while the demand of the depot is a placeholder + capacity [batch_size, 1]: capacity of the vehicle + durations [batch_size, num_loc]: service durations of each location + time_windows [batch_size, num_loc, 2]: time windows of each location + """ + def __init__( + self, + num_loc: int = 20, + min_loc: float = 0.0, + max_loc: float = 150.0, + loc_distribution: Union[ + int, float, str, type, Callable + ] = Uniform, + depot_distribution: Union[ + int, float, str, type, Callable + ] = None, + min_demand: int = 1, + max_demand: int = 10, + demand_distribution: Union[ + int, float, type, Callable + ] = Uniform, + vehicle_capacity: float = 1.0, + capacity: float = None, + max_time: float = 480, + scale: bool = False, + **kwargs, + ): + super().__init__( + num_loc=num_loc, + min_loc=min_loc, + max_loc=max_loc, + loc_distribution=loc_distribution, + depot_distribution=depot_distribution, + min_demand=min_demand, + max_demand=max_demand, + demand_distribution=demand_distribution, + vehicle_capacity=vehicle_capacity, + 
capacity=capacity, + **kwargs, + ) + self.max_loc = max_loc + self.min_time = 0.0 + self.max_time = max_time + self.scale = scale + + def _generate(self, batch_size) -> TensorDict: + td = super()._generate(batch_size) + + batch_size = [batch_size] if isinstance(batch_size, int) else batch_size + + ## define service durations + # generate randomly (first assume service durations of 0, to be changed later) + durations = torch.zeros( + *batch_size, self.num_loc + 1, dtype=torch.float32 + ) + + ## define time windows + # 1. get distances from depot + dist = get_distance(td["depot"], td["locs"].transpose(0, 1)).transpose(0, 1) + dist = torch.cat((torch.zeros(*batch_size, 1), dist), dim=1) + + # 2. define upper bound for time windows to make sure the vehicle can get back to the depot in time + upper_bound = self.max_time - dist - durations + + # 3. create random values between 0 and 1 + ts_1 = torch.rand(*batch_size, self.num_loc + 1) + ts_2 = torch.rand(*batch_size, self.num_loc + 1) + + # 4. scale values to lie between their respective min_time and max_time and convert to integer values + min_ts = (dist + (upper_bound - dist) * ts_1).int() + max_ts = (dist + (upper_bound - dist) * ts_2).int() + + # 5. set the lower value to min, the higher to max + min_times = torch.min(min_ts, max_ts) + max_times = torch.max(min_ts, max_ts) + + # 6. reset times for depot + min_times[..., :, 0] = 0.0 + max_times[..., :, 0] = self.max_time + + # 7. 
ensure min_times < max_times to prevent numerical errors in attention.py + # min_times == max_times may lead to nan values in _inner_mha() + mask = min_times == max_times + if torch.any(mask): + min_tmp = min_times.clone() + min_tmp[mask] = torch.max( + dist[mask].int(), min_tmp[mask] - 1 + ) # we are handling integer values, so we can simply substract 1 + min_times = min_tmp + + mask = min_times == max_times # update mask to new min_times + if torch.any(mask): + max_tmp = max_times.clone() + max_tmp[mask] = torch.min( + torch.floor(upper_bound[mask]).int(), + torch.max( + torch.ceil(min_tmp[mask] + durations[mask]).int(), + max_tmp[mask] + 1, + ), + ) + max_times = max_tmp + + # Scale to [0, 1] + if self.scale: + durations = durations / self.max_time + min_times = min_times / self.max_time + max_times = max_times / self.max_time + td["depot"] = td["depot"] / self.max_time + td["locs"] = td["locs"] / self.max_time + + # 8. stack to tensor time_windows + time_windows = torch.stack((min_times, max_times), dim=-1) + + assert torch.all( + min_times < max_times + ), "Please make sure the relation between max_loc and max_time allows for feasible solutions." 
+ + # Reset duration at depot to 0 + durations[:, 0] = 0.0 + td.update( + { + "durations": durations, + "time_windows": time_windows, + } + ) + return td diff --git a/rl4co/envs/routing/cvrptw/render.py b/rl4co/envs/routing/cvrptw/render.py new file mode 100644 index 00000000..74748e1c --- /dev/null +++ b/rl4co/envs/routing/cvrptw/render.py @@ -0,0 +1,133 @@ +import torch +import numpy as np +import matplotlib.pyplot as plt + +from matplotlib import cm, colormaps + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(td, actions=None, ax=None): + num_routine = (actions == 0).sum().item() + 2 + base = colormaps["nipy_spectral"] + color_list = base(np.linspace(0, 1, num_routine)) + cmap_name = base.name + str(num_routine) + out = base.from_list(cmap_name, color_list, num_routine) + + if ax is None: + # Create a plot of the nodes + _, ax = plt.subplots() + + td = td.detach().cpu() + + if actions is None: + actions = td.get("action", None) + + # if batch_size greater than 0 , we need to select the first batch element + if td.batch_size != torch.Size([]): + td = td[0] + actions = actions[0] + + locs = td["locs"] + scale_demand = td["capacity"][0] + demands = td["demand"] * scale_demand + + # add the depot at the first action and the end action + actions = torch.cat([torch.tensor([0]), actions, torch.tensor([0])]) + + # gather locs in order of action if available + if actions is None: + log.warning("No action in TensorDict, rendering unsorted locs") + else: + locs = locs + + # Cat the first node to the end to complete the tour + x, y = locs[:, 0], locs[:, 1] + + # plot depot + ax.scatter( + locs[0, 0], + locs[0, 1], + edgecolors=cm.Set2(2), + facecolors="none", + s=100, + linewidths=2, + marker="s", + alpha=1, + ) + + # plot visited nodes + ax.scatter( + x[1:], + y[1:], + edgecolors=cm.Set2(0), + facecolors="none", + s=50, + linewidths=2, + marker="o", + alpha=1, + ) + + # plot demand 
bars + for node_idx in range(1, len(locs)): + ax.add_patch( + plt.Rectangle( + (locs[node_idx, 0] - 0.005, locs[node_idx, 1] + 0.015), + 0.01, + demands[node_idx - 1] / (scale_demand * 10), + edgecolor=cm.Set2(0), + facecolor=cm.Set2(0), + fill=True, + ) + ) + + # text demand + for node_idx in range(1, len(locs)): + ax.text( + locs[node_idx, 0], + locs[node_idx, 1] - 0.025, + f"{demands[node_idx-1].item():.2f}", + horizontalalignment="center", + verticalalignment="top", + fontsize=10, + color=cm.Set2(0), + ) + + # text depot + ax.text( + locs[0, 0], + locs[0, 1] - 0.025, + "Depot", + horizontalalignment="center", + verticalalignment="top", + fontsize=10, + color=cm.Set2(2), + ) + + # plot actions + color_idx = 0 + for action_idx in range(len(actions) - 1): + if actions[action_idx] == 0: + color_idx += 1 + from_loc = locs[actions[action_idx]] + to_loc = locs[actions[action_idx + 1]] + ax.plot( + [from_loc[0], to_loc[0]], + [from_loc[1], to_loc[1]], + color=out(color_idx), + lw=1, + ) + ax.annotate( + "", + xy=(to_loc[0], to_loc[1]), + xytext=(from_loc[0], from_loc[1]), + arrowprops=dict(arrowstyle="-|>", color=out(color_idx)), + size=15, + annotation_clip=False, + ) + + ax.set_xlim(-0.05, 1.05) + ax.set_ylim(-0.05, 1.05) diff --git a/rl4co/envs/routing/mdcpdp/__init__.py b/rl4co/envs/routing/mdcpdp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/mdcpdp/env.py b/rl4co/envs/routing/mdcpdp/env.py new file mode 100644 index 00000000..c649c5c3 --- /dev/null +++ b/rl4co/envs/routing/mdcpdp/env.py @@ -0,0 +1,400 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.utils.ops import gather_by_index + +from .generator import MDCPDPGenerator +from .render import render + + +class MDCPDPEnv(RL4COEnvBase): + """Multi Depot Capacitated Pickup and Delivery Problem (MDCPDP) 
environment. + One reference to understand the problem could be: Solving the multi-compartment capacitated location routing + problem with pickup–delivery routes and stochastic demands (https://doi.org/10.1016/j.cie.2015.05.008). + The environment is made of num_loc + num_depots locations (cities): + - num_depot depot + - num_loc / 2 pickup locations + - num_loc / 2 delivery locations + The goal is to visit all the pickup and delivery locations in the shortest path possible starting from the depot + The conditions is that the agent must visit a pickup location before visiting its corresponding delivery location + The capacity is the maximum number of pickups that the vehicle can carry at the same time + + Observations: + - locs: locations of the cities [num_loc + num_depot, 2] + - current_node: current node of the agent [1] + - to_deliver: if the node is to deliver [1] + - i: current step [1] + - action_mask: mask of the available actions [num_loc + num_depot] + - shape: shape of the observation + + Constraints: + - The agent cannot visit the same city twice + - The agent must visit the pickup location before the delivery location + - The agent must visit the depot at the end of the tour + + Finish Condition: + - The agent visited all the locations + + Reward: + - Min-sum: the reward is the negative of the length of the tour + - Min-max: the reward is the negative of the maximum length of the tour + - Lateness: the reward is the negative of the cumulate sum of the length of the tour + - Lateness-square: the reward is the negative of the cumulate sum of the square of the length of the tour + + Args: + generator: MDCPDPGenerator instance as the data generator + generator_params: parameters for the generator + dist_mode: distance mode. One of ["L1", "L2"] + reward_mode: objective of the problem. One of ["lateness", "lateness_square", "minmax", "minsum"] + problem_mode: type of the problem. One of ["close", "open"] + start_mode: type of the start. 
One of ["order", "random"] + """ + + name = "mdcpdp" + + def __init__( + self, + generator: MDCPDPGenerator = None, + generator_params: dict = {}, + dist_mode: str = "L2", + reward_mode: str = "lateness", + problem_mode: str = "close", + start_mode: str = "order", + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = MDCPDPGenerator(**generator_params) + self.generator = generator + self.dist_mode = dist_mode + self.reward_mode = reward_mode + self.problem_mode = problem_mode + self.start_mode = start_mode + self.depot_mode = generator.depot_mode + self._make_spec(self.generator) + + assert self.dist_mode in ["L1", "L2"], "Distance mode (L1/L2) not supported" + assert self.reward_mode in [ + "lateness", + "lateness_square", + "minmax", + "minsum", + ], "Objective mode not supported" + assert self.problem_mode in [ + "close", + "open", + ], "Task type (open/close) not supported" + assert self.start_mode in [ + "order", + "random", + ], "Start type (order/random) not supported" + + def _step(self, td: TensorDict) -> TensorDict: + current_node = td["action"].unsqueeze(-1) + current_depot = td["current_depot"] + + num_depot = td["capacity"].shape[-1] + num_loc = td["locs"].shape[-2] - num_depot # no depot + pd_split_idx = num_loc // 2 + num_depot + + # Pickup and delivery node pair of selected node + new_to_deliver = (current_node + num_loc // 2) % (num_loc + num_depot) + + # If back to the depot + back_flag = (current_node < num_depot) & ( + td["available"].gather(-1, current_node) == 0 + ) + + # Set available to 0 (i.e., we visited the node) + available = td["available"].scatter( + -1, current_node.expand_as(td["action_mask"]), 0 + ) + + # Record the to be delivered node + to_deliver = td["to_deliver"].scatter( + -1, new_to_deliver.expand_as(td["to_deliver"]), 1 + ) + + # Update number of current carry orders + current_carry = td["current_carry"] + current_carry += ( + (current_node < pd_split_idx) & (current_node >= num_depot) + 
).long() # If pickup, add 1 + current_carry -= (current_node >= pd_split_idx).long() # If delivery, minus 1 + + # Update the current depot + current_depot = td["current_depot"] + current_depot = torch.where(back_flag, current_node, current_depot) + + # Update the length of current tour + current_length = td["current_length"] + prev_loc = gather_by_index(td["locs"], td["current_node"]) + curr_loc = gather_by_index(td["locs"], current_node) + current_step_length = self.get_distance(prev_loc, curr_loc) + + # If this path is the way between two depods, i.e. open a new route, set the length to 0 + current_step_length = torch.where( + (current_node < num_depot) & (td["current_node"] < num_depot), + 0, + current_step_length, + ) + + # If the problem mode is open, the path back to the depot will not be counted + if self.problem_mode == "open": + current_step_length = torch.where( + (current_node < num_depot) & (td["current_node"] >= num_depot), + 0, + current_step_length, + ) + + # Update the current length + current_length.scatter_add_(-1, current_depot, current_step_length) + + # Update the arrive time for each city + arrivetime_record = td["arrivetime_record"] + arrivetime_record.scatter_( + -1, current_node, current_length.gather(-1, current_depot) + ) + + # Action is feasible if the node is not visited and is to deliver + action_mask = available & to_deliver + + # If reach the capacity, only delivery is available + current_capacity = td["capacity"].gather(-1, current_depot) + capacity_flag = current_carry >= current_capacity + action_mask[ + ..., num_depot:pd_split_idx + ] &= ~capacity_flag # If reach the capacity, pickup is not available + + # If back to the current depot, this tour is done, set other depots to availbe to start + # a new tour. Must start from a depot. 
+ action_mask[..., num_depot:] &= ~back_flag.expand_as(action_mask[..., num_depot:]) + + # If back to the depot, other unvisited depots are available + # if not back to the depot, depots are not available except the current depot + action_mask[..., :num_depot] &= back_flag.expand_as(action_mask[..., :num_depot]) + action_mask[..., :num_depot].scatter_(-1, current_depot, ~back_flag) + + # If this is the last agent, it has to finish all the left taks + last_depot_flag = ( + torch.sum(available[..., :num_depot].long(), dim=-1, keepdim=True) == 0 + ) + action_mask[..., :num_depot] &= ~last_depot_flag.expand_as( + action_mask[..., :num_depot] + ) + + # Update depot mask + carry_flag = current_carry > 0 # If agent is carrying orders + action_mask[ + ..., :num_depot + ] &= ~carry_flag # If carrying orders, depot is not available + + # We are done there are no unvisited locations + done = torch.count_nonzero(available, dim=-1) == 0 + + # If done, the last depot would be always available + action_mask[..., :num_depot].scatter_( + -1, + current_depot, + action_mask[..., :num_depot].gather(-1, current_depot) | done, + ) + + # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here + reward = torch.zeros_like(done) + + # Update step + td.update( + { + "current_node": current_node, + "current_depot": current_depot, + "current_carry": current_carry, + "available": available, + "to_deliver": to_deliver, + "i": td["i"] + 1, + "action_mask": action_mask, + "reward": reward, + "done": done, + } + ) + return td + + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + device = td.device + locs = torch.cat((td["depot"], td["locs"]), -2) + + # Record how many depots are visited + depot_idx = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) + + # Pick is 1, deliver is 0 [batch_size, graph_size+1], i.e. 
[1, 1, ..., 1, 0, ...0] + to_deliver = torch.cat( + [ + torch.ones( + *batch_size, + self.generator.num_loc // 2 + self.generator.num_depot, + dtype=torch.bool, + device=device, + ), + torch.zeros( + *batch_size, + self.generator.num_loc // 2, + dtype=torch.bool, + device=device, + ), + ], + dim=-1, + ) + + # Current depot index + if self.start_mode == "random": + current_depot = torch.randint( + low=0, high=self.generator.num_depot, size=(*batch_size, 1), device=device + ) + elif self.start_mode == "order": + current_depot = torch.zeros( + (*batch_size, 1), dtype=torch.int64, device=device + ) + + # Current carry order number + current_carry = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) + + # Current length of each depot + current_length = torch.zeros( + (*batch_size, self.generator.num_depot), dtype=torch.float32, device=device + ) + + # Arrive time for each city + arrivetime_record = torch.zeros( + (*batch_size, self.generator.num_loc + self.generator.num_depot), + dtype=torch.float32, + device=device, + ) + + # Cannot visit depot at first step # [0,1...1] so set not available + available = torch.ones( + (*batch_size, self.generator.num_loc + self.generator.num_depot), + dtype=torch.bool, + device=device, + ) + action_mask = ~available.contiguous() # [batch_size, graph_size+1] + action_mask[..., 0] = 1 # First step is always the depot + + # Other variables + current_node = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) + i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) + + return TensorDict( + { + "locs": locs, + "depot_idx": depot_idx, + "current_node": current_node, + "current_depot": current_depot, + "current_carry": current_carry, + "current_length": current_length, + "arrivetime_record": arrivetime_record, + "capacity": td["capacity"], + "lateness_weight": td["lateness_weight"], + "to_deliver": to_deliver, + "available": available, + "i": i, + "action_mask": action_mask, + }, + batch_size=batch_size, + 
) + + def _make_spec(self, generator: MDCPDPGenerator): + """Make the observation and action specs from the parameters.""" + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.num_loc + 1, 2), + dtype=torch.float32, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + to_deliver=Unbounded( + shape=(1), + dtype=torch.int64, + ), + i=Unbounded( + shape=(1), + dtype=torch.int64, + ), + action_mask=Unbounded( + shape=(generator.num_loc + 1), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.num_loc + 1, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + def get_distance(self, prev_loc, cur_loc): + # Use L1 norm to calculate the distance for Manhattan distance + if self.dist_mode == "L1": + return torch.abs(cur_loc - prev_loc).norm(p=1, dim=-1) + elif self.dist_mode == "L2": + return torch.abs(cur_loc - prev_loc).norm(p=2, dim=-1) + else: + raise ValueError(f"Invalid distance norm: {self.dist_norm}") + + def _get_reward(self, td: TensorDict, actions) -> TensorDict: + """Return the rewrad for the current state + Support modes: + - minmax: the reward is the maximum length of all agents + - minsum: the reward is the sum of all agents' length + - lateness: the reward is the sum of all agents' length plus the lateness with a weight + Args: + - actions [batch_size, num_depot+num_locs-1]: the actions taken by the agents + note that the last city back to depot is not included here + """ + # Check the validity of the actions + num_depot = td["capacity"].shape[-1] + num_loc = td["locs"].shape[-2] - num_depot # except depot + + # Append the last depot to the end of the actions + actions = torch.cat([actions, td["current_depot"]], dim=-1) + + # Calculate the reward + if self.reward_mode == "minmax": + cost = torch.max(td["current_length"], dim=-1)[0] + 
elif self.reward_mode == "minsum": + cost = torch.sum(td["current_length"], dim=-1) + elif self.reward_mode == "lateness": + cost = torch.sum(td["current_length"], dim=(-1)) + lateness = td["arrivetime_record"][..., num_depot + num_loc // 2 :] + if self.reward_mode == "lateness_square": + lateness = lateness**2 + lateness = torch.sum(lateness, dim=-1) + # lateness weight - note that if this is 0, the reward is the same as the cost + # and if this is 1, the reward is the same as the lateness + cost = ( + cost * (1 - td["lateness_weight"].squeeze()) + + lateness * td["lateness_weight"].squeeze() + ) + else: + raise NotImplementedError( + f"Invalid reward mode: {self.reward_mode}. Available modes: minmax, minsum, lateness_square, lateness" + ) + return -cost # minus for reward + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor): + assert True, "Not implemented" + + @staticmethod + def render(td: TensorDict, actions: torch.Tensor = None, ax=None): + return render(td, actions, ax) diff --git a/rl4co/envs/routing/mdcpdp/generator.py b/rl4co/envs/routing/mdcpdp/generator.py new file mode 100644 index 00000000..284e46a0 --- /dev/null +++ b/rl4co/envs/routing/mdcpdp/generator.py @@ -0,0 +1,126 @@ +from typing import Union, Callable + +import torch + +from torch.distributions import Uniform +from tensordict.tensordict import TensorDict + +from rl4co.utils.pylogger import get_pylogger +from rl4co.envs.common.utils import get_sampler, Generator + +log = get_pylogger(__name__) + + +class MDCPDPGenerator(Generator): + """Data generator for the Multi Depot Capacitated Pickup and Delivery Problem (MDCPDP) environment. 
+ + Args: + num_loc: number of locations (customers) + min_loc: minimum value for the location coordinates + max_loc: maximum value for the location coordinates, default is 150 insted of 1.0, will be scaled + loc_distribution: distribution for the location coordinates + num_depot: number of depots, each depot has one vehicle + depot_mode: mode for the depot, either single or multiple + depod_distribution: distribution for the depot coordinates + min_capacity: minimum value of the capacity + max_capacity: maximum value of the capacity + min_lateness_weight: minimum value of the lateness weight + max_lateness_weight: maximum value of the lateness weight + latebess_weight_distribution: distribution for the lateness weight + + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each customer + depot [batch_size, num_depot, 2]: locations of each depot + capacity [batch_size, 1]: capacity of the vehicle + lateness_weight [batch_size, 1]: weight of the lateness cost + """ + def __init__( + self, + num_loc: int = 20, + min_loc: float = 0.0, + max_loc: float = 1.0, + loc_distribution: Union[ + int, float, str, type, Callable + ] = Uniform, + num_depot: int = 5, + depot_mode: str = "multiple", + depot_distribution: Union[ + int, float, str, type, Callable + ] = Uniform, + min_capacity: int = 1, + max_capacity: int = 5, + min_lateness_weight: float = 1.0, + max_lateness_weight: float = 1.0, + lateness_weight_distribution: Union[ + int, float, str, type, Callable + ] = Uniform, + **kwargs + ): + self.num_loc = num_loc + self.min_loc = min_loc + self.max_loc = max_loc + self.depot_mode = depot_mode + self.num_depot = num_depot + self.min_capacity = min_capacity + self.max_capacity = max_capacity + self.min_lateness_weight = min_lateness_weight + self.max_lateness_weight = max_lateness_weight + + # Number of locations must be even + if num_loc % 2 != 0: + log.warn("Number of locations must be even. 
Adding 1 to the number of locations.") + self.num_loc += 1 + + # Check depot mode validity + assert depot_mode in ["single", "multiple"], f"Invalid depot mode: {depot_mode}" + + # Location distribution + if kwargs.get("loc_sampler", None) is not None: + self.loc_sampler = kwargs["loc_sampler"] + else: + self.loc_sampler = get_sampler("loc", loc_distribution, min_loc, max_loc, **kwargs) + + # Depot distribution + if kwargs.get("depot_sampler", None) is not None: + self.depot_sampler = kwargs["depot_sampler"] + else: + self.depot_sampler = get_sampler("depot", depot_distribution, min_loc, max_loc, **kwargs) + + # Lateness weight distribution + if kwargs.get("lateness_weight_sampler", None) is not None: + self.lateness_weight_sampler = kwargs["lateness_weight_sampler"] + else: + self.lateness_weight_sampler = get_sampler( + "lateness_weight", lateness_weight_distribution, min_lateness_weight, max_lateness_weight, **kwargs + ) + + def _generate(self, batch_size) -> TensorDict: + # Sample locations + locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2)) + + # Sample depot + if self.depot_mode == "single": + depot = self.depot_sampler.sample((*batch_size, 2))[:, None, :].repeat(1, self.num_depot, 1) + else: + depot = self.depot_sampler.sample((*batch_size, self.num_depot, 2)) + + # Sample capacity + capacity = torch.randint( + self.min_capacity, + self.max_capacity + 1, + size=(*batch_size, 1), + ) + + # Sample lateness weight + lateness_weight = self.lateness_weight_sampler.sample((*batch_size, 1)) + + return TensorDict( + { + "locs": locs, + "depot": depot, + "capacity": capacity, + "lateness_weight": lateness_weight, + }, + batch_size=batch_size, + ) diff --git a/rl4co/envs/routing/mdcpdp/render.py b/rl4co/envs/routing/mdcpdp/render.py new file mode 100644 index 00000000..5711b1d7 --- /dev/null +++ b/rl4co/envs/routing/mdcpdp/render.py @@ -0,0 +1,120 @@ +from tensordict.tensordict import TensorDict + + +def render(td: TensorDict, actions=None, ax=None): + 
import matplotlib.pyplot as plt + markersize = 8 + + td = td.detach().cpu() + + # If batch_size greater than 0 , we need to select the first batch element + if td.batch_size != torch.Size([]): + td = td[0] + if actions is not None: + actions = actions[0] + + n_depots = td["capacity"].size(-1) + n_pickups = (td["locs"].size(-2) - n_depots) // 2 + + # Variables + init_deliveries = td["to_deliver"][n_depots:] + delivery_locs = td["locs"][n_depots:][~init_deliveries.bool()] + pickup_locs = td["locs"][n_depots:][init_deliveries.bool()] + depot_locs = td["locs"][:n_depots] + actions = actions if actions is not None else td["action"] + + if ax is None: + _, ax = plt.subplots(figsize=(4, 4)) + + # Plot the actions in order + last_depot = 0 + for i in range(len(actions)-1): + if actions[i+1] < n_depots: + last_depot = actions[i+1] + if actions[i] < n_depots and actions[i+1] < n_depots: + continue + from_node = actions[i] + to_node = ( + actions[i + 1] if i < len(actions) - 1 else actions[0] + ) # last goes back to depot + from_loc = td["locs"][from_node] + to_loc = td["locs"][to_node] + ax.plot([from_loc[0], to_loc[0]], [from_loc[1], to_loc[1]], "k-") + ax.annotate( + "", + xy=(to_loc[0], to_loc[1]), + xytext=(from_loc[0], from_loc[1]), + arrowprops=dict(arrowstyle="->", color="black"), + annotation_clip=False, + ) + + # Plot last back to the depot + from_node = actions[-1] + to_node = last_depot + from_loc = td["locs"][from_node] + to_loc = td["locs"][to_node] + ax.plot([from_loc[0], to_loc[0]], [from_loc[1], to_loc[1]], "k-") + ax.annotate( + "", + xy=(to_loc[0], to_loc[1]), + xytext=(from_loc[0], from_loc[1]), + arrowprops=dict(arrowstyle="->", color="black"), + annotation_clip=False, + ) + + # Annotate node location + for i, loc in enumerate(td["locs"]): + ax.annotate( + str(i), + (loc[0], loc[1]), + textcoords="offset points", + xytext=(0, 5), + ha="center", + ) + + for i, depot_loc in enumerate(depot_locs): + ax.plot( + depot_loc[0], + depot_loc[1], + "tab:green", + 
marker="s", + markersize=markersize, + label="Depot" if i == 0 else None, + ) + + # Plot the pickup locations + for i, pickup_loc in enumerate(pickup_locs): + ax.plot( + pickup_loc[0], + pickup_loc[1], + "tab:red", + marker="^", + markersize=markersize, + label="Pickup" if i == 0 else None, + ) + + # Plot the delivery locations + for i, delivery_loc in enumerate(delivery_locs): + ax.plot( + delivery_loc[0], + delivery_loc[1], + "tab:blue", + marker="x", + markersize=markersize, + label="Delivery" if i == 0 else None, + ) + + # Plot pickup and delivery pair: from loc[n_depot + i ] to loc[n_depot + n_pickups + i] + for i in range(n_pickups): + pickup_loc = td["locs"][n_depots + i] + delivery_loc = td["locs"][n_depots + n_pickups + i] + ax.plot( + [pickup_loc[0], delivery_loc[0]], + [pickup_loc[1], delivery_loc[1]], + "k--", + alpha=0.5, + ) + + # Setup limits and show + ax.set_xlim(-0.05, 1.05) + ax.set_ylim(-0.05, 1.05) diff --git a/rl4co/envs/routing/mpdp/__init__.py b/rl4co/envs/routing/mpdp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/mpdp/env.py b/rl4co/envs/routing/mpdp/env.py new file mode 100644 index 00000000..21143abe --- /dev/null +++ b/rl4co/envs/routing/mpdp/env.py @@ -0,0 +1,394 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +from .generator import MPDPGenerator +from .render import render + +log = get_pylogger(__name__) + + +class MPDPEnv(RL4COEnvBase): + """Multi-agent Pickup and Delivery Problem (mPDP) environment. + The goal is to pick up and deliver all the packages while satisfying the precedence constraints. + When an agent goes back to the depot, a new agent is spawned. 
In the min-max version, the goal is to minimize the + maximum tour length among all agents. The reward is 0 unless the agent visits all the customers. + In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length. + + Observations: + - locations of the depot, pickup, and delivery locations + - current location of the vehicle + - the remaining locations to deliver + - the visited locations + - the current step + + Constraints: + - the tour starts and ends at the depot + - each pickup location must be visited before its corresponding delivery location + - the vehicle cannot visit the same location twice + + Finish Condition: + - the vehicle has visited all locations + + Reward: + - (minus) the negative length of the path + + Args: + generator: MPDPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "mpdp" + + def __init__( + self, + generator: MPDPGenerator = None, + generator_params: dict = {}, + objective: str = "minmax", + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = MPDPGenerator(**generator_params) + self.generator = generator + self.objective = objective + self._make_spec(self.generator) + + def _step(self, td: TensorDict) -> TensorDict: + selected = td["action"][:, None] # Add dimension for step + + agent_num = td["lengths"].size(1) + n_loc = td["to_delivery"].size(-1) - agent_num - 1 + + new_to_delivery = (selected + n_loc // 2) % ( + n_loc + agent_num + 1 + ) # the pair node of selected node + + is_request = (selected > agent_num) & (selected <= agent_num + n_loc // 2) + td["left_request"][is_request] -= 1 + depot_distance = td["depot_distance"].scatter(-1, selected, 0) + + add_pd = td["add_pd_distance"][is_request.squeeze(-1), :].gather( + -1, selected[is_request.squeeze(-1), :] - agent_num - 1 + ) + td["longest_lengths"][is_request.squeeze(-1), :].scatter_add_( + -1, td["count_depot"][is_request.squeeze(-1), 
:], add_pd + ) + td["add_pd_distance"][is_request.squeeze(-1), :].scatter_( + -1, selected[is_request.squeeze(-1), :] - agent_num - 1, 0 + ) + remain_sum_paired_distance = td["add_pd_distance"].sum(-1, keepdim=True) + remain_pickup_max_distance = depot_distance[:, : agent_num + 1 + n_loc // 2].max( + dim=-1, keepdim=True + )[0] + remain_delivery_max_distance = depot_distance[ + :, agent_num + 1 + n_loc // 2 : + ].max(dim=-1, keepdim=True)[0] + + # Calculate makespan + cur_coord = gather_by_index(td["locs"], selected) + path_lengths = (cur_coord - td["cur_coord"]).norm(p=2, dim=-1) + + td["lengths"].scatter_add_(-1, td["count_depot"], path_lengths.unsqueeze(-1)) + + # If visit depot then plus one to count_depot\ + td["count_depot"][ + (selected == td["agent_idx"]) & (td["agent_idx"] < agent_num) + ] += 1 # torch.ones(td["count_depot"][(selected == 0) & (td["agent_idx"] < agent_num)].shape, dtype=torch.int64, device=td["count_depot"].device) + + # `agent_idx` is added by 1 if the current agent comes back to depot + agent_idx = (td["count_depot"] + 1) * torch.ones( + selected.size(0), 1, dtype=torch.long, device=td["count_depot"].device + ) + visited = td["visited"].scatter(-1, selected.unsqueeze(-1), 1) + to_delivery = td["to_delivery"].scatter(-1, new_to_delivery[:, :, None], 1) + + # Get done and reward + done = visited.all(dim=-1, keepdim=True).squeeze(-1) + reward = torch.zeros_like(done) + + td.update( + { + "visited": visited, + "agent_idx": agent_idx, + "cur_coord": cur_coord, + "to_delivery": to_delivery, + "depot_distance": depot_distance, + "remain_sum_paired_distance": remain_sum_paired_distance, + "remain_pickup_max_distance": remain_pickup_max_distance, + "remain_delivery_max_distance": remain_delivery_max_distance, + "i": td["i"] + 1, + "done": done, + "reward": reward, + } + ) + td.set("action_mask", self.get_action_mask(td)) + return td + + def _reset( + self, + td: Optional[TensorDict] = None, + batch_size: Optional[list] = None, + agent_num: 
Optional[int] = None, # NOTE hardcoded from ET + ) -> TensorDict: + device = td.device + + # NOTE: this is a hack to get the agent_num + # agent_num = td["agent_num"][0].item() if agent_num is None else agent_num + # agent_num = agent_num if agent_num is not None else td["agent_num"][0].item() + + depot = td["depot"] + depot = depot.repeat(1, agent_num + 1, 1) + loc = td["locs"] + left_request = loc.size(1) // 2 + whole_instance = torch.cat((depot, loc), dim=1) + + # Distance from all nodes between each other + distance = torch.cdist(whole_instance, whole_instance, p=2) + index = torch.arange(left_request, 2 * left_request, device=device)[None, :, None] + index = index.repeat(distance.shape[0], 1, 1) + add_pd_distance = distance[ + :, agent_num + 1 : agent_num + 1 + left_request, agent_num + 1 : + ].gather(-1, index) + add_pd_distance = add_pd_distance.squeeze(-1) + + remain_pickup_max_distance = distance[:, 0, : agent_num + 1 + left_request].max( + dim=-1, keepdim=True + )[0] + remain_delivery_max_distance = distance[:, 0, agent_num + 1 + left_request :].max( + dim=-1, keepdim=True + )[0] + remain_sum_paired_distance = add_pd_distance.sum(dim=-1, keepdim=True) + + # Distance from depot to all nodes + # Delivery nodes should consider the sum of distance from depot to paired pickup nodes and pickup nodes to delivery nodes + distance[:, 0, agent_num + 1 : agent_num + 1 + left_request] = ( + distance[:, 0, agent_num + 1 : agent_num + 1 + left_request] + + distance[:, 0, agent_num + 1 + left_request :] + ) + + # Distance from depot to all nodes + depot_distance = distance[:, 0, :] + depot_distance[:, agent_num + 1 : agent_num + 1 + left_request] = depot_distance[ + :, agent_num + 1 : agent_num + 1 + left_request + ] # + add_pd_distance + + batch_size, n_loc, _ = loc.size() + to_delivery = torch.cat( + [ + torch.ones( + batch_size, + 1, + n_loc // 2 + agent_num + 1, + dtype=torch.uint8, + device=device, + ), + torch.zeros(batch_size, 1, n_loc // 2, dtype=torch.uint8, 
device=device), + ], + dim=-1, + ) + + # Create reset TensorDict + td_reset = TensorDict( + { + "locs": torch.cat((depot, loc), -2), + "visited": torch.zeros( + batch_size, + 1, + n_loc + agent_num + 1, + dtype=torch.uint8, + device=device, + ), + "lengths": torch.zeros(batch_size, agent_num, device=device), + "longest_lengths": torch.zeros(batch_size, agent_num, device=device), + "cur_coord": ( + td["depot"] if len(td["depot"].shape) == 2 else td["depot"].squeeze(1) + ), + "i": torch.zeros( + batch_size, dtype=torch.int64, device=device + ), # Vector with length num_steps + "to_delivery": to_delivery, + "count_depot": torch.zeros( + batch_size, 1, dtype=torch.int64, device=device + ), + "agent_idx": torch.ones(batch_size, 1, dtype=torch.long, device=device), + "left_request": left_request + * torch.ones(batch_size, 1, dtype=torch.long, device=device), + "remain_pickup_max_distance": remain_pickup_max_distance, + "remain_delivery_max_distance": remain_delivery_max_distance, + "depot_distance": depot_distance, + "remain_sum_paired_distance": remain_sum_paired_distance, + "add_pd_distance": add_pd_distance, + }, + batch_size=batch_size, + ) + td_reset.set("action_mask", self.get_action_mask(td_reset)) + return td_reset + + @staticmethod + def get_action_mask(td: TensorDict) -> torch.Tensor: + """Get the action mask for the current state.""" + + visited_loc = td["visited"].clone() + + agent_num = td["lengths"].size(1) + n_loc = visited_loc.size(-1) - agent_num - 1 # num of customers + batch_size = visited_loc.size(0) + agent_idx = td["agent_idx"][:, None, :] + mask_loc = visited_loc.to(td["to_delivery"].device) | (1 - td["to_delivery"]) + + # depot + if td["i"][0].item() != 0: + mask_loc[:, :, : agent_num + 1] = 1 + + # if deliver nodes which is assigned agent is complete, then agent can go to depot + no_item_to_delivery = ( + visited_loc[:, :, n_loc // 2 + agent_num + 1 :] + == td["to_delivery"][:, :, n_loc // 2 + agent_num + 1 :] + ).all(dim=-1) + 
mask_loc[no_item_to_delivery.squeeze(-1), :, :] = mask_loc[ + no_item_to_delivery.squeeze(-1), :, : + ].scatter_(-1, agent_idx[no_item_to_delivery.squeeze(-1), :, :], 0) + + condition = (td["count_depot"] == agent_num - 1) & ( + (visited_loc[:, :, agent_num + 1 :] == 0).sum(dim=-1) != 0 + ) + + mask_loc[..., agent_num][condition] = 1 + + else: + return ( + torch.cat( + [ + torch.zeros( + batch_size, 1, 1, dtype=torch.uint8, device=mask_loc.device + ), + torch.ones( + batch_size, + 1, + n_loc + agent_num, + dtype=torch.uint8, + device=mask_loc.device, + ), + ], + dim=-1, + ) + > 0 + ) + action_mask = mask_loc == 0 # action_mask gets feasible actions + return action_mask + + def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor: + # Calculate the reward (negative tour length) + if self.objective == "minmax": + return -td["lengths"].max(dim=-1, keepdim=True)[0].squeeze(-1) + elif self.objective == "minsum": + return -td["lengths"].sum(dim=-1, keepdim=True).squeeze(-1) + else: + raise ValueError(f"Unknown objective {self.objective}") + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None: + assert True, "Not implemented" + + def _make_spec(self, generator: MPDPGenerator): + """Make the observation and action specs from the parameters.""" + max_nodes = self.num_loc + self.max_num_agents + 1 + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(max_nodes, 2), + dtype=torch.float32, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + action_mask=Unbounded( + shape=(max_nodes, 1), + dtype=torch.bool, + ), + visited=Unbounded( + shape=(1, max_nodes), + dtype=torch.bool, + ), + lengths=Unbounded( + shape=(generator.max_num_agents,), + dtype=torch.float32, + ), + longest_lengths=Unbounded( + shape=(generator.max_num_agents,), + dtype=torch.float32, + ), + cur_coord=Bounded( + low=generator.min_loc, + high=generator.max_loc, + 
shape=(2,), + dtype=torch.float32, + ), + to_delivery=Unbounded( + shape=(max_nodes, 1), + dtype=torch.bool, + ), + count_depot=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + agent_idx=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + left_request=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + remain_pickup_max_distance=Unbounded( + shape=(1,), + dtype=torch.float32, + ), + remain_delivery_max_distance=Unbounded( + shape=(1,), + dtype=torch.float32, + ), + depot_distance=Unbounded( + shape=(max_nodes,), + dtype=torch.float32, + ), + remain_sum_paired_distance=Unbounded( + shape=(1,), + dtype=torch.float32, + ), + add_pd_distance=Unbounded( + shape=(max_nodes,), + dtype=torch.float32, + ), + ## NOTE: we should have a vectorized implementation for agent_num + # agent_num=Unbounded( + # shape=(1,), + # dtype=torch.int64, + # ), + i=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=max_nodes, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + @staticmethod + def render(td: TensorDict, actions: torch.Tensor = None, ax=None): + return render(td, actions, ax) diff --git a/rl4co/envs/routing/mpdp/generator.py b/rl4co/envs/routing/mpdp/generator.py new file mode 100644 index 00000000..13f42932 --- /dev/null +++ b/rl4co/envs/routing/mpdp/generator.py @@ -0,0 +1,95 @@ +from typing import Union, Callable + +import torch + +from torch.distributions import Uniform +from tensordict.tensordict import TensorDict + +from rl4co.utils.pylogger import get_pylogger +from rl4co.envs.common.utils import get_sampler, Generator + +log = get_pylogger(__name__) + + +class MPDPGenerator(Generator): + """Data generator for the Capacitated Vehicle Routing Problem (CVRP). 
+ Args: + num_loc: number of locations + min_loc: minimum location value + max_loc: maximum location value + loc_distribution: distribution for the locations + depot_distribution: distribution for the depot location. If None, sample the depot from the locations + min_num_agents: minimum number of agents + max_num_agents: maximum number of agents + + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each customer and the depot + depot [batch_size, 2]: location of the depot + num_agents [batch_size]: number of agents + """ + def __init__( + self, + num_loc: int = 20, + min_loc: float = 0.0, + max_loc: float = 1.0, + loc_distribution: Union[ + int, float, str, type, Callable + ] = Uniform, + depot_distribution: Union[ + int, float, str, type, Callable + ] = None, + min_num_agents: int = 2, + max_num_agents: int = 10, + **kwargs + ): + self.num_loc = num_loc + self.min_loc = min_loc + self.max_loc = max_loc + self.min_num_agents = min_num_agents + self.max_num_agents = max_num_agents + + # Number of locations must be even + if num_loc % 2 != 0: + log.warn("Number of locations must be even. 
Adding 1 to the number of locations.") + self.num_loc += 1 + + # Location distribution + if kwargs.get("loc_sampler", None) is not None: + self.loc_sampler = kwargs["loc_sampler"] + else: + self.loc_sampler = get_sampler("loc", loc_distribution, min_loc, max_loc, **kwargs) + + # Depot distribution + if kwargs.get("depot_sampler", None) is not None: + self.depot_sampler = kwargs["depot_sampler"] + else: + self.depot_sampler = get_sampler("depot", depot_distribution, min_loc, max_loc, **kwargs) if depot_distribution is not None else None + + + def _generate(self, batch_size) -> TensorDict: + # Sample locations: depot and customers + if self.depot_sampler is not None: + depot = self.depot_sampler.sample((*batch_size, 2)) + locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2)) + else: + # if depot_sampler is None, sample the depot from the locations + locs = self.loc_sampler.sample((*batch_size, self.num_loc + 1, 2)) + depot = locs[..., 0, :] + locs = locs[..., 1:, :] + + # Sample the number of agents + num_agents = torch.randint( + self.min_num_agents, + self.max_num_agents + 1, + size=(*batch_size, ), + ) + + return TensorDict( + { + "locs": locs, + "depot": depot, + "num_agents": num_agents, + }, + batch_size=batch_size, + ) diff --git a/rl4co/envs/routing/mpdp/render.py b/rl4co/envs/routing/mpdp/render.py new file mode 100644 index 00000000..1f49a2f9 --- /dev/null +++ b/rl4co/envs/routing/mpdp/render.py @@ -0,0 +1,114 @@ +import torch +import numpy as np +import matplotlib.pyplot as plt + +from matplotlib import cm, colormaps + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(td, actions=None, ax=None): + # TODO: color switch with new agents; add pickup and delivery nodes as in `PDPEnv.render` + + import matplotlib.pyplot as plt + import numpy as np + + from matplotlib import cm, colormaps + + num_routine = (actions == 0).sum().item() + 2 + base = 
colormaps["nipy_spectral"] + color_list = base(np.linspace(0, 1, num_routine)) + cmap_name = base.name + str(num_routine) + out = base.from_list(cmap_name, color_list, num_routine) + + if ax is None: + # Create a plot of the nodes + _, ax = plt.subplots() + + td = td.detach().cpu() + + if actions is None: + actions = td.get("action", None) + + # if batch_size greater than 0 , we need to select the first batch element + if td.batch_size != torch.Size([]): + td = td[0] + actions = actions[0] + + locs = td["locs"] + + # add the depot at the first action and the end action + actions = torch.cat([torch.tensor([0]), actions, torch.tensor([0])]) + + # gather locs in order of action if available + if actions is None: + log.warning("No action in TensorDict, rendering unsorted locs") + else: + locs = locs + + # Cat the first node to the end to complete the tour + x, y = locs[:, 0], locs[:, 1] + + # plot depot + ax.scatter( + locs[0, 0], + locs[0, 1], + edgecolors=cm.Set2(2), + facecolors="none", + s=100, + linewidths=2, + marker="s", + alpha=1, + ) + + # plot visited nodes + ax.scatter( + x[1:], + y[1:], + edgecolors=cm.Set2(0), + facecolors="none", + s=50, + linewidths=2, + marker="o", + alpha=1, + ) + + # text depot + ax.text( + locs[0, 0], + locs[0, 1] - 0.025, + "Depot", + horizontalalignment="center", + verticalalignment="top", + fontsize=10, + color=cm.Set2(2), + ) + + # plot actions + color_idx = 0 + for action_idx in range(len(actions) - 1): + if actions[action_idx] == 0: + color_idx += 1 + from_loc = locs[actions[action_idx]] + to_loc = locs[actions[action_idx + 1]] + ax.plot( + [from_loc[0], to_loc[0]], + [from_loc[1], to_loc[1]], + color=out(color_idx), + lw=1, + ) + ax.annotate( + "", + xy=(to_loc[0], to_loc[1]), + xytext=(from_loc[0], from_loc[1]), + arrowprops=dict(arrowstyle="-|>", color=out(color_idx)), + size=15, + annotation_clip=False, + ) + + # Setup limits and show + ax.set_xlim(-0.05, 1.05) + ax.set_ylim(-0.05, 1.05) diff --git 
a/rl4co/envs/routing/mtsp/__init__.py b/rl4co/envs/routing/mtsp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/mtsp/env.py b/rl4co/envs/routing/mtsp/env.py new file mode 100644 index 00000000..bf39cf74 --- /dev/null +++ b/rl4co/envs/routing/mtsp/env.py @@ -0,0 +1,240 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.envs.common.utils import batch_to_scalar +from rl4co.utils.ops import gather_by_index, get_distance, get_tour_length + +from .generator import MTSPGenerator +from .render import render + + +class MTSPEnv(RL4COEnvBase): + """Multiple Traveling Salesman Problem environment + At each step, an agent chooses to visit a city. A maximum of `num_agents` agents can be employed to visit the cities. + The cost can be defined in two ways: + - `minmax`: (default) the reward is the maximum of the path lengths of all the agents + - `sum`: the cost is the sum of the path lengths of all the agents + Reward is - cost, so the goal is to maximize the reward (minimize the cost). + + Observations: + - locations of the depot and each customer. + - number of agents. + - the current agent index. + - the current location of the vehicle. + + Constrains: + - each agent's tour starts and ends at the depot. + - each customer must be visited exactly once. + + Finish condition: + - all customers are visited and all agents back to the depot. + + Reward: + There are two ways to calculate the cost (-reward): + - `minmax`: (default) the cost is the maximum of the path lengths of all the agents. + - `sum`: the cost is the sum of the path lengths of all the agents. 
+ + Args: + cost_type: type of cost to use, either `minmax` or `sum` + generator: MTSPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "mtsp" + + def __init__( + self, + generator: MTSPGenerator = None, + generator_params: dict = {}, + cost_type: str = "minmax", + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = MTSPGenerator(**generator_params) + self.generator = generator + self.cost_type = cost_type + self._make_spec(self.generator) + + @staticmethod + def _step(td: TensorDict) -> TensorDict: + # Initial variables + is_first_action = batch_to_scalar(td["i"]) == 0 + current_node = td["action"] + first_node = current_node if is_first_action else td["first_node"] + + # Get the locations of the current node and the previous node and the depot + cur_loc = gather_by_index(td["locs"], current_node) + prev_loc = gather_by_index( + td["locs"], td["current_node"] + ) # current_node is the previous node + depot_loc = td["locs"][..., 0, :] + + # If current_node is the depot, then increment agent_idx + cur_agent_idx = td["agent_idx"] + (current_node == 0).long() + + # Set not visited to 0 (i.e., we visited the node) + available = td["action_mask"].scatter( + -1, current_node[..., None].expand_as(td["action_mask"]), 0 + ) + # Available[..., 0] is the depot, which is always available unless: + # - current_node is the depot + # - agent_idx greater than num_agents -1 + available[..., 0] = torch.logical_and( + current_node != 0, td["agent_idx"] < td["num_agents"] - 1 + ) + + # We are done there are no unvisited locations except the depot + done = torch.count_nonzero(available[..., 1:], dim=-1) == 0 + + # If done is True, then we make the depot available again, so that it will be selected as the next node with prob 1 + available[..., 0] = torch.logical_or(done, available[..., 0]) + + # Update the current length + current_length = td["current_length"] + get_distance(cur_loc, prev_loc) + + # 
If done, we add the distance from the current_node to the depot as well + current_length = torch.where( + done, current_length + get_distance(cur_loc, depot_loc), current_length + ) + + # We update the max_subtour_length and reset the current_length + max_subtour_length = torch.where( + current_length > td["max_subtour_length"], + current_length, + td["max_subtour_length"], + ) + + # If current agent is different from previous agent, then we have a new subtour and reset the length + current_length *= (cur_agent_idx == td["agent_idx"]).float() + + # The reward is the negative of the max_subtour_length (minmax objective) + reward = -max_subtour_length + + td.update( + { + "max_subtour_length": max_subtour_length, + "current_length": current_length, + "agent_idx": cur_agent_idx, + "first_node": first_node, + "current_node": current_node, + "i": td["i"] + 1, + "action_mask": available, + "reward": reward, + "done": done, + } + ) + + return td + + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + device = td.device + + # Keep track of the agent number to know when to stop + agent_idx = torch.zeros((*batch_size,), dtype=torch.int64, device=device) + + # Make variable for max_subtour_length between subtours + max_subtour_length = torch.zeros(batch_size, dtype=torch.float32, device=device) + current_length = torch.zeros(batch_size, dtype=torch.float32, device=device) + + # Other variables + current_node = torch.zeros((*batch_size,), dtype=torch.int64, device=device) + available = torch.ones( + (*batch_size, self.generator.num_loc), dtype=torch.bool, device=device + ) # 1 means not visited, i.e. 
action is allowed + available[..., 0] = 0 # Depot is not available as first node + i = torch.zeros((*batch_size,), dtype=torch.int64, device=device) + + return TensorDict( + { + "locs": td["locs"], # depot is first node + "num_agents": td["num_agents"], + "max_subtour_length": max_subtour_length, + "current_length": current_length, + "agent_idx": agent_idx, + "first_node": current_node, + "current_node": current_node, + "i": i, + "action_mask": available, + }, + batch_size=batch_size, + ) + + def _make_spec(self, generator: MTSPGenerator): + """Make the observation and action specs from the parameters.""" + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.num_loc, 2), + dtype=torch.float32, + ), + num_agents=Unbounded( + shape=(1), + dtype=torch.int64, + ), + agent_idx=Unbounded( + shape=(1), + dtype=torch.int64, + ), + current_length=Unbounded( + shape=(1), + dtype=torch.float32, + ), + max_subtour_length=Unbounded( + shape=(1), + dtype=torch.float32, + ), + first_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + i=Unbounded( + shape=(1), + dtype=torch.int64, + ), + action_mask=Unbounded( + shape=(generator.num_loc), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.num_loc, + ) + self.reward_spec = Unbounded() + self.done_spec = Unbounded(dtype=torch.bool) + + def _get_reward(self, td, actions=None) -> TensorDict: + # With minmax, get the maximum distance among subtours, calculated in the model + if self.cost_type == "minmax": + return td["reward"].squeeze(-1) + + # With distance, same as TSP + elif self.cost_type == "sum": + locs = td["locs"] + locs_ordered = locs.gather(1, actions.unsqueeze(-1).expand_as(locs)) + return -get_tour_length(locs_ordered) + + else: + raise ValueError(f"Cost type {self.cost_type} not supported") + + 
@staticmethod
def check_solution_validity(td: TensorDict, actions: torch.Tensor):
    """Placeholder for solution validation; currently checks nothing.

    Neither ``td`` nor ``actions`` is inspected. The assertion below is
    always true, so this never raises.
    """
    # `assert True` can never fail; the message only marks the missing check.
    assert True, "Not implemented"
def render(td, actions=None, ax=None):
    """Plot an mTSP instance together with the tours encoded in ``actions``.

    Args:
        td: TensorDict holding ``locs`` (index 0 is drawn as the depot) and
            ``num_agents``. If it is batched, only the first element is drawn.
        actions: visiting order; falls back to ``td["action"]`` when omitted.
            Every departure from node 0 switches to the next agent's colour.
        ax: matplotlib axes to draw on. A new figure is created only when
            this is ``None``.

    Returns:
        The axes that were drawn on.

    Raises:
        ValueError: if no actions are given and ``td`` has no ``"action"``.
    """

    def discrete_cmap(num, base_cmap="nipy_spectral"):
        """Create an N-bin discrete colormap from the specified input map"""
        base = colormaps[base_cmap]
        color_list = base(np.linspace(0, 1, num))
        cmap_name = base.name + str(num)
        return base.from_list(cmap_name, color_list, num)

    if actions is None:
        actions = td.get("action", None)
    if actions is None:
        raise ValueError("No actions to render: pass `actions` or set td['action']")

    # A batched input is reduced to its first element.
    if td.batch_size != torch.Size([]):
        td = td[0]
        actions = actions[0]

    # Plain Python / CPU values, so plotting also works for tensors that live
    # on another device or track gradients.
    num_agents = int(td["num_agents"])
    locs = td["locs"].detach().cpu()
    route = [0, *actions.detach().cpu().tolist(), 0]  # start and end at the depot

    cmap = discrete_cmap(num_agents, "rainbow")

    # Honour a caller-supplied axes instead of always opening a new figure.
    if ax is None:
        _, ax = plt.subplots()

    # Nodes: the depot as a green square, customers as blue circles. Only the
    # first customer carries a label so the legend shows a single entry.
    for i, loc in enumerate(locs):
        if i == 0:
            style = dict(marker="s", color="g", label="Depot", markersize=10)
        else:
            style = dict(
                marker="o",
                color="tab:blue",
                label="Customers" if i == 1 else "",
                markersize=8,
            )
        ax.plot(loc[0], loc[1], **style)

    # Edges: walk consecutive pairs; leaving the depot starts the next agent.
    agent_idx = 0
    for from_node, to_node in zip(route, route[1:]):
        if from_node == 0:
            agent_idx += 1
        color = cmap(num_agents - agent_idx)

        from_loc = locs[from_node]
        to_loc = locs[to_node]
        ax.plot([from_loc[0], to_loc[0]], [from_loc[1], to_loc[1]], color=color)
        ax.annotate(
            "",
            xy=(to_loc[0], to_loc[1]),
            xytext=(from_loc[0], from_loc[1]),
            arrowprops=dict(arrowstyle="->", color=color),
            annotation_clip=False,
        )

    # Legend
    handles, labels = ax.get_legend_handles_labels()
    ax.legend(handles, labels)
    ax.set_title("mTSP")
    ax.set_xlabel("x-coordinate")
    ax.set_ylabel("y-coordinate")
    return ax
def solve(
    instance: TensorDict,
    max_runtime: float,
    problem_type: str,
    num_runs: int,
    solver_loc: str,
) -> tuple[Tensor, Tensor]:
    """
    Solves an AnyVRP instance with LKH3.

    Args:
        instance: The AnyVRP instance to solve.
        max_runtime: The maximum runtime for the solver.
        problem_type: The problem type for LKH3.
        num_runs: The number of runs to perform and returns the best result.
        solver_loc: The location of the LKH3 solver executable.

    Returns:
        A tuple containing the action and the cost, respectively.
    """
    # NOTE(review): `_solve` returns `routes2action(routes)`, a plain Python
    # list, so `action` is not a Tensor here despite the annotation.
    problem = instance2problem(instance, problem_type, LKH_SCALING_FACTOR)
    action, cost = _solve(problem, max_runtime, num_runs, solver_loc)
    # Dividing by the negated factor undoes the integer scaling applied in
    # `instance2problem` and flips the sign of the cost in one step.
    cost /= -LKH_SCALING_FACTOR

    return action, cost
+ + Returns: + A tuple containing the action and the cost, respectively. + """ + routes, cost = lkh.solve( + solver_loc, + problem=problem, + time_limit=max_runtime, + runs=num_runs, + ) + + action = routes2action(routes) + return action, cost + + +def instance2problem( + instance: TensorDict, + problem_type: str, + scaling_factor, +) -> lkh.LKHProblem: + """ + Converts an AnyVRP instance to an LKHProblem instance. + + Args: + instance: The AnyVRP instance to convert. + problem_type: The problem type for LKH3. + scaling_factor: The scaling factor to apply to the instance data. + + Returns: + The LKHProblem instance. + """ + num_locations = instance["demand_linehaul"].size()[0] + + # Data specifications + specs = {} + specs["DIMENSION"] = num_locations + specs["CAPACITY"] = scale(instance["vehicle_capacity"], scaling_factor) + + if not np.isinf(distance_limit := instance["distance_limit"]).any(): + specs["DISTANCE"] = scale(distance_limit, scaling_factor) + + specs["EDGE_WEIGHT_TYPE"] = "EXPLICIT" + specs["EDGE_WEIGHT_FORMAT"] = "FULL_MATRIX" + specs["NODE_COORD_TYPE"] = "TWOD_COORDS" + + # LKH can only solve VRP variants that are explicitly supported (so no + # arbitrary combinations between individual supported features). We can + # support some open variants with some modeling tricks. + lkh_problem_type = ROUTEFINDER2LKH[problem_type] + if lkh_problem_type is None: + raise ValueError(f"Problem type {problem_type} is not supported by LKH.") + + specs["TYPE"] = lkh_problem_type + + # Weird LKH quirk: specifying the number of vehicles lets (D)CVRP hang. 
+ if lkh_problem_type not in ["CVRP", "DCVRP"]: + specs["VEHICLES"] = num_locations - 1 + + # Data sections + sections = {} + sections["NODE_COORD_SECTION"] = scale(instance["locs"], scaling_factor) + + demand_linehaul = scale(instance["demand_linehaul"], scaling_factor) + demand_backhaul = scale(instance["demand_backhaul"], scaling_factor) + sections["DEMAND_SECTION"] = demand_linehaul + demand_backhaul + + time_windows = scale(instance["time_windows"], scaling_factor) + sections["TIME_WINDOW_SECTION"] = time_windows + + service_times = scale(instance["durations"], scaling_factor) + sections["SERVICE_TIME_SECTION"] = service_times + + distances = instance["cost_matrix"] + backhaul_class = instance["backhaul_class"] + + if backhaul_class == 1: + # VRPB has a backhaul section that specifies the backhaul nodes. + backhaul_idcs = np.flatnonzero(instance["demand_backhaul"]).tolist() + sections["BACKHAUL_SECTION"] = backhaul_idcs + [-1] + + # linehaul = np.flatnonzero(demand_linehaul > 0) + # backhaul = np.flatnonzero(demand_backhaul > 0) + # distances[np.ix_(backhaul, linehaul)] = time_windows.max() + + elif backhaul_class == 2: + # VRPMPD has a pickup and delivery section that specifies the pickup + # and delivery quantities for each node, as well as the time windows. + # The regular time window section is redundant in this case. + data = [ + [ + 0, # dummy + time_windows[idx][0], + time_windows[idx][1], + service_times[idx], + demand_backhaul[idx], + demand_linehaul[idx], + ] + for idx in range(num_locations) + ] + sections["PICKUP_AND_DELIVERY_SECTION"] = data + + if instance["open_route"]: + # Arcs to the depot are set to zero as vehicles don’t need to return. + distances[:, 0] = 0 + + sections["EDGE_WEIGHT_SECTION"] = scale(distances, scaling_factor) + + # Convert to VRPLIB-like string. 
def routes2action(routes: list[list[int]]) -> list[int]:
    """
    Converts LKH routes to an action.

    Each route is shifted from LKH's 1-based location numbering to 0-based
    indices and terminated with a depot visit (``0``); the routes are then
    concatenated in order.
    """
    action = []
    for route in routes:
        # LKH locations are 1-indexed, so subtract 1 from every visit.
        action.extend(location - 1 for location in route)
        action.append(0)  # each route ends back at the depot
    return action
def instance2data(instance: TensorDict) -> ORToolsData:
    """
    Converts an AnyVRP instance to an ORToolsData instance.

    The instance is first converted with PyVRP's ``instance2data`` using
    ``ORTOOLS_SCALING_FACTOR``; the fields OR-Tools needs are then read back
    from that object. Time windows and backhauls are set to ``None`` when
    they only hold default values, which makes ``_solve`` skip the matching
    constraints.
    """
    # TODO: Do not use PyVRP's data converter.
    data = pyvrp.instance2data(instance, ORTOOLS_SCALING_FACTOR)

    # One capacity entry per available vehicle (vehicle types are expanded).
    capacities = [
        veh_type.capacity
        for veh_type in data.vehicle_types()
        for _ in range(veh_type.num_available)
    ]
    max_distance = data.vehicle_type(0).max_distance

    # Prepend a zero so that list position 0 stands for the depot.
    demands = [0] + [client.delivery for client in data.clients()]
    backhauls = [0] + [client.pickup for client in data.clients()]
    service = [0] + [client.service_duration for client in data.clients()]

    tws = [[data.location(0).tw_early, data.location(0).tw_late]]
    tws += [[client.tw_early, client.tw_late] for client in data.clients()]

    # Set data to None if instance does not contain explicit values.
    default_tw = [0, np.iinfo(np.int64).max]
    if all(tw == default_tw for tw in tws):
        tws = None  # type: ignore

    if all(val == 0 for val in backhauls):
        backhauls = None  # type: ignore

    distances = data.distance_matrix().copy()
    # Row i gets service[i] added: duration = travel + service at the origin.
    # This is computed before the backhaul override below, so that override
    # affects distances only.
    durations = np.array(distances) + np.array(service)[:, np.newaxis]

    if backhauls is not None:
        # Serve linehauls before backhauls.
        # Arcs backhaul -> linehaul are priced at the full distance limit.
        linehaul = np.flatnonzero(np.array(demands) > 0)
        backhaul = np.flatnonzero(np.array(backhauls) > 0)
        distances[np.ix_(backhaul, linehaul)] = max_distance

    return ORToolsData(
        depot=0,
        distance_matrix=distances.tolist(),
        duration_matrix=durations.tolist(),
        num_vehicles=data.num_vehicles,
        vehicle_capacities=capacities,
        demands=demands,
        time_windows=tws,
        max_distance=max_distance,
        backhauls=backhauls,
    )
+ if data.backhauls is not None: + routing.AddDimensionWithVehicleCapacity( + routing.RegisterUnaryTransitVector(data.backhauls), + 0, # null capacity slack + data.vehicle_capacities, # vehicle maximum capacities + True, # start cumul to zero + "Backhaul", + ) + + # Time window constraints. + if data.time_windows is not None: + depot_tw_early = data.time_windows[data.depot][0] + depot_tw_late = data.time_windows[data.depot][1] + + # The depot's late time window is a valid upper bound for the waiting + # time and maximum duration per vehicle. + routing.AddDimension( + routing.RegisterTransitMatrix(data.duration_matrix), + depot_tw_late, # waiting time upper bound + depot_tw_late, # maximum duration per vehicle + False, # don't force start cumul to zero + "Time", + ) + time_dim = routing.GetDimensionOrDie("Time") + + for node, (tw_early, tw_late) in enumerate(data.time_windows): + if node == data.depot: # skip depot + continue + + index = manager.NodeToIndex(node) + time_dim.CumulVar(index).SetRange(tw_early, tw_late) + + # Add time window constraints for each vehicle start node. + for node in range(data.num_vehicles): + start = routing.Start(node) + time_dim.CumulVar(start).SetRange(depot_tw_early, depot_tw_late) + + for node in range(data.num_vehicles): + cumul_start = time_dim.CumulVar(routing.Start(node)) + routing.AddVariableMinimizedByFinalizer(cumul_start) + + cumul_end = time_dim.CumulVar(routing.End(node)) + routing.AddVariableMinimizedByFinalizer(cumul_end) + + # Setup search parameters. 
def solution2action(data, manager, routing, solution) -> list[int]:
    """
    Converts an OR-Tools solution to a flat action (giant tour).

    Args:
        data: Instance data; only ``num_vehicles`` is read.
        manager: Index manager used to map solver indices to node indices.
        routing: Routing model providing ``Start``, ``IsEnd`` and ``NextVar``.
        solution: The assignment returned by the solver.

    Returns:
        The visited nodes of every non-empty route, each route followed by a
        depot visit (``0``), concatenated in vehicle order.

    Raises:
        ValueError: If ``solution`` is ``None`` (the solver found no solution).
    """
    if solution is None:
        raise ValueError("OR-Tools did not return a solution for this instance.")

    action = []
    for vehicle_idx in range(data.num_vehicles):
        index = routing.Start(vehicle_idx)
        route = []

        # Follow the successor chain from the vehicle's start to its end.
        while not routing.IsEnd(index):
            route.append(manager.IndexToNode(index))
            index = solution.Value(routing.NextVar(index))

        # The first entry is the start depot; unused vehicles have no clients.
        if clients := route[1:]:
            action.extend(clients)
            action.append(0)

    return action
+ + Returns: + A tuple containing the action and the cost, respectively. + """ + data = instance2data(instance, PYVRP_SCALING_FACTOR) + stop = MaxRuntime(max_runtime) + result = _solve(data, stop) + + solution = result.best + action = solution2action(solution) + cost = -result.cost() / PYVRP_SCALING_FACTOR + + return action, cost + + +def instance2data(instance: TensorDict, scaling_factor: int) -> ProblemData: + """ + Converts an AnyVRP instance to a ProblemData instance. + + Args: + instance: The AnyVRP instance to convert. + scaling_factor: The scaling factor to use for the conversion. + + Returns: + The ProblemData instance. + """ + num_locs = instance["demand_backhaul"].size()[0] + + time_windows = scale(instance["time_windows"], scaling_factor) + pickup = scale(instance["demand_backhaul"], scaling_factor) + delivery = scale(instance["demand_linehaul"], scaling_factor) + service = scale(instance["service_time"], scaling_factor) + coords = scale(instance["locs"], scaling_factor) + capacity = scale(instance["vehicle_capacity"], scaling_factor) + max_distance = scale(instance["distance_limit"], scaling_factor) + + depot = Depot( + x=coords[0][0], + y=coords[0][1], + ) + + clients = [ + Client( + x=coords[idx][0], + y=coords[idx][1], + tw_early=time_windows[idx][0], + tw_late=time_windows[idx][1], + delivery=delivery[idx], + pickup=pickup[idx], + service_duration=service[idx], + ) + for idx in range(1, num_locs) + ] + + vehicle_type = VehicleType( + num_available=num_locs - 1, # one vehicle per client + capacity=capacity, + max_distance=max_distance, + tw_early=time_windows[0][0], + tw_late=time_windows[0][1], + ) + + matrix = scale(instance["cost_matrix"], scaling_factor) + + if instance["open_route"]: + # Vehicles do not need to return to the depot, so we set all arcs + # to the depot to zero. + matrix[:, 0] = 0 + + if instance["backhaul_class"] == 1: # VRP with backhauls + # In VRPB, linehauls must be served before backhauls. 
def solution2action(solution: pyvrp.Solution) -> list[int]:
    """
    Flattens a PyVRP solution into the action representation (a giant tour).

    The visits of each route are emitted in order, and every route is
    followed by a single ``0``.
    """
    giant_tour = []
    for route in solution.routes():
        giant_tour += route.visits() + [0]
    return giant_tour
+ solver: The solver to use. + + Returns: + A tuple containing the action and the cost, respectively. + """ + + instances = process_instance(instances) + + if solver == "pyvrp" and isinstance(pyvrp, NoSolver): + raise ImportError( + "PyVRP is not installed. Please install it using `pip install -e .[solvers]`." + ) + if solver == "lkh" and isinstance(lkh, NoSolver): + raise ImportError( + "LKH is not installed. Please install it using `pip install -e .[solvers]`" + ) + if solver == "ortools" and isinstance(ortools, NoSolver): + raise ImportError( + "OR-Tools is not installed. Please install it using `pip install -e .[solvers]`." + ) + + solvers = {"pyvrp": pyvrp.solve, "ortools": ortools.solve, "lkh": lkh.solve} + if solver not in solvers: + raise ValueError(f"Unknown baseline solver: {solver}") + + _solve = solvers[solver] + func = partial(_solve, max_runtime=max_runtime, **kwargs) + + if num_procs > 1: + with Pool(processes=num_procs) as pool: + results = pool.map(func, instances) + else: + results = [func(instance) for instance in instances] + + actions, costs = zip(*results) + + # Pad to ensure all actions have the same length. 
def scale(data: Tensor, scaling_factor: int):
    """
    Scales and rounds data to integers so PyVRP can handle it.

    Args:
        data: Tensor to convert. It is detached and moved to the CPU first, so
            tensors that track gradients or live on another device also work.
        scaling_factor: Multiplier applied before rounding.

    Returns:
        A Python scalar when the result has exactly one element, otherwise an
        integer NumPy array. ``+inf`` becomes the int32 maximum and ``-inf``
        the int32 minimum.
    """
    array = (data * scaling_factor).detach().cpu().numpy().round()

    if np.issubdtype(array.dtype, np.floating):
        # Substitute the sentinels in float64: float32 cannot represent
        # 2**31 - 1 exactly, so the replacement could exceed the int32 range.
        array = array.astype(np.float64)
        int32 = np.iinfo(np.int32)
        array = np.where(array == np.inf, int32.max, array)
        array = np.where(array == -np.inf, int32.min, array)

    array = array.astype(int)

    if array.size == 1:
        return array.item()

    return array
Customers are either linehaul or backhaul customers. + - Linehaul customers require delivery of a demand $q_i > 0$ that needs to be transported from the depot to the customer, whereas backhaul customers need a pickup of an amount $p_i > 0$ that is transported from the client back to the depot. + - It is possible for vehicles to serve a combination of linehaul and backhaul customers in a single route, but then any linehaul customers must precede the backhaul customers in the route. + - *Duration Limits (L)* + - Imposes a limit on the total travel duration (or length) of each route, ensuring a balanced workload across vehicles. + + The environment covers the following 16 variants depending on the data generation: + + | VRP Variant | Capacity (C) | Open Route (O) | Backhaul (B) | Duration Limit (L) | Time Window (TW) | + | :---------- | :----------: | :------------: | :----------: | :----------------: | :--------------: | + | CVRP | ✔ | | | | | + | OVRP | ✔ | ✔ | | | | + | VRPB | ✔ | | ✔ | | | + | VRPL | ✔ | | | ✔ | | + | VRPTW | ✔ | | | | ✔ | + | OVRPTW | ✔ | ✔ | | | ✔ | + | OVRPB | ✔ | ✔ | ✔ | | | + | OVRPL | ✔ | ✔ | | ✔ | | + | VRPBL | ✔ | | ✔ | ✔ | | + | VRPBTW | ✔ | | ✔ | | ✔ | + | VRPLTW | ✔ | | | ✔ | ✔ | + | OVRPBL | ✔ | ✔ | ✔ | ✔ | | + | OVRPBTW | ✔ | ✔ | ✔ | | ✔ | + | OVRPLTW | ✔ | ✔ | | ✔ | ✔ | + | VRPBLTW | ✔ | | ✔ | ✔ | ✔ | + | OVRPBLTW | ✔ | ✔ | ✔ | ✔ | ✔ | + + You may also check out the following papers as reference: + - ["Multi-Task Learning for Routing Problem with Cross-Problem Zero-Shot Generalization" (Liu et al, 2024)](https://arxiv.org/abs/2402.16891) + - ["MVMoE: Multi-Task Vehicle Routing Solver with Mixture-of-Experts" (Zhou et al, 2024)](https://arxiv.org/abs/2405.01029) + - ["RouteFinder: Towards Foundation Models for Vehicle Routing Problems" (Berto et al, 2024)](https://arxiv.org/abs/2406.15007) + + Tip: + Have a look at https://pyvrp.org/ for more information about VRP and its variants and their solutions. 
Kudos to their help and great job! + + Args: + generator: Generator for the environment, see :class:`MTVRPGenerator`. + generator_params: Parameters for the generator. + """ + + name = "mtvrp" + + def __init__( + self, + generator: MTVRPGenerator = None, + generator_params: dict = {}, + check_solution: bool = False, + **kwargs, + ): + if check_solution: + log.warning( + "Solution checking is enabled. This may slow down the environment." + " We recommend disabling this for training by passing `check_solution=False`." + ) + + super().__init__(check_solution=check_solution, **kwargs) + + if generator is None: + generator = MTVRPGenerator(**generator_params) + self.generator = generator + self._make_spec(self.generator) + + def _step(self, td: TensorDict) -> TensorDict: + # Get locations and distance + prev_node, curr_node = td["current_node"], td["action"] + prev_loc = gather_by_index(td["locs"], prev_node) + curr_loc = gather_by_index(td["locs"], curr_node) + distance = get_distance(prev_loc, curr_loc)[..., None] + + # Update current time + service_time = gather_by_index( + src=td["service_time"], idx=curr_node, dim=1, squeeze=False + ) + start_times = gather_by_index( + src=td["time_windows"], idx=curr_node, dim=1, squeeze=False + )[..., 0] + # we cannot start before we arrive and we should start at least at start times + curr_time = (curr_node[:, None] != 0) * ( + torch.max(td["current_time"] + distance / td["speed"], start_times) + + service_time + ) + + # Update current route length (reset at depot) + curr_route_length = (curr_node[:, None] != 0) * ( + td["current_route_length"] + distance + ) + + # Linehaul (delivery) demands + selected_demand_linehaul = gather_by_index( + td["demand_linehaul"], curr_node, dim=1, squeeze=False + ) + selected_demand_backhaul = gather_by_index( + td["demand_backhaul"], curr_node, dim=1, squeeze=False + ) + + # Backhaul (pickup) demands + # vehicles are empty once we get to the backhauls + used_capacity_linehaul = (curr_node[:, 
None] != 0) * ( + td["used_capacity_linehaul"] + selected_demand_linehaul + ) + used_capacity_backhaul = (curr_node[:, None] != 0) * ( + td["used_capacity_backhaul"] + selected_demand_backhaul + ) + + # Done when all customers are visited + visited = td["visited"].scatter(-1, curr_node[..., None], True) + done = visited.sum(-1) == visited.size(-1) + reward = torch.zeros_like( + done + ).float() # we use the `get_reward` method to compute the reward + + td.update( + { + "current_node": curr_node, + "current_route_length": curr_route_length, + "current_time": curr_time, + "done": done, + "reward": reward, + "used_capacity_linehaul": used_capacity_linehaul, + "used_capacity_backhaul": used_capacity_backhaul, + "visited": visited, + } + ) + td.set("action_mask", self.get_action_mask(td)) + return td + + def _reset( + self, + td: Optional[TensorDict] = None, + batch_size: Optional[list] = None, + ) -> TensorDict: + device = td.device + + # Create reset TensorDict + td_reset = TensorDict( + { + "locs": td["locs"], + "demand_backhaul": td["demand_backhaul"], + "demand_linehaul": td["demand_linehaul"], + "distance_limit": td["distance_limit"], + "service_time": td["service_time"], + "open_route": td["open_route"], + "time_windows": td["time_windows"], + "vehicle_capacity": td["vehicle_capacity"], + "capacity_original": td["capacity_original"], + "speed": td["speed"], + "current_node": torch.zeros( + (*batch_size,), dtype=torch.long, device=device + ), + "current_route_length": torch.zeros( + (*batch_size, 1), dtype=torch.float32, device=device + ), # for distance limits + "current_time": torch.zeros( + (*batch_size, 1), dtype=torch.float32, device=device + ), # for time windows + "used_capacity_backhaul": torch.zeros( + (*batch_size, 1), device=device + ), # for capacity constraints in backhaul + "used_capacity_linehaul": torch.zeros( + (*batch_size, 1), device=device + ), # for capacity constraints in linehaul + "visited": torch.zeros( + (*batch_size, 
td["locs"].shape[-2]), + dtype=torch.bool, + device=device, + ), + }, + batch_size=batch_size, + device=device, + ) + td_reset.set("action_mask", self.get_action_mask(td_reset)) + return td_reset + + @staticmethod + def get_action_mask(td: TensorDict) -> torch.Tensor: + curr_node = td["current_node"] # note that this was just updated! + locs = td["locs"] + d_ij = get_distance( + gather_by_index(locs, curr_node)[..., None, :], locs + ) # i (current) -> j (next) + d_j0 = get_distance(locs, locs[..., 0:1, :]) # j (next) -> 0 (depot) + + # Time constraint (TW): + early_tw, late_tw = ( + td["time_windows"][..., 0], + td["time_windows"][..., 1], + ) + arrival_time = td["current_time"] + (d_ij / td["speed"]) + # can reach in time -> only need to *start* in time + can_reach_customer = arrival_time < late_tw + # we must ensure that we can return to depot in time *if* route is closed + # i.e. start time + service time + time back to depot < late_tw + can_reach_depot = ( + torch.max(arrival_time, early_tw) + td["service_time"] + (d_j0 / td["speed"]) + ) * ~td["open_route"] < late_tw[..., 0:1] + + # Distance limit (L): do not add distance to depot if open route (O) + exceeds_dist_limit = ( + td["current_route_length"] + d_ij + (d_j0 * ~td["open_route"]) + > td["distance_limit"] + ) + + # Linehaul demand / delivery (C) and backhaul demand / pickup (B) + # All linehauls are visited before backhauls + linehauls_missing = ((td["demand_linehaul"] * ~td["visited"]).sum(-1) > 0)[ + ..., None + ] + is_carrying_backhaul = ( + gather_by_index( + src=td["demand_backhaul"], + idx=curr_node, + dim=1, + squeeze=False, + ) + > 0 + ) + exceeds_cap_linehaul = ( + td["demand_linehaul"] + td["used_capacity_linehaul"] > td["vehicle_capacity"] + ) + exceeds_cap_backhaul = ( + td["demand_backhaul"] + td["used_capacity_backhaul"] > td["vehicle_capacity"] + ) + + meets_demand_constraint = ( + linehauls_missing + & ~exceeds_cap_linehaul + & ~is_carrying_backhaul + & (td["demand_linehaul"] > 0) + ) | 
(~exceeds_cap_backhaul & (td["demand_backhaul"] > 0)) + + # Condense constraints + can_visit = ( + can_reach_customer + & can_reach_depot + & meets_demand_constraint + & ~exceeds_dist_limit + & ~td["visited"] + ) + + # Mask depot: don't visit depot if coming from there and there are still customer nodes I can visit + can_visit[:, 0] = ~((curr_node == 0) & (can_visit[:, 1:].sum(-1) > 0)) + return can_visit + + def _get_reward(self, td: TensorDict, actions: TensorDict) -> TensorDict: + # Append depot to actions and get sequence of locations + go_from = torch.cat((torch.zeros_like(actions[:, :1]), actions), dim=1) + go_to = torch.roll(go_from, -1, dims=1) # [b, seq_len] + loc_from = gather_by_index(td["locs"], go_from) + loc_to = gather_by_index(td["locs"], go_to) + + # Get tour length. If route is open and goes to depot, don't count the distance + distances = get_distance(loc_from, loc_to) # [b, seq_len] + tour_length = (distances * ~((go_to == 0) & td["open_route"])).sum(-1) # [b] + return -tour_length # reward is negative cost + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor): + batch_size, n_loc = td["demand_linehaul"].size() + locs = td["locs"] + n_loc -= 1 # exclude depot + sorted_pi = actions.data.sort(1)[0] + + # all customer nodes visited exactly once + assert ( + torch.arange(1, n_loc + 1, out=sorted_pi.data.new()) + .view(1, -1) + .expand(batch_size, n_loc) + == sorted_pi[:, -n_loc:] + ).all() and (sorted_pi[:, :-n_loc] == 0).all(), "Invalid tour" + + # Distance limits (L) + assert (td["distance_limit"] >= 0).all(), "Distance limits must be non-negative." + + # Time windows (TW) + d_j0 = get_distance(locs, locs[..., 0:1, :]) # j (next) -> 0 (depot) + assert torch.all(td["time_windows"] >= 0.0), "Time windows must be non-negative." + assert torch.all(td["service_time"] >= 0.0), "Service time must be non-negative." 
+ assert torch.all( + td["time_windows"][..., 0] < td["time_windows"][..., 1] + ), "there are unfeasible time windows" + assert torch.all( + td["time_windows"][..., :, 0] + d_j0 + td["service_time"] + <= td["time_windows"][..., 0, 1, None] + ), "vehicle cannot perform service and get back to depot in time." + # check individual time windows + curr_time = torch.zeros(batch_size, dtype=torch.float32, device=td.device) + curr_node = torch.zeros(batch_size, dtype=torch.int64, device=td.device) + curr_length = torch.zeros(batch_size, dtype=torch.float32, device=td.device) + for ii in range(actions.size(1)): + next_node = actions[:, ii] + curr_loc = gather_by_index(td["locs"], curr_node) + next_loc = gather_by_index(td["locs"], next_node) + dist = get_distance(curr_loc, next_loc) + + # distance limit (L) + curr_length = curr_length + dist * ~( + td["open_route"].squeeze(-1) & (next_node == 0) + ) # do not count back to depot for open route + assert torch.all( + curr_length <= td["distance_limit"].squeeze(-1) + ), "Route exceeds distance limit" + curr_length[next_node == 0] = 0.0 # reset length for depot + + curr_time = torch.max( + curr_time + dist, gather_by_index(td["time_windows"], next_node)[..., 0] + ) + assert torch.all( + curr_time <= gather_by_index(td["time_windows"], next_node)[..., 1] + ), "vehicle cannot start service before deadline" + curr_time = curr_time + gather_by_index(td["service_time"], next_node) + curr_node = next_node + curr_time[curr_node == 0] = 0.0 # reset time for depot + + # Demand constraints (C) and (B) + # linehauls are the same as backhauls but with a different feature + def _check_c1(feature="demand_linehaul"): + demand = td[feature].gather(dim=1, index=actions) + used_cap = torch.zeros_like(td[feature][:, 0]) + for ii in range(actions.size(1)): + # reset at depot + used_cap = used_cap * (actions[:, ii] != 0) + used_cap += demand[:, ii] + assert ( + used_cap <= td["vehicle_capacity"] + ).all(), "Used more than capacity for {}: 
{}".format(feature, used_cap) + + _check_c1("demand_linehaul") + _check_c1("demand_backhaul") + + def load_data(self, fpath, batch_size=[], scale=False): + """Dataset loading from file + Normalize demand by capacity to be in [0, 1] + """ + td_load = load_npz_to_tensordict(fpath) + if scale: + td_load.set( + "demand_linehaul", + td_load["demand_linehaul"] / td_load["capacity_original"], + ) + td_load.set( + "demand_backhaul", + td_load["demand_backhaul"] / td_load["capacity_original"], + ) + return td_load + + @staticmethod + def render(*args, **kwargs): + """Simple wrapper for render function""" + from .render import render + + return render(*args, **kwargs) + + def select_start_nodes(self, td, num_starts): + """Select available start nodes for the environment (e.g. for POMO-based training)""" + num_loc = td["locs"].shape[-2] - 1 + selected = ( + torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0]) + % num_loc + + 1 + ) + return selected + + @staticmethod + def solve( + instances: TensorDict, + max_runtime: float, + num_procs: int = 1, + solver: str = "pyvrp", + **kwargs, + ) -> tuple[torch.Tensor, torch.Tensor]: + """Classical solver for the environment. This is a wrapper for the baselines solver. + Available solvers are: `pyvrp`, `ortools`, `lkh`. Returns the actions and costs. 
+ """ + from .baselines.solve import solve + + return solve(instances, max_runtime, num_procs, solver, **kwargs) + + def _make_spec(self, td_params: TensorDict): + # TODO: include extra vars (but we don't really need them for now) + """Make the observation and action specs from the parameters.""" + self.observation_spec = Composite( + locs=Bounded( + low=self.generator.min_loc, + high=self.generator.max_loc, + shape=(self.generator.num_loc + 1, 2), + dtype=torch.float32, + device=self.device, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + device=self.device, + ), + demand_linehaul=Bounded( + low=-self.generator.capacity, + high=self.generator.max_demand, + shape=(self.generator.num_loc, 1), # demand is only for customers + dtype=torch.float32, + device=self.device, + ), + demand_backhaul=Bounded( + low=-self.generator.capacity, + high=self.generator.max_demand, + shape=(self.generator.num_loc, 1), # demand is only for customers + dtype=torch.float32, + device=self.device, + ), + action_mask=Unbounded( + shape=(self.generator.num_loc + 1, 1), + dtype=torch.bool, + device=self.device, + ), + shape=(), + ) + self.action_spec = Bounded( + low=0, + high=self.generator.num_loc + 1, + shape=(1,), + dtype=torch.int64, + device=self.device, + ) + self.reward_spec = Unbounded(shape=(1,), dtype=torch.float32, device=self.device) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool, device=self.device) + + @staticmethod + def check_variants(td): + """Check if the problem has the variants""" + has_open = td["open_route"].squeeze(-1) + has_tw = (td["time_windows"][:, :, 1] != float("inf")).any(-1) + has_limit = (td["distance_limit"] != float("inf")).squeeze(-1) + has_backhaul = (td["demand_backhaul"] != 0).any(-1) + return has_open, has_tw, has_limit, has_backhaul + + @staticmethod + def get_variant_names(td): + ( + has_open, + has_time_window, + has_duration_limit, + has_backhaul, + ) = MTVRPEnv.check_variants(td) + instance_names = [] + for o, b, l_, 
tw in zip( + has_open, has_backhaul, has_duration_limit, has_time_window + ): + if not o and not b and not l_ and not tw: + instance_name = "CVRP" + else: + instance_name = "VRP" + if o: + instance_name = "O" + instance_name + if b: + instance_name += "B" + if l_: + instance_name += "L" + if tw: + instance_name += "TW" + instance_names.append(instance_name) + return instance_names + + def print_presets(self): + self.generator.print_presets() diff --git a/rl4co/envs/routing/mtvrp/generator.py b/rl4co/envs/routing/mtvrp/generator.py new file mode 100644 index 00000000..4c06796b --- /dev/null +++ b/rl4co/envs/routing/mtvrp/generator.py @@ -0,0 +1,436 @@ +from typing import Callable, Tuple, Union + +import torch + +from tensordict.tensordict import TensorDict +from torch.distributions import Uniform + +from rl4co.data.utils import save_tensordict_to_npz +from rl4co.envs.common.utils import Generator, get_sampler +from rl4co.utils.ops import get_distance +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def get_vehicle_capacity(num_loc: int) -> int: + """Capacity should be 30 + num_loc/5 if num_loc > 20 as described in Liu et al. 2024 (POMO-MTL). + For every N over 1000, we add 1 of capacity every 33.3 nodes to align with Ye et al. 2024 (GLOP), + i.e. 260 at 2K nodes, 350 at 5K nodes and 500 at 10K nodes. + Note that this serves as a demand scaler. + """ + if num_loc > 1000: + extra_cap = 1000 // 5 + (num_loc - 1000) // 33.3 + elif num_loc > 20: + extra_cap = num_loc // 5 + else: + extra_cap = 0 + return 30 + extra_cap + + +VARIANT_GENERATION_PRESETS = { + "all": {"O": 0.5, "TW": 0.5, "L": 0.5, "B": 0.5}, + "single_feat": {"O": 0.5, "TW": 0.5, "L": 0.5, "B": 0.5}, + "single_feat_otw": {"O": 0.5, "TW": 0.5, "L": 0.5, "B": 0.5, "OTW": 0.5}, # same training as Zhou et al. 
2024 + "cvrp": {"O": 0.0, "TW": 0.0, "L": 0.0, "B": 0.0}, + "ovrp": {"O": 1.0, "TW": 0.0, "L": 0.0, "B": 0.0}, + "vrpb": {"O": 0.0, "TW": 0.0, "L": 0.0, "B": 1.0}, + "vrpl": {"O": 0.0, "TW": 0.0, "L": 1.0, "B": 0.0}, + "vrptw": {"O": 0.0, "TW": 1.0, "L": 0.0, "B": 0.0}, + "ovrptw": {"O": 1.0, "TW": 1.0, "L": 0.0, "B": 0.0}, + "ovrpb": {"O": 1.0, "TW": 0.0, "L": 0.0, "B": 1.0}, + "ovrpl": {"O": 1.0, "TW": 0.0, "L": 1.0, "B": 0.0}, + "vrpbl": {"O": 0.0, "TW": 0.0, "L": 1.0, "B": 1.0}, + "vrpbtw": {"O": 0.0, "TW": 1.0, "L": 0.0, "B": 1.0}, + "vrpltw": {"O": 0.0, "TW": 1.0, "L": 1.0, "B": 0.0}, + "ovrpbl": {"O": 1.0, "TW": 0.0, "L": 1.0, "B": 1.0}, + "ovrpbtw": {"O": 1.0, "TW": 1.0, "L": 0.0, "B": 1.0}, + "ovrpltw": {"O": 1.0, "TW": 1.0, "L": 1.0, "B": 0.0}, + "vrpbltw": {"O": 0.0, "TW": 1.0, "L": 1.0, "B": 1.0}, + "ovrpbltw": {"O": 1.0, "TW": 1.0, "L": 1.0, "B": 1.0}, +} + + +class MTVRPGenerator(Generator): + """MTVRP Generator. + Class to generate instances of the MTVRP problem. + If a variant is declared and Subsample is True, the generator will sample the problem based on the variant probabilities. + By default, we use Mixed-Batch Training as in Berto et al. 2024 (RouteFinder), i.e. one batch can contain multiple variants. + + Example presets: + - "all": Sample uniformly from 16 variants + - "single_feat": Sample uniformly between CVRP, OVRP, VRPB, VRPL, VRPTW (as done in Liu et al. 2024 (MTPOMO)) + - "single_feat_otw": Sample uniformly between CVRP, OVRP, VRPB, VRPL, VRPTW, OVRPTW (as done in Zhou et al. 2024 (MVMoE)) + - "cvrp": Only CVRP (similarly for other variants) + + Args: + num_loc: Number of locations to generate + min_loc: Minimum location value + max_loc: Maximum location value + loc_distribution: Distribution to sample locations from + capacity: Vehicle capacity. 
If None, get value based on `get_vehicle_capacity` + min_demand: Minimum demand value + max_demand: Maximum demand value + min_backhaul: Minimum backhaul value + max_backhaul: Maximum backhaul value + scale_demand: Scale demand values (by default, generate between 1 and 10) + max_time: Maximum time window value (at depot) + backhaul_ratio: Fraction of backhauls (e.g. 0.2 means 20% of nodes are backhaul) + distance_limit: Distance limit + speed: Speed of vehicle. Defaults to 1 + subsample: If False, we always sample all attributes (i.e., OVRPBLTW) + If true, we use the + **kwargs: Additional keyword arguments + """ + + def __init__( + self, + num_loc: int = 20, + min_loc: float = 0.0, + max_loc: float = 1.0, + loc_distribution: Union[int, float, str, type, Callable] = Uniform, + capacity: float = None, + min_demand: int = 1, + max_demand: int = 10, + min_backhaul: int = 1, + max_backhaul: int = 10, + scale_demand: bool = True, + max_time: float = 4.6, + backhaul_ratio: float = 0.2, + distance_limit: float = 3.0, + speed: float = 1.0, + prob_open: float = 0.5, + prob_time_window: float = 0.5, + prob_limit: float = 0.5, + prob_backhaul: float = 0.5, + variant_preset=None, + use_combinations=True, + subsample=True, + **kwargs, + ) -> None: + # Location distribution + self.num_loc = num_loc + self.min_loc = min_loc + self.max_loc = max_loc + if kwargs.get("loc_sampler", None) is not None: + self.loc_sampler = kwargs["loc_sampler"] + else: + self.loc_sampler = get_sampler( + "loc", loc_distribution, min_loc, max_loc, **kwargs + ) + + if capacity is None: + capacity = get_vehicle_capacity(num_loc) + self.capacity = capacity + self.min_demand = min_demand + self.max_demand = max_demand + self.min_backhaul = min_backhaul + self.max_backhaul = max_backhaul + self.scale_demand = scale_demand + self.backhaul_ratio = backhaul_ratio + + self.max_time = max_time + self.distance_limit = distance_limit + self.speed = speed + + assert not (subsample and (variant_preset is None)), ( 
+ "Cannot use subsample if variant_preset is not specified. " + ) + if variant_preset is not None: + log.info(f"Using variant generation preset {variant_preset}") + variant_probs = VARIANT_GENERATION_PRESETS.get(variant_preset) + assert ( + variant_probs is not None + ), f"Variant generation preset {variant_preset} not found. \ + Available presets are {VARIANT_GENERATION_PRESETS.keys()} with probabilities {VARIANT_GENERATION_PRESETS.values()}" + else: + variant_probs = { + "O": prob_open, + "TW": prob_time_window, + "L": prob_limit, + "B": prob_backhaul, + } + # check probabilities + for key, prob in variant_probs.items(): + assert 0 <= prob <= 1, f"Probability {key} must be between 0 and 1" + self.variant_probs = variant_probs + self.variant_preset = variant_preset + if isinstance(variant_preset, str) and variant_preset != "all": + log.warning(f"{variant_preset} selected. Will not use feature combination!") + use_combinations = False + self.use_combinations = use_combinations + self.subsample = subsample + + def _generate(self, batch_size) -> TensorDict: + # Locations + locs = self.generate_locations(batch_size=batch_size, num_loc=self.num_loc) + + # Vehicle capacity (C, B) - applies to both linehaul and backhaul + vehicle_capacity = torch.full( + (*batch_size, 1), self.capacity, dtype=torch.float32 + ) + capacity_original = vehicle_capacity.clone() + + # linehaul demand / delivery (C) and backhaul / pickup demand (B) + demand_linehaul, demand_backhaul = self.generate_demands( + batch_size=batch_size, num_loc=self.num_loc + ) + # add empty depot demands + demand_linehaul = torch.cat( + [torch.zeros(size=(*batch_size, 1)), demand_linehaul], dim=1 + ) + demand_backhaul = torch.cat( + [torch.zeros(size=(*batch_size, 1)), demand_backhaul], dim=1 + ) + + # Open (O) + open_route = self.generate_open_route(shape=(*batch_size, 1)) + + # Time windows (TW) + speed = self.generate_speed(shape=(*batch_size, 1)) + time_windows, service_time = self.generate_time_windows( + 
locs=locs, + speed=speed, + ) + + # Distance limit (L) + distance_limit = self.generate_distance_limit(shape=(*batch_size, 1), locs=locs) + + # scaling + if self.scale_demand: + demand_backhaul /= vehicle_capacity + demand_linehaul /= vehicle_capacity + vehicle_capacity /= vehicle_capacity + + # Put all variables together + td = TensorDict( + { + "locs": locs, + "demand_backhaul": demand_backhaul, # (C) + "demand_linehaul": demand_linehaul, # (B) + "distance_limit": distance_limit, # (L) + "time_windows": time_windows, # (TW) + "service_time": service_time, # (TW) + "vehicle_capacity": vehicle_capacity, # (C) + "capacity_original": capacity_original, # unscaled capacity (C) + "open_route": open_route, # (O) + "speed": speed, # common + }, + batch_size=batch_size, + ) + + if self.subsample: + # Subsample problems based on given instructions + return self.subsample_problems(td) + else: + # Not subsampling problems, i.e. return tensordict with all attributes + return td + + + + def subsample_problems(self, td): + """Create subproblems starting from seed probabilities depending on their variant. + If random seed sampled in [0, 1] in batch is greater than prob, remove the constraint + thus, if prob high, it is less likely to remove the constraint (i.e. prob=0.9, 90% chance to keep constraint) + """ + batch_size = td.batch_size[0] + + variant_probs = torch.tensor(list(self.variant_probs.values())) + + if self.use_combinations: + # in a batch, multiple variants combinations can be picked + keep_mask = torch.rand(batch_size, 4) >= variant_probs # O, TW, L, B + else: + # in a batch, only a variant can be picked. 
+ # we assign a 0.5 prob to the last variant (which is normal cvrp) + if self.variant_preset in list( + VARIANT_GENERATION_PRESETS.keys() + ) and self.variant_preset not in ( + "all", + "cvrp", + "single_feat", + "single_feat_otw", + ): + cvrp_prob = 0 + else: + cvrp_prob = 0.5 + if self.variant_preset in ("all", "cvrp", "single_feat", "single_feat_otw"): + indices = torch.distributions.Categorical( + torch.Tensor(list(self.variant_probs.values()) + [cvrp_prob])[ + None + ].repeat(batch_size, 1) + ).sample() + if self.variant_preset == "single_feat_otw": + keep_mask = torch.zeros((batch_size, 6), dtype=torch.bool) + keep_mask[torch.arange(batch_size), indices] = True + + # If keep_mask[:, 4] is True, make both keep_mask[:, 0] and keep_mask[:, 1] True + keep_mask[:, :2] |= keep_mask[:, 4:5] + else: + keep_mask = torch.zeros((batch_size, 5), dtype=torch.bool) + keep_mask[torch.arange(batch_size), indices] = True + else: + # if the variant is specified, we keep the attributes with probability > 0 + keep_mask = torch.zeros((batch_size, 4), dtype=torch.bool) + indices = torch.nonzero(variant_probs).squeeze() + keep_mask[:, indices] = True + + td = self._default_open(td, ~keep_mask[:, 0]) + td = self._default_time_window(td, ~keep_mask[:, 1]) + td = self._default_distance_limit(td, ~keep_mask[:, 2]) + td = self._default_backhaul(td, ~keep_mask[:, 3]) + + return td + + @staticmethod + def _default_open(td, remove): + td["open_route"][remove] = False + return td + + @staticmethod + def _default_time_window(td, remove): + default_tw = torch.zeros_like(td["time_windows"]) + default_tw[..., 1] = float("inf") + td["time_windows"][remove] = default_tw[remove] + td["service_time"][remove] = torch.zeros_like(td["service_time"][remove]) + return td + + @staticmethod + def _default_distance_limit(td, remove): + td["distance_limit"][remove] = float("inf") + return td + + @staticmethod + def _default_backhaul(td, remove): + # by default, where there is a backhaul, linehaul is 0. 
therefore, we add backhaul to linehaul + # and set backhaul to 0 where we want to remove backhaul + td["demand_linehaul"][remove] = td["demand_linehaul"][remove] + td["demand_backhaul"][remove] + td["demand_backhaul"][remove] = 0 + return td + + def generate_locations(self, batch_size, num_loc) -> torch.Tensor: + """Generate seed locations. + + Returns: + locs: [B, N+1, 2] where the first location is the depot. + """ + locs = torch.FloatTensor(*batch_size, num_loc + 1, 2).uniform_( + self.min_loc, self.max_loc + ) + return locs + + def generate_demands(self, batch_size: int, num_loc: int) -> torch.Tensor: + """Classical lineahul demand / delivery from depot (C) and backhaul demand / pickup to depot (B) generation. + Initialize the demand for nodes except the depot, which are added during reset. + Demand sampling Following Kool et al. (2019), demands as integers between 1 and 10. + Generates a slightly different distribution than using torch.randint. + + Returns: + linehaul_demand: [B, N] + backhaul_demand: [B, N] + """ + linehaul_demand = ( + torch.FloatTensor(*batch_size, num_loc) + .uniform_(self.min_demand - 1, self.max_demand - 1) + .int() + + 1 + ).float() + # Backhaul demand sampling + backhaul_demand = ( + torch.FloatTensor(*batch_size, num_loc) + .uniform_(self.min_backhaul - 1, self.max_backhaul - 1) + .int() + + 1 + ).float() + is_linehaul = torch.rand(*batch_size, num_loc) > self.backhaul_ratio + backhaul_demand = ( + backhaul_demand * ~is_linehaul + ) # keep only values where they are not linehauls + linehaul_demand = ( + linehaul_demand * is_linehaul + ) + return linehaul_demand, backhaul_demand + + def generate_time_windows( + self, + locs: torch.Tensor, + speed: torch.Tensor, + ) -> torch.Tensor: + """Generate time windows (TW) and service times for each location including depot. + We refer to the generation process in "Multi-Task Learning for Routing Problem with Cross-Problem Zero-Shot Generalization" + (Liu et al., 2024). 
Note that another way to generate is from "Learning to Delegate for Large-scale Vehicle Routing" (Li et al, 2021) which + is used in "MVMoE: Multi-Task Vehicle Routing Solver with Mixture-of-Experts" (Zhou et al, 2024). Note that however, in that case + the distance limit would have no influence when time windows are present, since the tw for depot is the same as distance with speed=1. + This function can be overridden for that implementation. + See also https://github.com/RoyalSkye/Routing-MVMoE + + Args: + locs: [B, N+1, 2] (depot, locs) + speed: [B] + + Returns: + time_windows: [B, N+1, 2] + service_time: [B, N+1] + """ + + batch_size, n_loc = locs.shape[0], locs.shape[1] - 1 # no depot + + a, b, c = 0.15, 0.18, 0.2 + service_time = a + (b - a) * torch.rand(batch_size, n_loc) + tw_length = b + (c - b) * torch.rand(batch_size, n_loc) + d_0i = get_distance(locs[:, 0:1], locs[:, 1:]) + h_max = (self.max_time - service_time - tw_length) / d_0i * speed - 1 + tw_start = (1 + (h_max - 1) * torch.rand(batch_size, n_loc)) * d_0i / speed + tw_end = tw_start + tw_length + + # Depot tw is 0, max_time + time_windows = torch.stack( + ( + torch.cat((torch.zeros(batch_size, 1), tw_start), -1), # start + torch.cat((torch.full((batch_size, 1), self.max_time), tw_end), -1), + ), # en + dim=-1, + ) + # depot service time is 0 + service_time = torch.cat((torch.zeros(batch_size, 1), service_time), dim=-1) + return time_windows, service_time # [B, N+1, 2], [B, N+1] + + def generate_distance_limit( + self, shape: Tuple[int, int], locs: torch.Tensor + ) -> torch.Tensor: + """Generates distance limits (L) and checks their feasibilities. + + Returns: + distance_limit: [B, 1] + """ + # calculate distance of all locations to depot + dist_to_depot = torch.cdist(locs, locs[:, 0:1, :], p=2) + assert ( + dist_to_depot * 2 < self.distance_limit # go back and forth + ).all(), "Distance limit too low, not all nodes can be reached from the depot." 
+ return torch.full(shape, self.distance_limit, dtype=torch.float32) + + def generate_open_route(self, shape: Tuple[int, int]): + """Generate open route flags (O). Here we could have a sampler but we simply return True here so all + routes are open. Afterwards, we subsample the problems. + """ + return torch.ones(shape, dtype=torch.bool) + + def generate_speed(self, shape: Tuple[int, int]): + """We simply generate the speed as constant here""" + # in this version, the speed is constant but this class may be overridden + return torch.full(shape, self.speed, dtype=torch.float32) + + @staticmethod + def save_data(td: TensorDict, path, compress: bool = False): + save_tensordict_to_npz(td, path) + + @staticmethod + def print_presets(): + for key, value in VARIANT_GENERATION_PRESETS.items(): + print(f"{key}: {value}") + + @staticmethod + def available_variants(*args, **kwargs): + # remove 'all', 'single_feat' from the list + return list(VARIANT_GENERATION_PRESETS.keys())[3:] diff --git a/rl4co/envs/routing/mtvrp/render.py b/rl4co/envs/routing/mtvrp/render.py new file mode 100644 index 00000000..01a5aadd --- /dev/null +++ b/rl4co/envs/routing/mtvrp/render.py @@ -0,0 +1,145 @@ +import torch + +from tensordict.tensordict import TensorDict + +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render( + td: TensorDict, actions=None, ax=None, scale_xy: bool = True, vehicle_capacity=None +): + import matplotlib.pyplot as plt + import numpy as np + + from matplotlib import cm, colormaps + + num_routine = (actions == 0).sum().item() + 2 + base = colormaps["nipy_spectral"] + color_list = base(np.linspace(0, 1, num_routine)) + cmap_name = base.name + str(num_routine) + out = base.from_list(cmap_name, color_list, num_routine) + + if ax is None: + _, ax = plt.subplots(dpi=100, figsize=(6, 6)) + + td = td.detach().cpu() + + if actions is None: + actions = td.get("action", None) + + if td.batch_size != torch.Size([]): + td = td[0] + actions = 
actions[0] + + locs = td["locs"] + scale_demand = td["capacity_original"] + demands_linehaul = td["demand_linehaul"] * scale_demand + demands_backhaul = td["demand_backhaul"] * scale_demand + # scale to closest integer + demands_linehaul = demands_linehaul.round().int() + demands_backhaul = demands_backhaul.round().int() + + if actions is None: + log.warning("No action in TensorDict, rendering unsorted locs") + else: + actions = torch.cat([torch.tensor([0]), actions, torch.tensor([0])]) + + # Depot + ax.scatter( + locs[0, 0], + locs[0, 1], + edgecolors=cm.Set2(2), + facecolors="none", + s=100, + linewidths=2, + marker="s", + alpha=1, + ) + + for node_idx, loc in enumerate(locs): + if node_idx == 0: + continue + delivery, pickup = demands_linehaul[node_idx], demands_backhaul[node_idx] + if delivery > 0: + ax.text( + loc[0], + loc[1] + 0.02, + f"{delivery.item()}", + horizontalalignment="center", + verticalalignment="bottom", + fontsize=10, + color=cm.Set2(0), + ) + # scatter delivery as downward triangle + ax.scatter( + loc[0], + loc[1], + edgecolors=cm.Set2(0), + facecolors="none", + s=30, + linewidths=2, + marker="v", + alpha=1, + ) + elif pickup > 0: + ax.text( + loc[0], + loc[1] - 0.02, + f"{pickup.item()}", + horizontalalignment="center", + verticalalignment="top", + fontsize=10, + color=cm.Set2(1), + ) + ax.scatter( + loc[0], + loc[1], + edgecolors=cm.Set2(1), + facecolors="none", + s=30, + linewidths=2, + marker="^", + alpha=1, + ) + else: + print("Error: no demand") + + color_idx = 0 + next_actions = torch.roll(actions, -1, 0) + for ai, aj in zip(actions, next_actions): + if ai == 0: + color_idx += 1 + from_loc = locs[ai] + to_loc = locs[aj] + # if any of from_loc or to_loc is depot, change color and linewidth + if ai == 0 or aj == 0: + color, lw, alpha, style = "lightgrey", 1, 0.5, "--" + else: + color, lw, alpha, style = out(color_idx), 1, 1, "" + ax.plot( + [from_loc[0], to_loc[0]], + [from_loc[1], to_loc[1]], + color=color, + lw=lw, + alpha=alpha, + 
class OPEnv(RL4COEnvBase):
    """Orienteering Problem (OP) environment.

    At each step, the agent chooses a location to visit in order to maximize the
    collected prize. The total length of the path must not exceed a given threshold.

    Observations:
        - location of the depot
        - locations and prize of each customer
        - current location of the vehicle
        - current tour length
        - current total prize
        - the remaining length of the path

    Constraints:
        - the tour starts and ends at the depot
        - not all customers need to be visited
        - the vehicle cannot visit customers that would exceed the remaining
          length of the path

    Finish Condition:
        - the vehicle is back at the depot

    Reward:
        - the sum of the prizes of visited nodes

    Args:
        generator: OPGenerator instance as the data generator
        generator_params: parameters for the generator; only used when
            `generator` is None
        prize_type: one of "dist", "unif" or "const". It is validated and stored
            on the environment; it is not forwarded to the generator here.
    """

    name = "op"

    def __init__(
        self,
        generator: OPGenerator = None,
        generator_params: Optional[dict] = None,
        prize_type: str = "dist",
        **kwargs,
    ):
        super().__init__(**kwargs)
        if generator is None:
            # `None` instead of a shared `{}` default avoids the mutable-default pitfall
            generator = OPGenerator(**(generator_params or {}))
        self.generator = generator
        self.prize_type = prize_type
        assert self.prize_type in [
            "dist",
            "unif",
            "const",
        ], f"Invalid prize_type: {self.prize_type}"
        self._make_spec(self.generator)

    def _step(self, td: TensorDict) -> TensorDict:
        """Apply `td["action"]` and update tour length, prize, visited set and mask."""
        current_node = td["action"][..., None]

        # Update tour length with the leg from the previous node to the chosen one
        previous_loc = gather_by_index(td["locs"], td["current_node"])
        current_loc = gather_by_index(td["locs"], current_node)
        tour_length = td["tour_length"] + (current_loc - previous_loc).norm(p=2, dim=-1)

        # Update prize with collected prize
        current_total_prize = td["current_total_prize"] + gather_by_index(
            td["prize"], current_node, dim=-1
        )

        # Set current node as visited
        visited = td["visited"].scatter(-1, current_node, 1)

        # Done if went back to depot (except if it's the first step, since we start at the depot)
        done = (current_node.squeeze(-1) == 0) & (td["i"] > 0)

        # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here
        reward = torch.zeros_like(done)

        td.update(
            {
                "tour_length": tour_length,
                "current_node": current_node,
                "visited": visited,
                "current_total_prize": current_total_prize,
                "i": td["i"] + 1,
                "reward": reward,
                "done": done,
            }
        )
        # The mask depends on the freshly written state, so compute it last
        td.set("action_mask", self.get_action_mask(td))
        return td

    def _reset(
        self,
        td: Optional[TensorDict] = None,
        batch_size: Optional[list] = None,
    ) -> TensorDict:
        """Build the initial state from generated data (`depot`, `locs`, `prize`, `max_length`)."""
        device = td.device

        # Add depot to locs (depot becomes node 0)
        locs_with_depot = torch.cat((td["depot"][..., None, :], td["locs"]), -2)

        # Create reset TensorDict
        td_reset = TensorDict(
            {
                "locs": locs_with_depot,
                # add 0 prize for the depot
                "prize": F.pad(td["prize"], (1, 0), mode="constant", value=0),
                "tour_length": torch.zeros(*batch_size, device=device),
                # max_length is max length allowed when arriving at node, so subtract
                # distance to return to depot. Additionally, subtract an epsilon
                # margin for numeric stability
                "max_length": td["max_length"][..., None]
                - (td["depot"][..., None, :] - locs_with_depot).norm(p=2, dim=-1)
                - 1e-6,
                "current_node": torch.zeros(
                    *batch_size, 1, dtype=torch.long, device=device
                ),
                "visited": torch.zeros(
                    (*batch_size, locs_with_depot.shape[-2]),
                    dtype=torch.bool,
                    device=device,
                ),
                "current_total_prize": torch.zeros(
                    *batch_size, dtype=torch.float, device=device
                ),
                # step counter
                "i": torch.zeros((*batch_size,), dtype=torch.int64, device=device),
            },
            batch_size=batch_size,
        )
        td_reset.set("action_mask", self.get_action_mask(td_reset))
        return td_reset

    @staticmethod
    def get_action_mask(td: TensorDict) -> torch.Tensor:
        """Get action mask with 1 = feasible action, 0 = infeasible action.

        A node cannot be visited if it was already visited, if the depot has been
        visited, or if reaching it would exceed its (per-node) maximum length.
        """
        current_loc = gather_by_index(td["locs"], td["current_node"])[..., None, :]
        exceeds_length = (
            td["tour_length"][..., None] + (td["locs"] - current_loc).norm(p=2, dim=-1)
            > td["max_length"]
        )
        mask = td["visited"] | td["visited"][..., 0:1] | exceeds_length

        action_mask = ~mask  # 1 = feasible action, 0 = infeasible action

        # Depot can always be visited: we do not hardcode knowledge that this is
        # strictly suboptimal if other options are available
        action_mask[..., 0] = 1
        return action_mask

    def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor:
        """Reward is the sum of the prizes of visited nodes."""
        # In case all tours directly return to depot, prevent further problems
        if actions.size(-1) == 1:
            assert (actions == 0).all(), "If all length 1 tours, they should be zero"
            return torch.zeros(actions.size(0), dtype=torch.float, device=actions.device)

        # Prize is padded with 0 for the depot at index 0, so depot visits add nothing
        collected_prize = td["prize"].gather(1, actions)
        return collected_prize.sum(-1)

    @staticmethod
    def check_solution_validity(
        td: TensorDict, actions: torch.Tensor, add_distance_to_depot: bool = True
    ) -> None:
        """Check that solution is valid: nodes are not visited twice (except the
        depot) and the maximum tour length is not exceeded.

        If `add_distance_to_depot` is True, the distance to the depot is added back
        to the max length, since the reset function subtracts it (plus an epsilon)
        from `td["max_length"]`.

        Raises:
            AssertionError: if a customer appears twice or the length limit is violated.
        """
        sorted_actions = actions.data.sort(1)[0]
        # After sorting, every entry must be the depot (0) or strictly larger than
        # its predecessor, i.e. each customer is visited once at most
        assert (
            (sorted_actions[:, 1:] == 0)
            | (sorted_actions[:, 1:] > sorted_actions[:, :-1])
        ).all(), "Duplicates"

        # Gather locations in order of tour and get the length of tours
        locs_ordered = gather_by_index(td["locs"], actions)
        length = get_tour_length(locs_ordered)

        max_length = td["max_length"]
        if add_distance_to_depot:
            max_length = (
                max_length
                + (td["locs"][..., 0:1, :] - td["locs"]).norm(p=2, dim=-1)
                + 1e-6
            )
        assert (
            length[..., None] <= max_length + 1e-5
        ).all(), "Max length exceeded by {}".format(
            (length[..., None] - max_length).max()
        )

    def _make_spec(self, generator: OPGenerator):
        """Make the observation and action specs from the parameters."""
        self.observation_spec = Composite(
            locs=Bounded(
                low=generator.min_loc,
                high=generator.max_loc,
                shape=(generator.num_loc + 1, 2),
                dtype=torch.float32,
            ),
            current_node=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            # `_reset` pads the prize with a 0 entry for the depot
            prize=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.float32,
            ),
            # one accumulated length per instance
            tour_length=Unbounded(
                shape=(1,),
                dtype=torch.float32,
            ),
            visited=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.bool,
            ),
            max_length=Unbounded(
                shape=(1,),
                dtype=torch.float32,
            ),
            # same layout as `visited`: one flag per node including the depot
            action_mask=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.bool,
            ),
            shape=(),
        )
        self.action_spec = Bounded(
            shape=(1,),
            dtype=torch.int64,
            low=0,
            high=generator.num_loc + 1,
        )
        self.reward_spec = Unbounded(shape=(1,))
        self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)

    @staticmethod
    def render(td: TensorDict, actions: torch.Tensor = None, ax=None):
        """Plot the instance (and the tour, if actions are available)."""
        return render(td, actions, ax)
# From Kool et al. 2019
MAX_LENGTHS = {20: 2.0, 50: 3.0, 100: 4.0}


class OPGenerator(Generator):
    """Data generator for the Orienteering Problem (OP).

    Args:
        num_loc: number of locations (customers) in the OP, without the depot.
            (e.g. 10 means 10 locs + 1 depot)
        min_loc: minimum value for the location coordinates
        max_loc: maximum value for the location coordinates
        loc_distribution: distribution for the location coordinates
        depot_distribution: distribution for the depot location. If None, sample
            the depot from the locations
        min_prize: minimum value for the prize of each customer
        max_prize: maximum value for the prize of each customer
        prize_distribution: distribution for the prize of each customer
        prize_type: how `_generate` builds prizes: "const" (all ones), "unif"
            (uniform on {0.01, ..., 1.00}) or "dist" (scaled distance to the depot)
        max_length: maximum length of the path; a float shared by all instances or
            a tensor of per-instance values. If None, the value is looked up in
            `MAX_LENGTHS` (closest `num_loc` if there is no exact entry)

    Returns:
        A TensorDict with the following keys:
            locs [batch_size, num_loc, 2]: locations of each customer
            depot [batch_size, 2]: location of the depot
            prize [batch_size, num_loc]: prize of each customer
            max_length [batch_size]: maximum length of the path for each instance
    """

    def __init__(
        self,
        num_loc: int = 20,
        min_loc: float = 0.0,
        max_loc: float = 1.0,
        loc_distribution: Union[int, float, str, type, Callable] = Uniform,
        depot_distribution: Union[int, float, str, type, Callable] = None,
        min_prize: float = 1.0,
        max_prize: float = 1.0,
        prize_distribution: Union[int, float, type, Callable] = Uniform,
        prize_type: str = "dist",
        max_length: Union[float, torch.Tensor] = None,
        **kwargs,
    ):
        self.num_loc = num_loc
        self.min_loc = min_loc
        self.max_loc = max_loc
        self.min_prize = min_prize
        self.max_prize = max_prize
        self.prize_type = prize_type

        # Location distribution (an explicit sampler in kwargs takes precedence)
        if kwargs.get("loc_sampler", None) is not None:
            self.loc_sampler = kwargs["loc_sampler"]
        else:
            self.loc_sampler = get_sampler(
                "loc", loc_distribution, min_loc, max_loc, **kwargs
            )

        # Depot distribution
        if kwargs.get("depot_sampler", None) is not None:
            self.depot_sampler = kwargs["depot_sampler"]
        elif depot_distribution is not None:
            self.depot_sampler = get_sampler(
                "depot", depot_distribution, min_loc, max_loc, **kwargs
            )
        else:
            # `_generate` then takes the first sampled location as the depot
            self.depot_sampler = None

        # Prize distribution
        # NOTE: `_generate` builds prizes from `prize_type` and does not read
        # `prize_sampler`; the attribute is kept for callers that rely on it.
        if kwargs.get("prize_sampler", None) is not None:
            self.prize_sampler = kwargs["prize_sampler"]
        elif prize_distribution == "dist":
            # If prize_distribution is 'dist', the prize is the distance from the depot
            self.prize_sampler = None
        else:
            self.prize_sampler = get_sampler(
                "prize", prize_distribution, min_prize, max_prize, **kwargs
            )

        # Max length: explicit value, else table lookup, else closest table entry
        if max_length is not None:
            self.max_length = max_length
        else:
            self.max_length = MAX_LENGTHS.get(num_loc, None)
        if self.max_length is None:
            closest_num_loc = min(MAX_LENGTHS.keys(), key=lambda x: abs(x - num_loc))
            self.max_length = MAX_LENGTHS[closest_num_loc]
            log.warning(
                f"The max length for {num_loc} locations is not defined. "
                f"Using the closest max length: {self.max_length} "
                f"with {closest_num_loc} locations."
            )

    def _generate(self, batch_size) -> TensorDict:
        """Sample a batch of OP instances.

        Args:
            batch_size: iterable of batch dimensions (it is unpacked with `*`).
        """
        # Sample locations: depot and customers
        if self.depot_sampler is not None:
            depot = self.depot_sampler.sample((*batch_size, 2))
            locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2))
        else:
            # if depot_sampler is None, sample the depot from the locations
            locs = self.loc_sampler.sample((*batch_size, self.num_loc + 1, 2))
            depot = locs[..., 0, :]
            locs = locs[..., 1:, :]

        # Index from the right so any number of leading batch dims is supported
        locs_with_depot = torch.cat((depot[..., None, :], locs), dim=-2)

        # Methods taken from Fischetti et al. (1998) and Kool et al. (2019)
        if self.prize_type == "const":
            prize = torch.ones(*batch_size, self.num_loc, device=self.device)
        elif self.prize_type == "unif":
            prize = (
                1
                + torch.randint(
                    0, 100, (*batch_size, self.num_loc), device=self.device
                ).float()
            ) / 100
        elif self.prize_type == "dist":  # based on the distance to the depot
            prize = (locs_with_depot[..., 0:1, :] - locs_with_depot[..., 1:, :]).norm(
                p=2, dim=-1
            )
            # Scale so the farthest customer gets 1.00, quantized to 1/100 steps
            prize = (
                1 + (prize / prize.max(dim=-1, keepdim=True)[0] * 99).int()
            ).float() / 100
        else:
            raise ValueError(f"Invalid prize_type: {self.prize_type}")

        # Support for heterogeneous max length if provided
        if not isinstance(self.max_length, torch.Tensor):
            max_length = torch.full((*batch_size,), self.max_length)
        else:
            max_length = self.max_length

        return TensorDict(
            {
                "locs": locs_with_depot[..., 1:, :],
                "depot": locs_with_depot[..., 0, :],
                "prize": prize,
                "max_length": max_length,
            },
            batch_size=batch_size,
        )
def render(td, actions=None, ax=None):
    """Plot an OP instance and, if available, the tour given by `actions`.

    Args:
        td: state holding `locs` (depot at index 0) and `prize` (depot entry at
            index 0). If it is batched, only the first element is drawn.
        actions: node indices of the tour (0 = depot). If None, `td["action"]`
            is used when present.
        ax: matplotlib axes to draw on; a new figure is created if None.

    Returns:
        The axes that were drawn on.
    """
    # Create a plot of the nodes
    if ax is None:
        _, ax = plt.subplots()

    td = td.detach().cpu()

    # Actions
    if actions is None:
        actions = td.get("action", None)
    actions = actions.detach().cpu() if actions is not None else None

    # If the TensorDict is batched, select the first batch element
    if td.batch_size != torch.Size([]):
        td = td[0]
        actions = actions[0] if actions is not None else None

    # Variables
    locs = td["locs"]
    depot = locs[0, :]
    customers = locs[1:, :]
    prizes = td["prize"][1:]

    # Map prizes to marker sizes in [10, 210]. When all prizes are equal (e.g.
    # constant prizes) the range is zero, so use a fixed mid size instead of 0/0.
    prize_min = torch.min(prizes)
    prize_span = torch.max(prizes) - prize_min
    if prize_span > 0:
        normalized_prizes = 200 * (prizes - prize_min) / prize_span + 10
    else:
        normalized_prizes = torch.full_like(prizes, 110.0)

    # Plot depot and customers with prize
    ax.scatter(
        depot[0],
        depot[1],
        marker="s",
        c="tab:green",
        edgecolors="black",
        zorder=5,
        s=100,
    )  # Plot depot as square
    ax.scatter(
        customers[:, 0],
        customers[:, 1],
        s=normalized_prizes,
        c=normalized_prizes,
        cmap="autumn_r",
        alpha=0.6,
        edgecolors="black",
    )  # Plot all customers with size and color indicating the prize

    # Gather locs in order of action if available
    if actions is None:
        log.warning("No action in TensorDict, rendering unsorted locs")
    else:
        # Index the full location table: action 0 is the depot. Indexing
        # `customers[actions - 1]` would turn a depot visit into index -1,
        # i.e. the last customer.
        tour = locs[actions]

        # Append the depot at the beginning and the end of the tour
        tour = np.vstack((depot, tour, depot))

        # Use quiver to plot the tour
        dx, dy = np.diff(tour[:, 0]), np.diff(tour[:, 1])
        ax.quiver(
            tour[:-1, 0],
            tour[:-1, 1],
            dx,
            dy,
            scale_units="xy",
            angles="xy",
            scale=1,
            zorder=2,
            color="black",
            width=0.0035,
        )

    # Setup limits
    ax.set_xlim(-0.05, 1.05)
    ax.set_ylim(-0.05, 1.05)
    return ax
class PCTSPEnv(RL4COEnvBase):
    """Prize-collecting TSP (PCTSP) environment.

    The goal is to collect as much prize as possible while minimizing the total
    travel cost. This environment is deterministic (`_stochastic = False`): the
    prize that is collected is the `deterministic_prize` produced by the generator.

    Observations:
        - locations of the nodes
        - prize and penalty of each node
        - current location of the vehicle
        - current total prize
        - current total penalty
        - visited nodes
        - prize required before returning to the depot
        - the current step

    Constraints:
        - the tour starts and ends at the depot
        - the vehicle may only return to the depot once the required prize has
          been collected or every node has been visited

    Finish Condition:
        - the vehicle is back at the depot

    Reward:
        - the saved penalties minus (tour length + total penalty)

    Args:
        generator: PCTSPGenerator instance as the data generator
        generator_params: parameters for the generator; only used when
            `generator` is None
    """

    name = "pctsp"
    _stochastic = False

    def __init__(
        self,
        generator: PCTSPGenerator = None,
        generator_params: Optional[dict] = None,
        **kwargs,
    ):
        super().__init__(**kwargs)
        if generator is None:
            # `None` instead of a shared `{}` default avoids the mutable-default pitfall
            generator = PCTSPGenerator(**(generator_params or {}))
        self.generator = generator
        self._make_spec(self.generator)

    def _step(self, td: TensorDict) -> TensorDict:
        """Apply `td["action"]` and update prize, penalty, visited set and mask."""
        current_node = td["action"]

        # Accumulate prize and penalty of the chosen node
        cur_total_prize = td["cur_total_prize"] + gather_by_index(
            td["real_prize"], current_node
        )
        cur_total_penalty = td["cur_total_penalty"] + gather_by_index(
            td["penalty"], current_node
        )

        # Update visited
        visited = td["visited"].scatter(-1, current_node[..., None], 1)

        # Done when returning to the depot (not on the very first step)
        done = (td["i"] > 0) & (current_node == 0)

        # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here
        reward = torch.zeros_like(done)

        # Update state
        td.update(
            {
                "current_node": current_node,
                "cur_total_prize": cur_total_prize,
                "cur_total_penalty": cur_total_penalty,
                "visited": visited,
                "i": td["i"] + 1,
                "reward": reward,
                "done": done,
            }
        )
        td.set("action_mask", self.get_action_mask(td))
        return td

    def _reset(
        self, td: Optional[TensorDict] = None, batch_size: Optional[list] = None
    ) -> TensorDict:
        """Build the initial state from generated data."""
        device = td.device

        locs = torch.cat([td["depot"][..., None, :], td["locs"]], dim=-2)
        expected_prize = td["deterministic_prize"]
        real_prize = (
            td["stochastic_prize"] if self.stochastic else td["deterministic_prize"]
        )
        penalty = td["penalty"]

        # Prepend a zero entry for the depot
        real_prize_with_depot = torch.cat(
            [torch.zeros_like(real_prize[..., :1]), real_prize], dim=-1
        )
        penalty_with_depot = F.pad(penalty, (1, 0), mode="constant", value=0)

        # Initialize the current node and prize / penalty
        current_node = torch.zeros((*batch_size,), dtype=torch.int64, device=device)
        cur_total_prize = torch.zeros(*batch_size, device=device)
        cur_total_penalty = penalty.sum(-1)  # Sum penalties (all when nothing is visited)

        # Nothing is visited yet
        visited = torch.zeros(
            (*batch_size, self.generator.num_loc + 1), dtype=torch.bool, device=device
        )
        i = torch.zeros((*batch_size,), dtype=torch.int64, device=device)
        prize_required = torch.full(
            (*batch_size,), self.generator.prize_required, device=device
        )

        td_reset = TensorDict(
            {
                "locs": locs,
                "current_node": current_node,
                "expected_prize": expected_prize,
                "real_prize": real_prize_with_depot,
                "penalty": penalty_with_depot,
                "cur_total_prize": cur_total_prize,
                "cur_total_penalty": cur_total_penalty,
                "visited": visited,
                "prize_required": prize_required,
                "i": i,
            },
            batch_size=batch_size,
        )
        td_reset.set("action_mask", self.get_action_mask(td_reset))
        return td_reset

    @staticmethod
    def get_action_mask(td: TensorDict) -> torch.Tensor:
        """Get action mask with True = feasible action.

        Visited nodes are infeasible, and everything is infeasible once the depot
        has been visited. The depot itself is infeasible while the collected prize
        is below the required prize and unvisited nodes remain.
        """
        # Use the per-instance requirement written by `_reset`; fall back to the
        # historical threshold of 1.0 for states that do not carry it
        prize_required = td["prize_required"] if "prize_required" in td.keys() else 1.0

        mask = td["visited"] | td["visited"][..., 0:1]
        mask[..., 0] = (td["cur_total_prize"] < prize_required) & (
            td["visited"][..., 1:].int().sum(-1) < td["visited"][..., 1:].size(-1)
        )
        return ~(mask > 0)  # Invert mask, since 1 means feasible action

    def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor:
        """Reward is `saved penalties - (total length + penalty)`."""

        # In case all tours directly return to depot, prevent further problems
        if actions.size(-1) == 1:
            assert (actions == 0).all(), "If all length 1 tours, they should be zero"
            return torch.zeros(actions.size(0), dtype=torch.float, device=actions.device)

        # Gather locations in order of tour (add depot since we start and end there)
        locs_ordered = torch.cat(
            [
                td["locs"][..., 0:1, :],  # depot
                gather_by_index(td["locs"], actions),  # order locations
            ],
            dim=1,
        )
        length = get_tour_length(locs_ordered)

        # Reward is saved penalties - (total length + penalty)
        saved_penalty = td["penalty"].gather(1, actions)
        return saved_penalty.sum(-1) - (length + td["penalty"][..., 1:].sum(-1))

    @staticmethod
    def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None:
        """Check that the solution is valid, i.e. contains each node once at most,
        and either the prize constraint is met or all nodes are visited.

        Raises:
            AssertionError: if a node is duplicated or the prize constraint fails.
        """
        sorted_actions = actions.data.sort(1)[0]

        # After sorting, every entry must be the depot (0) or strictly larger than
        # its predecessor, i.e. each node is visited once at most
        assert (
            (sorted_actions[..., 1:] == 0)
            | (sorted_actions[..., 1:] > sorted_actions[..., :-1])
        ).all(), "Duplicates"

        prize = td["real_prize"][..., 1:]  # Remove depot
        prize_with_depot = torch.cat((torch.zeros_like(prize[:, :1]), prize), 1)
        p = prize_with_depot.gather(1, actions)

        # Same threshold as in `get_action_mask`
        prize_required = td["prize_required"] if "prize_required" in td.keys() else 1.0

        # Either prize constraint should be satisfied or all nodes should be visited
        assert (
            (p.sum(-1) >= prize_required - 1e-5)
            | (
                sorted_actions.size(-1) - (sorted_actions == 0).int().sum(-1)
                == (td["locs"].size(-2) - 1)
            )  # no depot
        ).all(), "Total prize does not satisfy min total prize"

    @property
    def stochastic(self):
        return self._stochastic

    @stochastic.setter
    def stochastic(self, state: bool):
        # The value is not stored: this setter only warns, so `stochastic`
        # keeps returning `_stochastic`.
        if state is True:
            log.warning(
                "Stochastic mode should not be used for PCTSP. Use SPCTSP instead."
            )

    def _make_spec(self, generator):
        """Make the observation and action specs from the parameters."""
        self.observation_spec = Composite(
            # `_reset` prepends the depot, hence num_loc + 1 nodes
            locs=Bounded(
                low=generator.min_loc,
                high=generator.max_loc,
                shape=(generator.num_loc + 1, 2),
                dtype=torch.float32,
            ),
            current_node=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            expected_prize=Unbounded(
                shape=(generator.num_loc,),
                dtype=torch.float32,
            ),
            real_prize=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.float32,
            ),
            penalty=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.float32,
            ),
            cur_total_prize=Unbounded(
                shape=(1,),
                dtype=torch.float32,
            ),
            cur_total_penalty=Unbounded(
                shape=(1,),
                dtype=torch.float32,
            ),
            visited=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.bool,
            ),
            prize_required=Unbounded(
                shape=(1,),
                dtype=torch.float32,
            ),
            i=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            # same layout as `visited`: one flag per node including the depot
            action_mask=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.bool,
            ),
            shape=(),
        )
        # Upper bound num_loc + 1, matching the OP and PDP environments, so the
        # last customer index stays inside the action space
        self.action_spec = Bounded(
            shape=(1,),
            dtype=torch.int64,
            low=0,
            high=generator.num_loc + 1,
        )
        self.reward_spec = Unbounded(shape=(1,))
        self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)

    @staticmethod
    def render(td: TensorDict, actions: torch.Tensor = None, ax=None):
        """Plot the instance (and the tour, if actions are available)."""
        return render(td, actions, ax)
class PCTSPGenerator(Generator):
    """Data generator for the Prize-collecting Traveling Salesman Problem (PCTSP).

    Args:
        num_loc: number of locations (customers), without the depot.
            (e.g. 10 means 10 locs + 1 depot)
        min_loc: minimum value for the location coordinates
        max_loc: maximum value for the location coordinates
        loc_distribution: distribution for the location coordinates
        depot_distribution: distribution for the depot location. If None, sample
            the depot from the locations
        penalty_factor: scales the upper bound of the uniform penalty
            (`max_penalty * penalty_factor / num_loc`)
        prize_required: stored on the generator as `prize_required`
        **kwargs: may contain `loc_sampler`, `depot_sampler` and `max_penalty`;
            it is also forwarded to `get_sampler`

    Returns:
        A TensorDict with the following keys:
            locs [batch_size, num_loc, 2]: locations of each customer
            depot [batch_size, 2]: location of the depot
            penalty [batch_size, num_loc]: penalty of each customer
            deterministic_prize [batch_size, num_loc]: prize sampled from
                U(0, 4 / num_loc)
            stochastic_prize [batch_size, num_loc]: U(0, 2) sample multiplied by
                the deterministic prize
    """

    def __init__(
        self,
        num_loc: int = 20,
        min_loc: float = 0.0,
        max_loc: float = 1.0,
        loc_distribution: Union[int, float, str, type, Callable] = Uniform,
        depot_distribution: Union[int, float, str, type, Callable] = None,
        penalty_factor: float = 3.0,
        prize_required: float = 1.0,
        **kwargs,
    ):
        self.num_loc = num_loc
        self.min_loc = min_loc
        self.max_loc = max_loc
        self.penalty_factor = penalty_factor
        # Misspelled attribute kept as an alias for code that already reads it
        self.penalty_fctor = penalty_factor
        self.prize_required = prize_required

        # Location distribution (an explicit sampler in kwargs takes precedence)
        if kwargs.get("loc_sampler", None) is not None:
            self.loc_sampler = kwargs["loc_sampler"]
        else:
            self.loc_sampler = get_sampler(
                "loc", loc_distribution, min_loc, max_loc, **kwargs
            )

        # Depot distribution
        if kwargs.get("depot_sampler", None) is not None:
            self.depot_sampler = kwargs["depot_sampler"]
        elif depot_distribution is not None:
            self.depot_sampler = get_sampler(
                "depot", depot_distribution, min_loc, max_loc, **kwargs
            )
        else:
            # `_generate` then takes the first sampled location as the depot
            self.depot_sampler = None

        # Prize distribution
        # NOTE: the sampler name "deterministric_prize" is passed through
        # unchanged; its spelling is a runtime value, so it is left as is.
        self.deterministic_prize_sampler = get_sampler(
            "deterministric_prize", "uniform", 0.0, 4.0 / self.num_loc, **kwargs
        )
        self.stochastic_prize_sampler = get_sampler(
            "stochastic_prize", "uniform", 0.0, 2.0, **kwargs
        )

        # For the penalty to make sense it should be not too large (in which case all nodes will be visited) nor too small
        # so we want the objective term to be approximately equal to the length of the tour, which we estimate with half
        # of the nodes by half of the tour length (which is very rough but similar to op)
        # This means that the sum of penalties for all nodes will be approximately equal to the tour length (on average)
        # The expected total (uniform) penalty of half of the nodes (since approx half will be visited by the constraint)
        # is (n / 2) / 2 = n / 4 so divide by this means multiply by 4 / n,
        # However instead of 4 we use penalty_factor (3 works well) so we can make them larger or smaller
        self.max_penalty = kwargs.get("max_penalty", None)
        if self.max_penalty is None:  # If not provided, use the default max penalty
            self.max_penalty = MAX_LENGTHS.get(num_loc, None)
        if self.max_penalty is None:
            # If not in the table keys, find the closest number of nodes as the key
            closest_num_loc = min(MAX_LENGTHS.keys(), key=lambda x: abs(x - num_loc))
            self.max_penalty = MAX_LENGTHS[closest_num_loc]
            log.warning(
                f"The max penalty for {num_loc} locations is not defined. "
                f"Using the closest max penalty: {self.max_penalty} "
                f"with {closest_num_loc} locations."
            )

        # Adjust as in Kool et al. (2019)
        self.max_penalty *= penalty_factor / self.num_loc
        self.penalty_sampler = get_sampler(
            "penalty", "uniform", 0.0, self.max_penalty, **kwargs
        )

    def _generate(self, batch_size) -> TensorDict:
        """Sample a batch of PCTSP instances.

        Args:
            batch_size: iterable of batch dimensions (it is unpacked with `*`).
        """
        # Sample locations: depot and customers
        if self.depot_sampler is not None:
            depot = self.depot_sampler.sample((*batch_size, 2))
            locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2))
        else:
            # if depot_sampler is None, sample the depot from the locations
            locs = self.loc_sampler.sample((*batch_size, self.num_loc + 1, 2))
            depot = locs[..., 0, :]
            locs = locs[..., 1:, :]

        # Sample penalty
        penalty = self.penalty_sampler.sample((*batch_size, self.num_loc))

        # Take uniform prizes
        # Now expectation is 0.5 so expected total prize is n / 2, we want to force to visit approximately half of the nodes
        # so the constraint will be that total prize >= (n / 2) / 2 = n / 4
        # equivalently, we divide all prizes by n / 4 and the total prize should be >= 1
        deterministic_prize = self.deterministic_prize_sampler.sample(
            (*batch_size, self.num_loc)
        )

        # In the deterministic setting, the stochastic_prize is not used and the deterministic prize is known
        # In the stochastic setting, the deterministic prize is the expected prize and is known up front but the
        # stochastic prize is only revealed once the node is visited
        # Stochastic prize is between (0, 2 * expected_prize) such that E(stochastic prize) = E(deterministic_prize)
        stochastic_prize = (
            self.stochastic_prize_sampler.sample((*batch_size, self.num_loc))
            * deterministic_prize
        )

        return TensorDict(
            {
                "locs": locs,
                "depot": depot,
                "penalty": penalty,
                "deterministic_prize": deterministic_prize,
                "stochastic_prize": stochastic_prize,
            },
            batch_size=batch_size,
        )
def render(td, actions=None, ax=None):
    """Plot a PCTSP instance and, if available, the tour given by `actions`.

    Node size and fill color encode the prize; border color and border width
    encode the penalty.

    Args:
        td: state holding `locs`, `real_prize` and `penalty`, each with the depot
            at index 0. If it is batched, only the first element is drawn.
        actions: node indices of the tour (0 = depot). If None, `td["action"]`
            is used when present.
        ax: matplotlib axes to draw on; a new figure is created if None.

    Returns:
        The axes that were drawn on.
    """
    import matplotlib.pyplot as plt
    import numpy as np

    from matplotlib import colormaps

    # Create a plot of the nodes
    if ax is None:
        _, ax = plt.subplots()

    td = td.detach().cpu()

    # Actions
    if actions is None:
        actions = td.get("action", None)
    actions = actions.detach().cpu() if actions is not None else None

    # If the TensorDict is batched, select the first batch element
    if td.batch_size != torch.Size([]):
        td = td[0]
        actions = actions[0] if actions is not None else None

    # Variables
    locs = td["locs"]
    depot = locs[0, :]
    customers = locs[1:, :]
    prizes = td["real_prize"][1:]
    penalties = td["penalty"][1:]

    # Map prizes to marker sizes in [10, 210]; guard the zero-range case (all
    # prizes equal) that would otherwise produce 0/0 = NaN sizes
    prize_min = torch.min(prizes)
    prize_span = torch.max(prizes) - prize_min
    if prize_span > 0:
        normalized_prizes = 200 * (prizes - prize_min) / prize_span + 10
    else:
        normalized_prizes = torch.full_like(prizes, 110.0)

    # Penalties scaled to [0, 1]; same zero-range guard
    penalty_min = torch.min(penalties)
    penalty_span = torch.max(penalties) - penalty_min
    if penalty_span > 0:
        unit_penalties = (penalties - penalty_min) / penalty_span
    else:
        unit_penalties = torch.zeros_like(penalties)

    # Represent penalty with colormap and size of edges. The colormap expects
    # floats in [0, 1], so it gets the unit-scaled values, while the border
    # width keeps the original [0, 3] range.
    penalty_cmap = colormaps.get_cmap("BuPu")
    penalty_colors = penalty_cmap(unit_penalties.numpy())
    normalized_penalties = (3 * unit_penalties).numpy()

    # Plot depot and customers with prize (size of nodes) and penalties (size of borders)
    ax.scatter(
        depot[0],
        depot[1],
        marker="s",
        c="tab:green",
        edgecolors="black",
        zorder=1,
        s=100,
    )  # Plot depot as square
    ax.scatter(
        customers[:, 0],
        customers[:, 1],
        s=normalized_prizes,
        c=normalized_prizes,
        cmap="autumn_r",
        alpha=1,
        edgecolors=penalty_colors,
        linewidths=normalized_penalties,
    )  # Plot all customers with size and color indicating the prize

    # Gather locs in order of action if available
    if actions is None:
        print("No action in TensorDict, rendering unsorted locs")
    else:
        # Index the full location table: action 0 is the depot. Indexing
        # `customers[actions - 1]` would turn a depot visit into index -1,
        # i.e. the last customer.
        tour = locs[actions]

        # Append the depot at the beginning and the end of the tour
        tour = np.vstack((depot, tour, depot))

        # Use quiver to plot the tour
        dx, dy = np.diff(tour[:, 0]), np.diff(tour[:, 1])
        ax.quiver(
            tour[:-1, 0],
            tour[:-1, 1],
            dx,
            dy,
            scale_units="xy",
            angles="xy",
            scale=1,
            zorder=2,
            color="black",
            width=0.0035,
        )

    # Setup limits
    ax.set_xlim(-0.05, 1.05)
    ax.set_ylim(-0.05, 1.05)
    return ax
class PDPEnv(RL4COEnvBase):
    """Pickup and Delivery Problem (PDP) environment.

    The environment is made of num_loc + 1 locations (cities):
        - 1 depot
        - `num_loc` / 2 pickup locations
        - `num_loc` / 2 delivery locations
    The goal is to visit all the pickup and delivery locations in the shortest
    path possible starting from the depot.
    The condition is that the agent must visit a pickup location before visiting
    its corresponding delivery location.

    Observations:
        - locations of the depot, pickup, and delivery locations
        - current location of the vehicle
        - the remaining locations to deliver
        - the visited locations
        - the current step

    Constraints:
        - the tour starts and ends at the depot
        - each pickup location must be visited before its corresponding delivery location
        - the vehicle cannot visit the same location twice

    Finish Condition:
        - the vehicle has visited all locations

    Reward:
        - the negative length of the path

    Args:
        generator: PDPGenerator instance as the data generator
        generator_params: parameters for the generator; only used when
            `generator` is None
    """

    name = "pdp"

    def __init__(
        self,
        generator: PDPGenerator = None,
        generator_params: Optional[dict] = None,
        **kwargs,
    ):
        super().__init__(**kwargs)
        if generator is None:
            # `None` instead of a shared `{}` default avoids the mutable-default pitfall
            generator = PDPGenerator(**(generator_params or {}))
        self.generator = generator
        self._make_spec(self.generator)

    @staticmethod
    def _step(td: TensorDict) -> TensorDict:
        """Apply `td["action"]`: mark the node as used and unlock its delivery node."""
        current_node = td["action"].unsqueeze(-1)

        num_loc = td["locs"].shape[-2] - 1  # except depot

        # Delivery node paired with the selected node. For depot and delivery
        # nodes the modulo maps onto an index whose `to_deliver` flag is already
        # set by `_reset`, so the scatter below changes nothing for them.
        new_to_deliver = (current_node + num_loc // 2) % (num_loc + 1)

        # Set available to 0 (i.e., we visited the node)
        available = td["available"].scatter(-1, current_node, 0)

        to_deliver = td["to_deliver"].scatter(-1, new_to_deliver, 1)

        # Action is feasible if the node is not visited and is to deliver
        action_mask = available & to_deliver

        # We are done when there are no unvisited locations
        done = torch.count_nonzero(available, dim=-1) == 0

        # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here
        reward = torch.zeros_like(done)

        # Update step
        td.update(
            {
                "current_node": current_node,
                "available": available,
                "to_deliver": to_deliver,
                "i": td["i"] + 1,
                "action_mask": action_mask,
                "reward": reward,
                "done": done,
            }
        )
        return td

    def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict:
        """Build the initial state from generated data (`depot`, `locs`)."""
        device = td.device

        locs = torch.cat((td["depot"][..., None, :], td["locs"]), -2)

        # Depot and pickups are 1, deliveries are 0
        # [batch_size, graph_size+1], [1,1...1, 0...0]
        to_deliver = torch.cat(
            [
                torch.ones(
                    *batch_size,
                    self.generator.num_loc // 2 + 1,
                    dtype=torch.bool,
                    device=device,
                ),
                torch.zeros(
                    *batch_size,
                    self.generator.num_loc // 2,
                    dtype=torch.bool,
                    device=device,
                ),
            ],
            dim=-1,
        )

        # Every node, including the depot, starts as not yet visited
        available = torch.ones(
            (*batch_size, self.generator.num_loc + 1), dtype=torch.bool, device=device
        )
        # At the first step only the depot (index 0) is feasible
        action_mask = ~available.contiguous()  # [batch_size, graph_size+1]
        action_mask[..., 0] = 1  # First step is always the depot

        # Other variables
        current_node = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device)
        i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device)

        return TensorDict(
            {
                "locs": locs,
                "current_node": current_node,
                "to_deliver": to_deliver,
                "available": available,
                "i": i,
                "action_mask": action_mask,
            },
            batch_size=batch_size,
        )

    def _make_spec(self, generator: PDPGenerator):
        """Make the observation and action specs from the parameters."""
        self.observation_spec = Composite(
            locs=Bounded(
                low=generator.min_loc,
                high=generator.max_loc,
                shape=(generator.num_loc + 1, 2),
                dtype=torch.float32,
            ),
            current_node=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            # `_reset` builds one boolean flag per node including the depot
            to_deliver=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.bool,
            ),
            i=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            action_mask=Unbounded(
                shape=(generator.num_loc + 1,),
                dtype=torch.bool,
            ),
            shape=(),
        )
        self.action_spec = Bounded(
            shape=(1,),
            dtype=torch.int64,
            low=0,
            high=generator.num_loc + 1,
        )
        self.reward_spec = Unbounded(shape=(1,))
        self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)

    @staticmethod
    def _get_reward(td, actions) -> torch.Tensor:
        """Return the negative tour length of `actions`."""
        # Gather locations in order of tour (add depot since we start and end there)
        locs_ordered = torch.cat(
            [
                td["locs"][..., 0:1, :],  # depot
                gather_by_index(td["locs"], actions),  # order locations
            ],
            dim=1,
        )
        return -get_tour_length(locs_ordered)

    def check_solution_validity(self, td, actions):
        """Check that every node is visited exactly once and pickups precede deliveries.

        Raises:
            AssertionError: if `actions` is not a permutation of `0..n-1` or a
                delivery comes before its pickup.
        """
        # assert (actions[:, 0] == 0).all(), "Not starting at depot"
        expected = torch.arange(
            actions.size(1), dtype=actions.dtype, device=actions.device
        )
        assert (
            expected.view(1, -1).expand_as(actions) == actions.data.sort(1)[0]
        ).all(), "Not visiting all nodes"

        # argsort of a permutation gives, for each node, the step it is visited at
        visited_time = torch.argsort(actions, 1)
        half = actions.size(1) // 2
        # index of pickup less than index of delivery
        assert (
            visited_time[:, 1 : half + 1] < visited_time[:, half + 1 :]
        ).all(), "Deliverying without pick-up"

    def get_num_starts(self, td):
        """Only half of the nodes (i.e. pickup nodes) can be start nodes"""
        return (td["locs"].shape[-2] - 1) // 2

    def select_start_nodes(self, td, num_starts):
        """Only nodes from [1 : num_loc // 2 +1] (i.e. pickups) can be selected"""
        num_possible_starts = (td["locs"].shape[-2] - 1) // 2
        # Cycle through the pickup indices, repeating each once per batch element
        selected = (
            torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0])
            % num_possible_starts
            + 1
        )
        return selected

    @staticmethod
    def render(td: TensorDict, actions: torch.Tensor = None, ax=None):
        """Plot the instance (and the tour, if actions are available)."""
        return render(td, actions, ax)
+ The environment is made of num_loc + 1 locations (cities): + - 1 depot + - `num_loc` / 2 pickup locations + - `num_loc` / 2 delivery locations + + The goal is to search for optimal solutions to pickup and delivery problems by performing a ruin-and-repair neighborhood search on a given initial solution. + (see MDP described in https://arxiv.org/abs/2204.11399) + + The condition is that at each step, the visited solutions must be feasible, + maintaining the sequence of visiting the pickup location before its corresponding delivery location. + + Observations: + - locations of the depot, pickup, and delivery locations + - current solution to be improved + - historical decisions + - the current step + + Constraints: + - the tour starts and ends at the depot + - each pickup location must be visited before its corresponding delivery location + - the vehicle cannot visit the same location twice + + Finish Condition: + - None + + Reward: + - the immediate reduced cost over the current best-so-far solution + (see MDP described in https://arxiv.org/abs/2204.11399) + + Args: + num_loc: number of locations (cities) in the TSP + init_sol_type: the method type used for generating initial solutions (random or greedy) + td_params: parameters of the environment + seed: seed for the environment + device: device to use. 
Generally, no need to set as tensors are updated on the fly + """ + + name = "pdp_ruin_repair" + + def __init__( + self, + generator: PDPGenerator = None, + generator_params: dict = {}, + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = PDPGenerator(**generator_params) + self.generator = generator + self._make_spec(self.generator) + + def _step(self, td: TensorDict, solution_to=None) -> TensorDict: + # get state information from td + solution_best = td["rec_best"] + locs = td["locs"] + cost_bsf = td["cost_bsf"] + action_record = td["action_record"] + bs, gs = solution_best.size() + + # perform local_operator + if solution_to is None: + action = td["action"] + solution = td["rec_current"] + next_rec = self._local_operator(solution, action) + else: + next_rec = solution_to.clone() + new_obj = self.get_costs(locs, next_rec) + + # compute reward and update best-so-far solutions + now_bsf = torch.where(new_obj < cost_bsf, new_obj, cost_bsf) + reward = cost_bsf - now_bsf + index = reward > 0.0 + solution_best[index] = next_rec[index].clone() + + # reset visited_time + visited_time = td["visited_time"] * 0 + pre = torch.zeros((bs), device=visited_time.device).long() + arange = torch.arange(bs) + for i in range(gs): + current_nodes = next_rec[arange, pre] + visited_time[arange, current_nodes] = i + 1 + pre = current_nodes + visited_time = visited_time.long() + + # update action record + if solution_to is None: + action_record[:, :-1] = action_record[:, 1:] + action_record[:, -1] *= 0 + action_record[torch.arange(bs), -1, action[:, 0]] = 1 + + # Update step + td.update( + { + "cost_current": new_obj, + "cost_bsf": now_bsf, + "rec_current": next_rec, + "rec_best": solution_best, + "visited_time": visited_time, + "action_record": action_record, + "i": td["i"] + 1 if solution_to is None else td["i"], + "reward": reward, + } + ) + + return td + + def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: + device = 
td.device + + locs = torch.cat((td["depot"][:, None, :], td["locs"]), -2) + current_rec = self.generator._get_initial_solutions(locs).to(device) + obj = self.get_costs(locs, current_rec) + + # get index according to the solutions in the linked list data structure + bs = batch_size[0] + seq_length = self.generator.num_loc + 1 + visited_time = torch.zeros((bs, seq_length)).to(device) + pre = torch.zeros((bs)).to(device).long() + arange = torch.arange(bs) + for i in range(seq_length): + current_nodes = current_rec[arange, pre] + visited_time[arange, current_nodes] = i + 1 + pre = current_nodes + visited_time = visited_time.long() + + # get action record and step i + i = torch.zeros((*batch_size, 1), dtype=torch.int64).to(device) + action_record = ( + torch.zeros((bs, seq_length, seq_length // 2)) + if self.training + else torch.zeros((bs, seq_length // 2, seq_length // 2)) + ) + + return TensorDict( + { + "locs": locs, + "cost_current": obj, + "cost_bsf": obj.clone(), + "rec_current": current_rec, + "rec_best": current_rec.clone(), + "visited_time": visited_time, + "action_record": action_record, + "i": i, + }, + batch_size=batch_size, + ) + + @staticmethod + def _local_operator(solution, action): + # get info + pair_index = action[:, 0].view(-1, 1) + 1 + first = action[:, 1].view(-1, 1) + second = action[:, 2].view(-1, 1) + rec = solution.clone() + bs, gs = rec.size() + + # fix connection for pairing node + argsort = rec.argsort() + pre_pairfirst = argsort.gather(1, pair_index) + post_pairfirst = rec.gather(1, pair_index) + rec.scatter_(1, pre_pairfirst, post_pairfirst) + rec.scatter_(1, pair_index, pair_index) + + argsort = rec.argsort() + + pre_pairsecond = argsort.gather(1, pair_index + gs // 2) + post_pairsecond = rec.gather(1, pair_index + gs // 2) + + rec.scatter_(1, pre_pairsecond, post_pairsecond) + + # fix connection for pairing node + post_second = rec.gather(1, second) + rec.scatter_(1, second, pair_index + gs // 2) + rec.scatter_(1, pair_index + gs // 2, 
post_second) + + post_first = rec.gather(1, first) + rec.scatter_(1, first, pair_index) + rec.scatter_(1, pair_index, post_first) + + return rec + + def _make_spec(self, generator: PDPGenerator): + """Make the observation and action specs from the parameters.""" + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.num_loc + 1, 2), + dtype=torch.float32, + ), + cost_current=Unbounded( + shape=(1), + dtype=torch.float32, + ), + cost_bsf=Unbounded( + shape=(1), + dtype=torch.float32, + ), + rec_current=Unbounded( + shape=(self.generator.num_loc + 1), + dtype=torch.int64, + ), + rec_best=Unbounded( + shape=(self.generator.num_loc + 1), + dtype=torch.int64, + ), + visited_time=Unbounded( + shape=(self.generator.num_loc + 1, self.generator.num_loc + 1), + dtype=torch.int64, + ), + action_record=Unbounded( + shape=(self.generator.num_loc + 1, self.generator.num_loc + 1), + dtype=torch.int64, + ), + i=Unbounded( + shape=(1), + dtype=torch.int64, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(3,), + dtype=torch.int64, + low=0, + high=self.generator.num_loc + 1, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + def check_solution_validity(self, td, actions=None): + # The function can be called by the agent to check the validity of the best found solution + # Note that the args actions are not used in improvement method. 
+ + solution = td["rec_best"] + batch_size, graph_size = solution.size() + + assert ( + torch.arange(graph_size, out=solution.data.new()) + .view(1, -1) + .expand_as(solution) + == solution.data.sort(1)[0] + ).all(), "Not visiting all nodes" + + visited_time = torch.zeros((batch_size, graph_size), device=self.device) + pre = torch.zeros(batch_size, device=self.device).long() + arange = torch.arange(batch_size) + for i in range(graph_size): + visited_time[arange, solution[arange, pre]] = i + 1 + pre = solution[arange, pre] + + assert ( + visited_time[:, 1 : graph_size // 2 + 1] + < visited_time[:, graph_size // 2 + 1 :] + ).all(), "Deliverying without pick-up" + + @staticmethod + def get_mask(selected_node, td): + # return mask that is 1 if the corresponding action is feasible, 0 otherwise + + visited_time = td["visited_time"] + bs, gs = visited_time.size() + visited_time = visited_time % gs + arange = torch.arange(bs) + + visited_order_map = visited_time.view(bs, gs, 1) > visited_time.view(bs, 1, gs) + mask = visited_order_map.clone() + mask[arange, selected_node.view(-1)] = True + mask[arange, selected_node.view(-1) + gs // 2] = True + mask[arange, :, selected_node.view(-1)] = True + mask[arange, :, selected_node.view(-1) + gs // 2] = True + + bs, gs, _ = visited_order_map.size() + + return ~mask + + @classmethod + def _random_action(cls, td): + batch_size, graph_size = td["rec_best"].size() + selected_node = ( + (torch.rand(batch_size, 1) * graph_size // 2) % (graph_size // 2) + ).long() + mask = cls.get_mask(selected_node + 1, td) + logits = torch.rand(batch_size, graph_size, graph_size) + logits[~mask] = -1e20 + prob = torch.softmax(logits.view(batch_size, -1), -1) + sample = prob.multinomial(1) + action = torch.cat( + (selected_node, sample // (graph_size), sample % (graph_size)), -1 + ) + td["action"] = action + return action + + @classmethod + def render(cls, td: TensorDict, actions: torch.Tensor = None, ax=None): + solution_current = 
cls.get_current_solution(td) + solution_best = cls.get_best_solution(td) + return render_improvement(td, solution_current, solution_best) diff --git a/rl4co/envs/routing/pdp/generator.py b/rl4co/envs/routing/pdp/generator.py new file mode 100644 index 00000000..1c6dfd37 --- /dev/null +++ b/rl4co/envs/routing/pdp/generator.py @@ -0,0 +1,152 @@ +from typing import Callable, Union + +import torch + +from tensordict.tensordict import TensorDict +from torch.distributions import Uniform + +from rl4co.envs.common.utils import Generator, get_sampler +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class PDPGenerator(Generator): + """Data generator for the Pickup and Delivery Problem (PDP). + Args: + num_loc: number of locations (customers) in the PDP, without the depot. (e.g. 10 means 10 locs + 1 depot) + - 1 depot + - `num_loc` / 2 pickup locations + - `num_loc` / 2 delivery locations + min_loc: minimum value for the location coordinates + max_loc: maximum value for the location coordinates + init_sol_type: the method type used for generating initial solutions (random or greedy) + loc_distribution: distribution for the location coordinates + depot_distribution: distribution for the depot location. If None, sample the depot from the locations + + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each customer + depot [batch_size, 2]: location of the depot + """ + + def __init__( + self, + num_loc: int = 20, + min_loc: float = 0.0, + max_loc: float = 1.0, + init_sol_type: str = "random", + loc_distribution: Union[int, float, str, type, Callable] = Uniform, + depot_distribution: Union[int, float, str, type, Callable] = None, + **kwargs, + ): + self.num_loc = num_loc + self.min_loc = min_loc + self.max_loc = max_loc + self.init_sol_type = init_sol_type + + # Number of locations must be even + if num_loc % 2 != 0: + log.warn( + "Number of locations must be even. 
Adding 1 to the number of locations." + ) + self.num_loc += 1 + + # Location distribution + if kwargs.get("loc_sampler", None) is not None: + self.loc_sampler = kwargs["loc_sampler"] + else: + self.loc_sampler = get_sampler( + "loc", loc_distribution, min_loc, max_loc, **kwargs + ) + + # Depot distribution + if kwargs.get("depot_sampler", None) is not None: + self.depot_sampler = kwargs["depot_sampler"] + else: + self.depot_sampler = get_sampler( + "depot", depot_distribution, min_loc, max_loc, **kwargs + ) if depot_distribution is not None else None + + def _generate(self, batch_size) -> TensorDict: + # Sample locations: depot and customers + if self.depot_sampler is not None: + depot = self.depot_sampler.sample((*batch_size, 2)) + locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2)) + else: + # if depot_sampler is None, sample the depot from the locations + locs = self.loc_sampler.sample((*batch_size, self.num_loc + 1, 2)) + depot = locs[..., 0, :] + locs = locs[..., 1:, :] + + return TensorDict( + { + "locs": locs, + "depot": depot, + }, + batch_size=batch_size, + ) + + # for improvement MDP only (to be refactored by a combination of rollout and the random policy) + def _get_initial_solutions(self, coordinates): + order_size = self.num_loc // 2 + batch_size = coordinates.size(0) + + if self.init_sol_type == "random": + candidates = torch.ones(batch_size, self.num_loc + 1).bool() + candidates[:, order_size + 1 :] = 0 + rec = torch.zeros(batch_size, self.num_loc + 1).long() + selected_node = torch.zeros(batch_size, 1).long() + candidates.scatter_(1, selected_node, 0) + + for i in range(self.num_loc): + dists = torch.ones(batch_size, self.num_loc + 1) + dists.scatter_(1, selected_node, -1e20) + dists[~candidates] = -1e20 + dists = torch.softmax(dists, -1) + next_selected_node = dists.multinomial(1).view(-1, 1) + + add_index = (next_selected_node <= order_size).view(-1) + pairing = ( + next_selected_node[next_selected_node <= order_size].view(-1, 1) + + 
order_size + ) + candidates[add_index] = candidates[add_index].scatter_(1, pairing, 1) + + rec.scatter_(1, selected_node, next_selected_node) + candidates.scatter_(1, next_selected_node, 0) + selected_node = next_selected_node + + elif self.init_sol_type == "greedy": + candidates = torch.ones(batch_size, self.num_loc + 1).bool() + candidates[:, order_size + 1 :] = 0 + rec = torch.zeros(batch_size, self.num_loc + 1).long() + selected_node = torch.zeros(batch_size, 1).long() + candidates.scatter_(1, selected_node, 0) + + for i in range(self.num_loc): + d1 = coordinates.cpu().gather( + 1, selected_node.unsqueeze(-1).expand(batch_size, self.num_loc + 1, 2) + ) + d2 = coordinates.cpu() + + dists = (d1 - d2).norm(p=2, dim=2) + dists.scatter_(1, selected_node, 1e6) + dists[~candidates] = 1e6 + next_selected_node = dists.min(-1)[1].view(-1, 1) + + add_index = (next_selected_node <= order_size).view(-1) + pairing = ( + next_selected_node[next_selected_node <= order_size].view(-1, 1) + + order_size + ) + candidates[add_index] = candidates[add_index].scatter_(1, pairing, 1) + + rec.scatter_(1, selected_node, next_selected_node) + candidates.scatter_(1, next_selected_node, 0) + selected_node = next_selected_node + + else: + raise NotImplementedError() + + return rec.expand(batch_size, self.num_loc + 1).clone() diff --git a/rl4co/envs/routing/pdp/render.py b/rl4co/envs/routing/pdp/render.py new file mode 100644 index 00000000..2388f743 --- /dev/null +++ b/rl4co/envs/routing/pdp/render.py @@ -0,0 +1,142 @@ +import matplotlib.pyplot as plt +import torch + +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +# Only render the first instance +def render(td, actions=None, ax=None): + markersize = 8 + + td = td.detach().cpu() + # if batch_size greater than 0 , we need to select the first batch element + if td.batch_size != torch.Size([]): + td = td[0] + if actions is not None: + actions = actions[0] + + # Variables + init_deliveries = 
td["to_deliver"][1:] + delivery_locs = td["locs"][1:][~init_deliveries.bool()] + pickup_locs = td["locs"][1:][init_deliveries.bool()] + depot_loc = td["locs"][0] + actions = actions if actions is not None else td["action"] + + fig, ax = plt.subplots() + + # Plot the actions in order + for i in range(len(actions)): + from_node = actions[i] + to_node = ( + actions[i + 1] if i < len(actions) - 1 else actions[0] + ) # last goes back to depot + from_loc = td["locs"][from_node] + to_loc = td["locs"][to_node] + ax.plot([from_loc[0], to_loc[0]], [from_loc[1], to_loc[1]], "k-") + ax.annotate( + "", + xy=(to_loc[0], to_loc[1]), + xytext=(from_loc[0], from_loc[1]), + arrowprops=dict(arrowstyle="->", color="black"), + annotation_clip=False, + ) + + # Plot the depot location + ax.plot( + depot_loc[0], + depot_loc[1], + "g", + marker="s", + markersize=markersize, + label="Depot", + ) + + # Plot the pickup locations + for i, pickup_loc in enumerate(pickup_locs): + ax.plot( + pickup_loc[0], + pickup_loc[1], + "r", + marker="^", + markersize=markersize, + label="Pickup" if i == 0 else None, + ) + + # Plot the delivery locations + for i, delivery_loc in enumerate(delivery_locs): + ax.plot( + delivery_loc[0], + delivery_loc[1], + "b", + marker="v", + markersize=markersize, + label="Delivery" if i == 0 else None, + ) + + # Setup limits and show + ax.set_xlim(-0.05, 1.05) + ax.set_ylim(-0.05, 1.05) + + +def render_improvement(td, current_soltuion, best_soltuion): + coordinates = td["locs"][0] + real_seq = current_soltuion[:1] + real_best = best_soltuion[:1] + fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(16, 6)) # Create two side-by-side axes + + for ax in [ax1, ax2]: # Plot on both axes + if ax == ax1: + ax.axis([-0.05, 1.05] * 2) + # plot the nodes + ax.scatter( + coordinates[:, 0], coordinates[:, 1], marker="H", s=55, c="blue", zorder=2 + ) + # plot the tour + real_seq_coordinates = coordinates.gather( + 0, real_seq[0].unsqueeze(1).repeat(1, 2) + ) + real_seq_coordinates = 
torch.cat( + (real_seq_coordinates, real_seq_coordinates[:1]), 0 + ) + ax.plot( + real_seq_coordinates[:, 0], + real_seq_coordinates[:, 1], + color="black", + zorder=1, + ) + # mark node + for i, txt in enumerate(range(real_seq.size(1))): + ax.annotate( + txt, + (coordinates[i, 0] + 0.01, coordinates[i, 1] + 0.01), + ) + ax.set_title("Current Solution") + else: + ax.axis([-0.05, 1.05] * 2) + # plot the nodes + ax.scatter( + coordinates[:, 0], coordinates[:, 1], marker="H", s=55, c="blue", zorder=2 + ) + # plot the tour + real_best_coordinates = coordinates.gather( + 0, real_best[0].unsqueeze(1).repeat(1, 2) + ) + real_best_coordinates = torch.cat( + (real_best_coordinates, real_best_coordinates[:1]), 0 + ) + ax.plot( + real_best_coordinates[:, 0], + real_best_coordinates[:, 1], + color="black", + zorder=1, + ) + # mark node + for i, txt in enumerate(range(real_seq.size(1))): + ax.annotate( + txt, + (coordinates[i, 0] + 0.01, coordinates[i, 1] + 0.01), + ) + ax.set_title("Best Solution") + plt.tight_layout() diff --git a/rl4co/envs/routing/sdvrp/__init__.py b/rl4co/envs/routing/sdvrp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/sdvrp/env.py b/rl4co/envs/routing/sdvrp/env.py new file mode 100644 index 00000000..916a7a9f --- /dev/null +++ b/rl4co/envs/routing/sdvrp/env.py @@ -0,0 +1,205 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +from ..cvrp.env import CVRPEnv +from ..cvrp.generator import CVRPGenerator + +log = get_pylogger(__name__) + + +class SDVRPEnv(CVRPEnv): + """Split Delivery Vehicle Routing Problem (SDVRP) environment. + SDVRP is a generalization of CVRP, where nodes can be visited multiple times and a fraction of the demand can be met. 
+ At each step, the agent chooses a customer to visit depending on the current location and the remaining capacity. + When the agent visits a customer, the remaining capacity is updated. If the remaining capacity is not enough to + visit any customer, the agent must go back to the depot. The reward is the -infinite unless the agent visits all the customers. + In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length. + + Observations: + - location of the depot. + - locations and demand/remaining demand of each customer + - current location of the vehicle. + - the remaining capacity of the vehicle. + + Constraints: + - the tour starts and ends at the depot. + - each customer can be visited multiple times. + - the vehicle cannot visit customers exceed the remaining capacity. + - the vehicle can return to the depot to refill the capacity. + + Finish Condition: + - the vehicle has finished all customers demand and returned to the depot. + + Reward: + - (minus) the negative length of the path. + + Args: + generator: CVRPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "sdvrp" + + def __init__( + self, + generator: CVRPGenerator = None, + generator_params: dict = {}, + **kwargs, + ): + super().__init__(generator, generator_params, **kwargs) + + def _step(self, td: TensorDict) -> TensorDict: + # Update the state + current_node = td["action"][:, None] # Add dimension for step + + # Not selected_demand is demand of first node (by clamp) so incorrect for nodes that visit depot! 
+ selected_demand = gather_by_index( + td["demand_with_depot"], current_node, dim=-1, squeeze=False + )[..., :1] + delivered_demand = torch.min( + selected_demand, td["vehicle_capacity"] - td["used_capacity"] + ) + + # Increase capacity if depot is not visited, otherwise set to 0 + used_capacity = (td["used_capacity"] + delivered_demand) * ( + current_node != 0 + ).float() + + # Update demand + demand_with_depot = td["demand_with_depot"].scatter_add( + -1, current_node, -delivered_demand + ) + + # Get done + done = ~(demand_with_depot > 0).any(-1) + + # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here + reward = torch.zeros_like(done) + + # Update state + td.update( + { + "demand_with_depot": demand_with_depot, + "current_node": current_node, + "used_capacity": used_capacity, + "reward": reward, + "done": done, + } + ) + td.set("action_mask", self.get_action_mask(td)) + return td + + def _reset( + self, + td: Optional[TensorDict] = None, + batch_size: Optional[list] = None, + ) -> TensorDict: + device = td.device + + # Create reset TensorDict + reset_td = TensorDict( + { + "locs": torch.cat((td["depot"][..., None, :], td["locs"]), -2), + "demand": td["demand"], + "demand_with_depot": torch.cat( + (torch.zeros_like(td["demand"][..., 0:1]), td["demand"]), -1 + ), + "current_node": torch.zeros( + *batch_size, 1, dtype=torch.long, device=device + ), + "used_capacity": torch.zeros((*batch_size, 1), device=device), + "vehicle_capacity": torch.full( + (*batch_size, 1), self.generator.vehicle_capacity, device=device + ), + }, + batch_size=batch_size, + ) + reset_td.set("action_mask", self.get_action_mask(reset_td)) + return reset_td + + @staticmethod + def get_action_mask(td: TensorDict) -> torch.Tensor: + mask_loc = (td["demand_with_depot"][..., 1:] == 0) | ( + td["used_capacity"] >= td["vehicle_capacity"] + ) + mask_depot = (td["current_node"] == 0).squeeze(-1) & ( + (mask_loc == 0).int().sum(-1) > 0 + ) + return 
~torch.cat((mask_depot[..., None], mask_loc), -1) + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None: + """Check that the solution is valid (all demand is satisfied)""" + + batch_size, graph_size = td["demand"].size() + + # Each node can be visited multiple times, but we always deliver as much demand as possible + # We check that at the end all demand has been satisfied + demands = torch.cat((-td["vehicle_capacity"], td["demand"]), 1) + + rng = torch.arange(batch_size, out=demands.data.new().long()) + used_cap = torch.zeros_like(td["demand"][..., 0]) + a_prev = None + for a in actions.transpose(0, 1): + assert ( + a_prev is None or (demands[((a_prev == 0) & (a == 0)), :] == 0).all() + ), "Cannot visit depot twice if any nonzero demand" + d = torch.min(demands[rng, a], td["vehicle_capacity"].squeeze(-1) - used_cap) + demands[rng, a] -= d + used_cap += d + used_cap[a == 0] = 0 + a_prev = a + assert (demands == 0).all(), "All demand must be satisfied" + + def _make_spec(self, generator): + """Make the observation and action specs from the parameters.""" + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.num_loc + 1, 2), + dtype=torch.float32, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + demand=Bounded( + low=generator.min_demand, + high=generator.max_demand, + shape=(generator.num_loc, 1), # demand is only for customers + dtype=torch.float32, + ), + demand_with_depot=Bounded( + low=generator.min_demand, + high=generator.max_demand, + shape=(generator.num_loc + 1, 1), + dtype=torch.float32, + ), + used_capacity=Bounded( + low=0, + high=generator.vehicle_capacity, + shape=(1,), + dtype=torch.float32, + ), + action_mask=Unbounded( + shape=(generator.num_loc + 1, 1), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.num_loc + 1, + ) + self.reward_spec 
= Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) diff --git a/rl4co/envs/routing/spctsp/__init__.py b/rl4co/envs/routing/spctsp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/spctsp/env.py b/rl4co/envs/routing/spctsp/env.py new file mode 100644 index 00000000..4f99c070 --- /dev/null +++ b/rl4co/envs/routing/spctsp/env.py @@ -0,0 +1,31 @@ +from rl4co.utils.pylogger import get_pylogger + +from ..pctsp.env import PCTSPEnv + +log = get_pylogger(__name__) + + +class SPCTSPEnv(PCTSPEnv): + """Stochastic Prize Collecting Traveling Salesman Problem (SPCTSP) environment. + + Note: + The only difference with deterministic PCTSP is that the prizes are stochastic + (i.e. the expected prize is not the same as the real prize). + """ + + name = "spctsp" + _stochastic = True + + def __init__(self, **kwargs): + super().__init__(**kwargs) + + @property + def stochastic(self): + return self._stochastic + + @stochastic.setter + def stochastic(self, state: bool): + if state is False: + log.warning( + "Deterministic mode should not be used for SPCTSP. Use PCTSP instead." + ) diff --git a/rl4co/envs/routing/svrp/__init__.py b/rl4co/envs/routing/svrp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/svrp/env.py b/rl4co/envs/routing/svrp/env.py new file mode 100644 index 00000000..afcbae6a --- /dev/null +++ b/rl4co/envs/routing/svrp/env.py @@ -0,0 +1,248 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.utils.ops import gather_by_index, get_distance +from rl4co.utils.pylogger import get_pylogger + +from .generator import SVRPGenerator + +log = get_pylogger(__name__) + + +class SVRPEnv(RL4COEnvBase): + """Skill-Vehicle Routing Problem (SVRP) environment. + Basic Skill-VRP environment. 
The environment is a variant of the Capacitated Vehicle Routing Problem (CVRP). + Each technician has a certain skill-level and each customer node requires a certain skill-level to be serviced. + Each customer node needs is to be serviced by exactly one technician. Technicians can only service nodes if + their skill-level is greater or equal to the required skill-level of the node. The environment is episodic and + the goal is to minimize the total travel cost of the technicians. The travel cost depends on the skill-level of + the technician. The environment is defined by the following parameters: + + Observations: + - locations of the depot, pickup, and delivery locations + - current location of the vehicle + - the remaining locations to deliver + - the visited locations + - the current step + + Constraints: + - the tour starts and ends at the depot + - each pickup location must be visited before its corresponding delivery location + - the vehicle cannot visit the same location twice + + Finish Condition: + - the vehicle has visited all locations + + Reward: + - (minus) the negative length of the path + + Args: + generator: PDPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "svrp" + + def __init__( + self, + generator: SVRPGenerator = None, + generator_params: dict = {}, + **kwargs, + ): + super().__init__(**kwargs) + if generator is None: + generator = SVRPGenerator(**generator_params) + self.generator = generator + self.tech_costs = self.generator.tech_costs + self._make_spec(self.generator) + + def _make_spec(self, generator): + """Make the observation and action specs from the parameters.""" + self.observation_spec = Composite( + locs=Bounded( + low=generator.min_loc, + high=generator.max_loc, + shape=(generator.num_loc + 1, 2), + dtype=torch.float32, + ), + current_node=Unbounded( + shape=(1), + dtype=torch.int64, + ), + skills=Bounded( + low=generator.min_skill, + high=generator.max_skill, + 
shape=(generator.num_loc, 1), + dtype=torch.float32, + ), + action_mask=Unbounded( + shape=(generator.num_loc + 1, 1), + dtype=torch.bool, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.num_loc + 1, + ) + self.reward_spec = Unbounded(shape=(1,), dtype=torch.float32) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + @staticmethod + def get_action_mask(td: TensorDict) -> torch.Tensor: + """Calculates the action mask for the Skill-VRP. The action mask is a binary mask that indicates which customer nodes can be services, given the previous decisions. + For the Skill-VRP, a node can be serviced if the technician has the required skill-level and the node has not been visited yet. + The depot cannot be visited if there are still unserved nodes and the technician either just visited the depot or is the last technician + (because every customer node needs to be visited). + """ + batch_size = td["locs"].shape[0] + # check skill level + current_tech_skill = gather_by_index(td["techs"], td["current_tech"]).reshape( + [batch_size, 1] + ) + can_service = td["skills"] <= current_tech_skill.unsqueeze(1).expand_as( + td["skills"] + ) + mask_loc = td["visited"][..., 1:, :].to(can_service.dtype) | ~can_service + # Cannot visit the depot if there are still unserved nodes and I either just visited the depot or am the last technician + mask_depot = ( + (td["current_node"] == 0) | (td["current_tech"] == td["techs"].size(-2) - 1) + ) & ((mask_loc == 0).int().sum(-2) > 0) + return ~torch.cat((mask_depot[..., None], mask_loc), -2).squeeze(-1) + + def _step(self, td: TensorDict) -> torch.Tensor: + """Step function for the Skill-VRP. If a technician returns to the depot, the next technician is sent out. + The visited node is marked as visited. The reward is set to zero and the done flag is set if all nodes have been visited. 
def _reset(
    self, td: Optional[TensorDict] = None, batch_size: Optional[list] = None
) -> TensorDict:
    """Build the initial state from a generated instance.

    The depot is prepended to the customer locations (node 0), the first
    technician starts at the depot and no node is marked as visited.
    """
    device = td.device
    customers = td["locs"]
    num_nodes = customers.shape[-2] + 1  # customers plus the depot

    all_locs = torch.cat((td["depot"][:, None, :], customers), -2)
    start_node = torch.zeros(*batch_size, 1, dtype=torch.long, device=device)
    start_tech = torch.zeros(*batch_size, 1, dtype=torch.long, device=device)
    nothing_visited = torch.zeros(
        (*batch_size, num_nodes, 1), dtype=torch.uint8, device=device
    )

    # Create reset TensorDict
    td_reset = TensorDict(
        {
            "locs": all_locs,
            "techs": td["techs"],
            "skills": td["skills"],
            "current_node": start_node,
            "current_tech": start_tech,
            "visited": nothing_visited,
        },
        batch_size=batch_size,
    )
    td_reset.set("action_mask", self.get_action_mask(td_reset))
    return td_reset
+ The travel cost depends on the skill-level of the technician.""" + # Check that the solution is valid + if self.check_solution: + self.check_solution_validity(td, actions) + + # Gather dataset in order of tour + batch_size = td["locs"].shape[0] + depot = td["locs"][..., 0:1, :] + locs_ordered = torch.cat( + [ + depot, + gather_by_index(td["locs"], actions).reshape( + [batch_size, actions.size(-1), 2] + ), + ], + dim=1, + ) + + # calculate travelling costs depending on the technicians' skill level + costs = torch.zeros(batch_size, locs_ordered.size(-2), device=self.device) + indices = torch.nonzero(actions == 0) + start = tech = 0 + batch = 0 + for each in indices: + if each[0] > batch: + costs[batch, start:] = self.tech_costs[tech] + start = tech = 0 + batch = each[0] + end = ( + each[-1] + 1 + ) # indices in locs_ordered are shifted by one due to added depot in the front + costs[batch, start:end] = self.tech_costs[tech] + tech += 1 + start = end + costs[batch, start:] = self.tech_costs[tech] + + travel_to = torch.roll(locs_ordered, -1, dims=-2) + distances = get_distance(locs_ordered, travel_to) + return -(distances * costs).sum(-1) + + @staticmethod + def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None: + """Check that solution is valid: nodes are not visited twice except depot and required skill levels are always met.""" + batch_size, graph_size = td["skills"].shape[0], td["skills"].shape[1] + sorted_pi = actions.data.sort(1).values + + # Sorting it should give all zeros at front and then 1...n + assert ( + torch.arange(1, graph_size + 1, out=sorted_pi.data.new()) + .view(1, -1) + .expand(batch_size, graph_size) + == sorted_pi[:, -graph_size:] + ).all() and (sorted_pi[:, :-graph_size] == 0).all(), "Invalid tour" + + # make sure all required skill levels are met + indices = torch.nonzero(actions == 0) + skills = torch.cat( + [torch.zeros(batch_size, 1, 1, device=td.device), td["skills"]], 1 + ) + skills_ordered = gather_by_index(skills, 
class SVRPGenerator(Generator):
    """Data generator for the Skill Vehicle Routing Problem (SVRP).

    Args:
        num_loc: number of customer locations (the depot is not counted)
        min_loc: minimum value for the location coordinates
        max_loc: maximum value for the location coordinates
        loc_distribution: distribution for the location coordinates
        depot_distribution: distribution for the depot location. If None, the
            depot is sampled together with the customer locations
        min_skill: lower bound of the technicians' skill levels
        max_skill: upper bound of the technicians' skill levels
        tech_costs: travel cost factor of each technician; its length defines
            the number of technicians. Defaults to ``[1, 2, 3]``

    Returns:
        A TensorDict with the following keys:
            locs [batch_size, num_loc, 2]: locations of each customer
            depot [batch_size, 2]: location of the depot
            techs [batch_size, num_tech, 1]: skill level of each technician,
                sorted in ascending order
            skills [batch_size, num_loc, 1]: skill level required by each customer
    """

    def __init__(
        self,
        num_loc: int = 20,
        min_loc: float = 0.0,
        max_loc: float = 1.0,
        loc_distribution: Union[int, float, str, type, Callable] = Uniform,
        depot_distribution: Union[int, float, str, type, Callable] = None,
        min_skill: float = 1.0,
        max_skill: float = 10.0,
        tech_costs: Union[list, tuple, None] = None,
        **kwargs,
    ):
        # Resolve the default here rather than in the signature so that no
        # mutable list object is shared between generator instances.
        if tech_costs is None:
            tech_costs = [1, 2, 3]

        self.num_loc = num_loc
        self.min_loc = min_loc
        self.max_loc = max_loc
        self.min_skill = min_skill
        self.max_skill = max_skill
        self.num_tech = len(tech_costs)
        self.tech_costs = torch.tensor(tech_costs)

        # Location distribution: an explicit sampler takes precedence
        if kwargs.get("loc_sampler", None) is not None:
            self.loc_sampler = kwargs["loc_sampler"]
        else:
            self.loc_sampler = get_sampler(
                "loc", loc_distribution, min_loc, max_loc, **kwargs
            )

        # Depot distribution: an explicit sampler takes precedence; without
        # any depot distribution the depot is drawn from the location sampler
        if kwargs.get("depot_sampler", None) is not None:
            self.depot_sampler = kwargs["depot_sampler"]
        elif depot_distribution is not None:
            self.depot_sampler = get_sampler(
                "depot", depot_distribution, min_loc, max_loc, **kwargs
            )
        else:
            self.depot_sampler = None

    def _generate(self, batch_size) -> TensorDict:
        """Generate data for the basic Skill-VRP.

        The data consists of the customer locations, the depot, the skill
        levels of the technicians and the skill level each customer requires,
        all drawn randomly within the configured bounds.
        """
        # Sample locations: depot and customers
        if self.depot_sampler is not None:
            depot = self.depot_sampler.sample((*batch_size, 2))
            locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2))
        else:
            # No depot sampler: draw one extra location and use it as depot
            all_locs = self.loc_sampler.sample((*batch_size, self.num_loc + 1, 2))
            depot = all_locs[..., 0, :]
            locs = all_locs[..., 1:, :]

        # Technician skill levels, sorted ascendingly along the technician axis
        techs, _ = torch.sort(
            torch.empty(
                *batch_size, self.num_tech, 1, dtype=torch.float32
            ).uniform_(self.min_skill, self.max_skill),
            dim=-2,
        )

        # Required skills: a random fraction of the best technician's skill,
        # so every customer can be served by at least that technician.
        # dim=-2 (not 1) keeps this valid for multi-dimensional batch sizes.
        skills = torch.empty(
            *batch_size, self.num_loc, 1, dtype=torch.float32
        ).uniform_(0, 1)
        skills = torch.max(techs, dim=-2, keepdim=True).values * skills

        return TensorDict(
            {
                "locs": locs,
                "depot": depot,
                "techs": techs,
                "skills": skills,
            },
            batch_size=batch_size,
        )
if td.batch_size != torch.Size([]): + td = td[0] + actions = actions[0] + + locs = td["locs"] + + # add the depot at the first action and the end action + actions = torch.cat([torch.tensor([0]), actions, torch.tensor([0])]) + + # gather locs in order of action if available + if actions is None: + log.warning("No action in TensorDict, rendering unsorted locs") + else: + locs = locs + + # Cat the first node to the end to complete the tour + x, y = locs[:, 0], locs[:, 1] + + # plot depot + ax.scatter( + locs[0, 0], + locs[0, 1], + edgecolors=cm.Set2(2), + facecolors="none", + s=100, + linewidths=2, + marker="s", + alpha=1, + ) + + # plot visited nodes + ax.scatter( + x[1:], + y[1:], + edgecolors=cm.Set2(0), + facecolors="none", + s=50, + linewidths=2, + marker="o", + alpha=1, + ) + + # text depot + ax.text( + locs[0, 0], + locs[0, 1] - 0.025, + "Depot", + horizontalalignment="center", + verticalalignment="top", + fontsize=10, + color=cm.Set2(2), + ) + + # plot actions + color_idx = 0 + for action_idx in range(len(actions) - 1): + if actions[action_idx] == 0: + color_idx += 1 + from_loc = locs[actions[action_idx]] + to_loc = locs[actions[action_idx + 1]] + ax.plot( + [from_loc[0], to_loc[0]], + [from_loc[1], to_loc[1]], + color=out(color_idx), + lw=1, + ) + ax.annotate( + "", + xy=(to_loc[0], to_loc[1]), + xytext=(from_loc[0], from_loc[1]), + arrowprops=dict(arrowstyle="-|>", color=out(color_idx)), + size=15, + annotation_clip=False, + ) diff --git a/rl4co/envs/routing/tsp/__init__.py b/rl4co/envs/routing/tsp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/routing/tsp/env.py b/rl4co/envs/routing/tsp/env.py new file mode 100644 index 00000000..c1b41769 --- /dev/null +++ b/rl4co/envs/routing/tsp/env.py @@ -0,0 +1,601 @@ +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import ImprovementEnvBase, RL4COEnvBase 
class TSPEnv(RL4COEnvBase):
    """Traveling Salesman Problem (TSP) environment.

    At each step, the agent chooses a city to visit. The per-step reward is
    always 0; the episode reward is computed by ``_get_reward`` as the negative
    tour length, so maximizing the reward minimizes the path length.

    Observations:
        - locations of each customer.
        - the current location of the vehicle.

    Constraints:
        - the tour must return to the starting customer.
        - each customer must be visited exactly once.

    Finish condition:
        - no unvisited customer is left.

    Reward:
        - the negative length of the tour.

    Args:
        generator: TSPGenerator instance as the data generator
        generator_params: parameters for the generator (used only when
            ``generator`` is None)
    """

    name = "tsp"

    def __init__(
        self,
        generator: Optional[TSPGenerator] = None,
        generator_params: Optional[dict] = None,
        **kwargs,
    ):
        super().__init__(**kwargs)
        if generator is None:
            # `None` default instead of a shared mutable `{}`
            generator = TSPGenerator(**(generator_params or {}))
        self.generator = generator
        self._make_spec(self.generator)

    @staticmethod
    def _step(td: TensorDict) -> TensorDict:
        """Visit the chosen node and mark it as unavailable."""
        current_node = td["action"]

        # Exactly equivalent to the former `td["i"].all() == 0` ("not every
        # counter is non-zero"), spelled out so the intent is readable.
        is_first_step = bool((td["i"] == 0).any())
        first_node = current_node if is_first_step else td["first_node"]

        # Set not visited to 0 (i.e., we visited the node)
        available = td["action_mask"].scatter(
            -1, current_node.unsqueeze(-1).expand_as(td["action_mask"]), 0
        )

        # We are done when there are no unvisited locations
        done = torch.sum(available, dim=-1) == 0

        # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here
        reward = torch.zeros_like(done)

        td.update(
            {
                "first_node": first_node,
                "current_node": current_node,
                "i": td["i"] + 1,
                "action_mask": available,
                "reward": reward,
                "done": done,
            },
        )
        return td

    def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict:
        """Build the initial state: nothing visited, step counter at zero."""
        # Initialize locations
        device = td.device
        init_locs = td["locs"]

        # We do not enforce loading from self for flexibility
        num_loc = init_locs.shape[-2]

        # Other variables
        current_node = torch.zeros(batch_size, dtype=torch.int64, device=device)
        available = torch.ones(
            (*batch_size, num_loc), dtype=torch.bool, device=device
        )  # 1 means not visited, i.e. action is allowed
        i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device)
        # Created on `device` like every other entry (it used to be left on
        # the default device).
        reward = torch.zeros((*batch_size, 1), dtype=torch.float32, device=device)

        return TensorDict(
            {
                "locs": init_locs,
                "first_node": current_node,
                "current_node": current_node,
                "i": i,
                "action_mask": available,
                "reward": reward,
            },
            batch_size=batch_size,
        )

    def _make_spec(self, generator: TSPGenerator):
        """Make the observation, action, reward and done specs."""
        self.observation_spec = Composite(
            locs=Bounded(
                low=generator.min_loc,
                high=generator.max_loc,
                shape=(generator.num_loc, 2),
                dtype=torch.float32,
            ),
            first_node=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            current_node=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            i=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            action_mask=Unbounded(
                shape=(generator.num_loc,),
                dtype=torch.bool,
            ),
            shape=(),
        )
        self.action_spec = Bounded(
            shape=(1,),
            dtype=torch.int64,
            low=0,
            high=generator.num_loc,
        )
        self.reward_spec = Unbounded(shape=(1,))
        self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)

    def _get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor:
        """Return the negated tour length of ``actions`` for every instance."""
        if self.check_solution:
            self.check_solution_validity(td, actions)

        # Gather locations in order of tour and return distance between them (i.e., -reward)
        locs_ordered = gather_by_index(td["locs"], actions)
        return -get_tour_length(locs_ordered)

    @staticmethod
    def check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None:
        """Check that solution is valid: nodes are visited exactly once"""
        assert (
            torch.arange(actions.size(1), out=actions.data.new())
            .view(1, -1)
            .expand_as(actions)
            == actions.data.sort(1)[0]
        ).all(), "Invalid tour"

    def replace_selected_actions(
        self,
        cur_actions: torch.Tensor,
        new_actions: torch.Tensor,
        selection_mask: torch.Tensor,
    ) -> torch.Tensor:
        """
        Replace selected current actions with updated actions based on `selection_mask`.

        Note: ``cur_actions`` is modified in place and also returned.

        Args:
            cur_actions [batch_size, num_loc]
            new_actions [batch_size, num_loc]
            selection_mask [batch_size,]
        """
        cur_actions[selection_mask] = new_actions[selection_mask]
        return cur_actions

    @staticmethod
    def local_search(td: TensorDict, actions: torch.Tensor, **kwargs) -> torch.Tensor:
        """Improve ``actions`` with the optional ``local_search`` module."""
        assert (
            local_search is not None
        ), "Cannot import local_search module. Check if `numba` is installed."
        return local_search(td, actions, **kwargs)

    @staticmethod
    def render(td: TensorDict, actions: torch.Tensor = None, ax=None):
        """Plot the tour; thin wrapper around the module-level ``render``."""
        return render(td, actions, ax)
def __init__(
    self,
    generator: Optional[TSPGenerator] = None,
    generator_params: Optional[dict] = None,
    k_max: int = 2,
    **kwargs,
):
    """Create the k-opt improvement environment.

    Args:
        generator: data generator; built from ``generator_params`` when None.
        generator_params: keyword arguments for ``TSPGenerator``; only used
            when ``generator`` is None. ``None`` means "no parameters".
        k_max: maximum k of the k-opt move; ``k_max == 2`` switches the
            environment into two-opt mode.
        **kwargs: forwarded unchanged to the base environment constructor.
    """
    super().__init__(**kwargs)
    if generator is None:
        # `None` default instead of a shared mutable `{}`
        generator = TSPGenerator(**(generator_params or {}))
    self.generator = generator
    self.k_max = k_max
    self.two_opt_mode = k_max == 2
    self._make_spec(self.generator)
def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict:
    """Create the initial improvement state from a generated instance.

    An initial solution is requested from the generator; it is stored both as
    the current and as the best-so-far solution, together with its cost and
    the visiting order of every node.
    """
    device = td.device
    locs = td["locs"]

    initial_rec = self.generator._get_initial_solutions(locs).to(device)
    initial_cost = self.get_costs(locs, initial_rec)

    # Walk the linked-list solution starting at node 0 and record, for every
    # node, the (1-based) position at which it is reached.
    num_instances = batch_size[0]
    tour_len = self.generator.num_loc
    visited_time = torch.zeros((num_instances, tour_len)).to(device)
    cursor = torch.zeros((num_instances)).to(device).long()
    rows = torch.arange(num_instances)
    for position in range(1, tour_len + 1):
        reached = initial_rec[rows, cursor]
        visited_time[rows, reached] = position
        cursor = reached
    visited_time = visited_time.long()

    step_counter = torch.zeros((*batch_size, 1), dtype=torch.int64).to(device)

    state = {
        "locs": locs,
        "cost_current": initial_cost,
        "cost_bsf": initial_cost.clone(),
        "rec_current": initial_rec,
        "rec_best": initial_rec.clone(),
        "visited_time": visited_time,
        "i": step_counter,
    }
    return TensorDict(state, batch_size=batch_size)
def _make_spec(self, generator: TSPGenerator):
    """Declare the observation, action, reward and done specs of the env."""
    observation_entries = {
        "locs": Bounded(
            low=generator.min_loc,
            high=generator.max_loc,
            shape=(generator.num_loc, 2),
            dtype=torch.float32,
        ),
        "cost_current": Unbounded(shape=(1), dtype=torch.float32),
        "cost_bsf": Unbounded(shape=(1), dtype=torch.float32),
        "rec_current": Unbounded(
            shape=(self.generator.num_loc), dtype=torch.int64
        ),
        "rec_best": Unbounded(
            shape=(self.generator.num_loc), dtype=torch.int64
        ),
        # NOTE(review): `_reset` builds `visited_time` as (batch, num_loc);
        # a (num_loc, num_loc) spec looks inconsistent with that - confirm.
        "visited_time": Unbounded(
            shape=(self.generator.num_loc, self.generator.num_loc),
            dtype=torch.int64,
        ),
        "i": Unbounded(shape=(1), dtype=torch.int64),
    }
    self.observation_spec = Composite(**observation_entries, shape=())

    # One action holds 3 * k_max node indices.
    self.action_spec = Bounded(
        shape=(self.k_max * 3,),
        dtype=torch.int64,
        low=0,
        high=self.generator.num_loc,
    )
    self.reward_spec = Unbounded(shape=(1,))
    self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)
def get_mask(self, td):
    """Return the feasibility mask for two-opt actions.

    Args:
        td: state providing ``"visited_time"`` of shape [batch, num_loc] and
            a ``device`` attribute.

    Returns:
        Boolean tensor [batch, num_loc, num_loc] that is True where the pair
        (first, second) is a feasible action, i.e. everywhere except on the
        diagonal (a node cannot be paired with itself).

    Raises:
        AssertionError: when the environment is not in two-opt mode; the
            masks for NeuOpt are produced by its policy instead.
    """
    visited_time = td["visited_time"]
    bs, gs = visited_time.size()
    if not self.two_opt_mode:
        # Raised explicitly: `assert False` disappears under `python -O`,
        # which would make this method silently return None.
        raise AssertionError("The masks for NeuOpt are handled within its policy")

    # Build the diagonal directly on the target device.
    diagonal = torch.eye(gs, device=td.device).bool()
    return ~diagonal.view(1, gs, gs).expand(bs, gs, gs)
class DenseRewardTSPEnv(TSPEnv):
    """
    This is an experimental version of the TSPEnv to be used with stepwise PPO. That is
    this environment defines a stepwise reward function for the TSP which is the distance added
    to the current tour by the given action.
    """

    def __init__(
        self,
        generator: Optional[TSPGenerator] = None,
        generator_params: Optional[dict] = None,
        **kwargs,
    ):
        """Create the env with solution checking off and torchrl mode on.

        ``check_solution`` and ``_torchrl_mode`` are fixed here and must not
        be passed again through ``kwargs``.
        """
        super().__init__(
            generator,
            # `None` default instead of a shared mutable `{}`; the parent
            # always receives a dict.
            {} if generator_params is None else generator_params,
            check_solution=False,
            _torchrl_mode=True,
            **kwargs,
        )

    def _step(self, td):
        """Visit the chosen node; the step reward is the distance travelled."""
        last_node = td["current_node"].clone()
        current_node = td["action"]

        # Exactly equivalent to the former `td["i"].all() == 0`.
        is_first_step = bool((td["i"] == 0).any())
        first_node = current_node if is_first_step else td["first_node"]

        # Set not visited to 0 (i.e., we visited the node)
        available = td["action_mask"].scatter(
            -1, current_node.unsqueeze(-1).expand_as(td["action_mask"]), 0
        )

        # We are done when there are no unvisited locations
        done = torch.sum(available, dim=-1) == 0

        # calc stepwise reward: distance from the previous to the chosen node
        last_node_loc = gather_by_index(td["locs"], last_node)
        curr_node_loc = gather_by_index(td["locs"], current_node)
        reward = get_distance(last_node_loc, curr_node_loc)[:, None]

        td.update(
            {
                "first_node": first_node,
                "current_node": current_node,
                "i": td["i"] + 1,
                "action_mask": available,
                "reward": reward,
                "done": done,
            },
        )
        return td

    def _get_reward(self, td, actions=None) -> torch.Tensor:
        """Return the negated tour length, or the negated stored step reward.

        With ``actions`` the reward is computed from the full tour; without
        them the negated ``td["reward"]`` is returned.
        """
        if actions is not None:
            # Gather locations in order of tour and return distance between them (i.e., -reward)
            locs_ordered = gather_by_index(td["locs"], actions)
            return -get_tour_length(locs_ordered)
        return -td["reward"]
TSPGenerator(Generator): + """Data generator for the Travelling Salesman Problem (TSP). + + Args: + num_loc: number of locations (customers) in the TSP + min_loc: minimum value for the location coordinates + max_loc: maximum value for the location coordinates + init_sol_type: the method type used for generating initial solutions (random or greedy) + loc_distribution: distribution for the location coordinates + + Returns: + A TensorDict with the following keys: + locs [batch_size, num_loc, 2]: locations of each customer + """ + + def __init__( + self, + num_loc: int = 20, + min_loc: float = 0.0, + max_loc: float = 1.0, + init_sol_type: str = "random", + loc_distribution: Union[int, float, str, type, Callable] = Uniform, + **kwargs, + ): + self.num_loc = num_loc + self.min_loc = min_loc + self.max_loc = max_loc + self.init_sol_type = init_sol_type + + # Location distribution + if kwargs.get("loc_sampler", None) is not None: + self.loc_sampler = kwargs["loc_sampler"] + else: + self.loc_sampler = get_sampler( + "loc", loc_distribution, min_loc, max_loc, **kwargs + ) + + def _generate(self, batch_size) -> TensorDict: + # Sample locations + locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2)) + + return TensorDict( + { + "locs": locs, + }, + batch_size=batch_size, + ) + + # for improvement MDP only (to be refactored by a combination of rollout and the random policy) + def _get_initial_solutions(self, coordinates): + batch_size = coordinates.size(0) + + if self.init_sol_type == "random": + set = torch.rand(batch_size, self.num_loc).argsort().long() + rec = torch.zeros(batch_size, self.num_loc).long() + index = torch.zeros(batch_size, 1).long() + + for i in range(self.num_loc - 1): + rec.scatter_(1, set.gather(1, index + i), set.gather(1, index + i + 1)) + + rec.scatter_(1, set[:, -1].view(-1, 1), set.gather(1, index)) + + elif self.init_sol_type == "greedy": + candidates = torch.ones(batch_size, self.num_loc).bool() + rec = torch.zeros(batch_size, 
self.num_loc).long() + selected_node = torch.zeros(batch_size, 1).long() + candidates.scatter_(1, selected_node, 0) + + for i in range(self.num_loc - 1): + d1 = coordinates.cpu().gather( + 1, selected_node.unsqueeze(-1).expand(batch_size, self.num_loc, 2) + ) + d2 = coordinates.cpu() + + dists = (d1 - d2).norm(p=2, dim=2) + dists[~candidates] = 1e5 + + next_selected_node = dists.min(-1)[1].view(-1, 1) + rec.scatter_(1, selected_node, next_selected_node) + candidates.scatter_(1, next_selected_node, 0) + selected_node = next_selected_node + + else: + raise NotImplementedError() + + return rec.expand(batch_size, self.num_loc).clone() diff --git a/rl4co/envs/routing/tsp/local_search.py b/rl4co/envs/routing/tsp/local_search.py new file mode 100644 index 00000000..a8bd2908 --- /dev/null +++ b/rl4co/envs/routing/tsp/local_search.py @@ -0,0 +1,74 @@ +import concurrent.futures + +import numpy as np +import numba as nb +import torch +from tensordict.tensordict import TensorDict + +from rl4co.utils.ops import get_distance_matrix +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def local_search(td: TensorDict, actions: torch.Tensor, max_iterations: int = 1000) -> torch.Tensor: + """ + Improve the solution using local search, especially 2-opt for TSP. 
@nb.njit(nb.float32(nb.float32[:,:], nb.uint16[:], nb.uint16), nogil=True)
def two_opt_once(distmat, tour, fixed_i = 0):
    '''Apply the single best 2-opt move to ``tour`` (in-place operation).

    Every candidate segment ``tour[i..j]`` is scored by the change in length
    that reversing it would cause, looking only at the two edges entering and
    leaving the segment. The most improving segment is reversed in place.

    Args:
        distmat: square distance matrix indexed by node id.
        tour: node ids in visiting order; modified in place.
        fixed_i: 0 scans every start position ``1 .. n-2``; any other value
            restricts the scan to that single start position.

    Returns:
        The (negative) length change of the applied move, or 0.0 when no move
        improves the tour by more than 1e-6 (``tour`` is then left untouched).
    '''
    n = tour.shape[0]
    p = q = 0
    delta = 0  # best (most negative) change found so far
    for i in range(1, n - 1) if fixed_i==0 else range(fixed_i, fixed_i + 1):
        for j in range(i + 1, n):
            node_i, node_j = tour[i], tour[j]
            # the successor wraps around because the tour is closed
            node_prev, node_next = tour[i - 1], tour[(j + 1) % n]
            # skip segments whose two boundary edges share a node
            if node_prev == node_j or node_next == node_i:
                continue
            # new edges (prev->j, i->next) minus removed edges (prev->i, j->next)
            change = (
                distmat[node_prev, node_j] + distmat[node_i, node_next]
                - distmat[node_prev, node_i] - distmat[node_j, node_next]
            )
            if change < delta:
                p, q, delta = i, j, change
    if delta < -1e-6:
        # reversing the segment realises the best move found
        tour[p: q + 1] = np.flip(tour[p: q + 1])
        return delta
    else:
        return 0.0
iterations < max_iterations: + min_change = two_opt_once(distmat, tour, 0) + iterations += 1 + return tour diff --git a/rl4co/envs/routing/tsp/render.py b/rl4co/envs/routing/tsp/render.py new file mode 100644 index 00000000..5f703f90 --- /dev/null +++ b/rl4co/envs/routing/tsp/render.py @@ -0,0 +1,110 @@ +import matplotlib.pyplot as plt +import numpy as np +import torch + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(td, actions=None, ax=None): + if ax is None: + # Create a plot of the nodes + _, ax = plt.subplots() + + td = td.detach().cpu() + + if actions is None: + actions = td.get("action", None) + + # If batch_size greater than 0 , we need to select the first batch element + if td.batch_size != torch.Size([]): + td = td[0] + actions = actions[0] + + locs = td["locs"] + + # Gather locs in order of action if available + if actions is None: + log.warning("No action in TensorDict, rendering unsorted locs") + else: + actions = actions.detach().cpu() + locs = gather_by_index(locs, actions, dim=0) + + # Cat the first node to the end to complete the tour + locs = torch.cat((locs, locs[0:1])) + x, y = locs[:, 0], locs[:, 1] + + # Plot the visited nodes + ax.scatter(x, y, color="tab:blue") + + # Add arrows between visited nodes as a quiver plot + dx, dy = np.diff(x), np.diff(y) + ax.quiver(x[:-1], y[:-1], dx, dy, scale_units="xy", angles="xy", scale=1, color="k") + + # Setup limits and show + ax.set_xlim(-0.05, 1.05) + ax.set_ylim(-0.05, 1.05) + + +def render_improvement(td, current_soltuion, best_soltuion): + coordinates = td["locs"][0] + real_seq = current_soltuion[:1] + real_best = best_soltuion[:1] + fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(16, 6)) # Create two side-by-side axes + + for ax in [ax1, ax2]: # Plot on both axes + if ax == ax1: + ax.axis([-0.05, 1.05] * 2) + # plot the nodes + ax.scatter( + coordinates[:, 0], coordinates[:, 1], marker="H", s=55, c="blue", 
zorder=2 + ) + # plot the tour + real_seq_coordinates = coordinates.gather( + 0, real_seq[0].unsqueeze(1).repeat(1, 2) + ) + real_seq_coordinates = torch.cat( + (real_seq_coordinates, real_seq_coordinates[:1]), 0 + ) + ax.plot( + real_seq_coordinates[:, 0], + real_seq_coordinates[:, 1], + color="black", + zorder=1, + ) + # mark node + for i, txt in enumerate(range(real_seq.size(1))): + ax.annotate( + txt, + (coordinates[i, 0] + 0.01, coordinates[i, 1] + 0.01), + ) + ax.set_title("Current Solution") + else: + ax.axis([-0.05, 1.05] * 2) + # plot the nodes + ax.scatter( + coordinates[:, 0], coordinates[:, 1], marker="H", s=55, c="blue", zorder=2 + ) + # plot the tour + real_best_coordinates = coordinates.gather( + 0, real_best[0].unsqueeze(1).repeat(1, 2) + ) + real_best_coordinates = torch.cat( + (real_best_coordinates, real_best_coordinates[:1]), 0 + ) + ax.plot( + real_best_coordinates[:, 0], + real_best_coordinates[:, 1], + color="black", + zorder=1, + ) + # mark node + for i, txt in enumerate(range(real_seq.size(1))): + ax.annotate( + txt, + (coordinates[i, 0] + 0.01, coordinates[i, 1] + 0.01), + ) + ax.set_title("Best Solution") + plt.tight_layout() diff --git a/rl4co/envs/scheduling/__init__.py b/rl4co/envs/scheduling/__init__.py new file mode 100644 index 00000000..febb183c --- /dev/null +++ b/rl4co/envs/scheduling/__init__.py @@ -0,0 +1,4 @@ +from .ffsp.env import FFSPEnv +from .fjsp.env import FJSPEnv +from .jssp.env import JSSPEnv +from .smtwtp.env import SMTWTPEnv diff --git a/rl4co/envs/scheduling/ffsp/__init__.py b/rl4co/envs/scheduling/ffsp/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/envs/scheduling/ffsp/env.py b/rl4co/envs/scheduling/ffsp/env.py new file mode 100644 index 00000000..26191053 --- /dev/null +++ b/rl4co/envs/scheduling/ffsp/env.py @@ -0,0 +1,453 @@ +import itertools + +from math import factorial +from typing import Optional + +import torch + +from tensordict.tensordict import TensorDict +from torchrl.data 
import Bounded, Composite, Unbounded + +from rl4co.data.dataset import FastTdDataset +from rl4co.envs.common.base import RL4COEnvBase + +from .generator import FFSPGenerator + + +class FFSPEnv(RL4COEnvBase): + """Flexible Flow Shop Problem (FFSP) environment. + The goal is to schedule a set of jobs on a set of machines such that the makespan is minimized. + + Observations: + - time index + - sub time index + - batch index + - machine index + - schedule + - machine wait step + - job location + - job wait step + - job duration + + Constraints: + - each job has to be processed on each machine in a specific order + - the machine has to be available to process the job + - the job has to be available to be processed + + Finish Condition: + - all jobs are scheduled + + Reward: + - (minus) the makespan of the schedule + + Args: + generator: FFSPGenerator instance as the data generator + generator_params: parameters for the generator + """ + + name = "ffsp" + + def __init__( + self, + generator: FFSPGenerator = None, + generator_params: dict = {}, + **kwargs, + ): + super().__init__(check_solution=False, dataset_cls=FastTdDataset, **kwargs) + if generator is None: + generator = FFSPGenerator(**generator_params) + self.generator = generator + + self.num_stage = generator.num_stage + self.num_machine = generator.num_machine + self.num_job = generator.num_job + self.num_machine_total = generator.num_machine_total + self.tables = None + self.step_cnt = None + self.flatten_stages = generator.flatten_stages + + self._make_spec(generator) + + def get_num_starts(self, td): + return factorial(self.num_machine) + + def select_start_nodes(self, td, num_starts): + self.tables.augment_machine_tables(num_starts) + selected = torch.full((num_starts * td.size(0),), self.num_job) + return selected + + def _move_to_next_machine(self, td): + batch_size = td.batch_size + batch_idx = torch.arange(*batch_size, dtype=torch.long, device=td.device) + + time_idx = td["time_idx"] + machine_idx = 
td["machine_idx"] + sub_time_idx = td["sub_time_idx"] + + machine_wait_step = td["machine_wait_step"] + job_wait_step = td["job_wait_step"] + job_location = td["job_location"] + + ready = torch.flatten(td["done"]) + idx = torch.flatten(batch_idx) + # select minibatch instances that need updates (are not done) + idx = idx[~ready] + + while ~ready.all(): + # increment the stage-machine counter + new_sub_time_idx = sub_time_idx[idx] + 1 + # increment time if all machines-stage combinations have been candidates + step_time_required = new_sub_time_idx == self.num_machine_total + time_idx[idx] += step_time_required.long() + # in this case set the machine-stage counter to zero again + new_sub_time_idx[step_time_required] = 0 + # update machine-stage counter + sub_time_idx[idx] = new_sub_time_idx + # determine current machine candidate + new_machine_idx = self.tables.get_machine_index(idx, new_sub_time_idx) + machine_idx[idx] = new_machine_idx + + # decrease machine wait time by 1 if instance transitioned to new time step + machine_wait_steps = machine_wait_step[idx, :] + machine_wait_steps[step_time_required, :] -= 1 + machine_wait_steps[machine_wait_steps < 0] = 0 + machine_wait_step[idx, :] = machine_wait_steps + + # decrease job wait time by 1 if instance transitioned to new time step + job_wait_steps = job_wait_step[idx, :] + job_wait_steps[step_time_required, :] -= 1 + job_wait_steps[job_wait_steps < 0] = 0 + job_wait_step[idx, :] = job_wait_steps + # machine is ready if its wait time is zero + machine_ready = machine_wait_step[idx, new_machine_idx] == 0 + # job is ready if the current stage matches the stage of the job and + # its wait time is zero (no operation of previous stage is in process) + new_stage_idx = self.tables.get_stage_index(new_sub_time_idx) + job_ready_1 = job_location[idx, : self.num_job] == new_stage_idx[:, None] + job_ready_2 = job_wait_step[idx, : self.num_job] == 0 + job_ready = (job_ready_1 & job_ready_2).any(dim=-1) + # instance ready if at 
least one job and the current machine are ready + ready = machine_ready & job_ready + assert ready.shape == idx.shape + idx = idx[~ready] + + return td.update( + { + "time_idx": time_idx, + "sub_time_idx": sub_time_idx, + "machine_idx": machine_idx, + "machine_wait_step": machine_wait_step, + "job_wait_step": job_wait_step, + } + ) + + def pre_step(self, td: TensorDict) -> TensorDict: + batch_size = td.batch_size + batch_idx = torch.arange(*batch_size, dtype=torch.long, device=td.device) + sub_time_idx = td["sub_time_idx"] + # update machine index + td["machine_idx"] = self.tables.get_machine_index(batch_idx, sub_time_idx) + # update action mask and stage machine indx + td = self._update_step_state(td) + # perform some checks + assert (td["stage_idx"] == 0).all(), "call pre_step only at beginning of env" + assert torch.all(td["stage_machine_idx"] == td["machine_idx"]) + # return updated td + return td + + def _update_step_state(self, td): + batch_size = td.batch_size + batch_idx = torch.arange(*batch_size, dtype=torch.long, device=td.device) + + sub_time_idx = td["sub_time_idx"] + job_location = td["job_location"] + job_wait_step = td["job_wait_step"] + if len(td["done"].shape) == 2: + done = td["done"].squeeze(1) + else: + done = td["done"] + + # update stage + stage_idx = self.tables.get_stage_index(sub_time_idx) + stage_machine_idx = self.tables.get_stage_machine_index(batch_idx, sub_time_idx) + + job_loc = job_location[:, : self.num_job] + job_wait_time = job_wait_step[:, : self.num_job] + # determine if job can be scheduled in current stage + # (i.e. previous stages are completed) + job_in_stage = job_loc == stage_idx[:, None] + job_not_waiting = job_wait_time == 0 + # job can be scheduled if in current stage and not waiting + job_available = job_in_stage & job_not_waiting + # determine instance for which waiting is allowed. This is the case if either + # 1.) any of its jobs need to be scheduled in a previous stage, + # 2.) 
any of the jobs wait for an operation of the preceeding stage to finish + # 3.) the instance is done. + job_in_previous_stages = (job_loc < stage_idx[:, None]).any(dim=-1) + job_waiting_in_stage = (job_in_stage & (job_wait_time > 0)).any(dim=-1) + wait_allowed = job_in_previous_stages + job_waiting_in_stage + done + + job_enable = torch.cat((job_available, wait_allowed[:, None]), dim=-1) + job_mask = torch.full_like(td["action_mask"], 0).masked_fill(job_enable, 1) + assert torch.logical_or((job_mask[:, :-1].sum(1) > 0), done).all() + return td.update( + { + "action_mask": job_mask, + "stage_idx": stage_idx, + "stage_machine_idx": stage_machine_idx, + } + ) + + def _step(self, td: TensorDict) -> TensorDict: + self.step_cnt += 1 + batch_size = td.batch_size + batch_idx = torch.arange(*batch_size, dtype=torch.long, device=td.device) + + # job_idx is the action from the model + job_idx = td["action"] + time_idx = td["time_idx"] + machine_idx = td["machine_idx"] + + # increment the operation counter of the selected job + td["job_location"][batch_idx, job_idx] += 1 + # td["job_location"][:, :-1].clip_(0, self.num_stage) + # assert (td["job_location"][:, : self.num_job] <= self.num_stage).all() + # insert start time of the selected job in the schedule + td["schedule"][batch_idx, machine_idx, job_idx] = time_idx + # get the duration of the selected job + job_length = td["job_duration"][batch_idx, job_idx, machine_idx] + # set the number of time steps until the selected machine is available again + td["machine_wait_step"][batch_idx, machine_idx] = job_length + + # set the number of time steps until the next operation of the job can be started + td["job_wait_step"][batch_idx, job_idx] = job_length + # determine whether all jobs are scheduled + td["done"] = (td["job_location"][:, : self.num_job] == self.num_stage).all(dim=-1) + + if td["done"].all(): + pass + else: + td = self._move_to_next_machine(td) + td = self._update_step_state(td) + + if td["done"].all(): + # determine 
end times of ops by adding the durations to their start times + end_schedule = td["schedule"] + td["job_duration"].permute(0, 2, 1) + # exclude dummy job and determine the makespan per job + end_time_max, _ = end_schedule[:, :, : self.num_job].max(dim=-1) + # determine the max makespan of all jobs + end_time_max, _ = end_time_max.max(dim=-1) + reward = -end_time_max.to(torch.float32) + td.set("reward", reward) + + return td + + def _reset( + self, td: Optional[TensorDict] = None, batch_size: Optional[list] = None + ) -> TensorDict: + """ + Args: + + Returns: + - stage_table [batch_size, num_stage * num_machine] + - machine_table [batch_size, num_machine * num_stage] + - stage_machine_idx [batch_size, num_stage * num_machine] + - time_idx [batch_size] + - sub_time_idx [batch_size] + - batch_idx [batch_size] + - machine_idx [batch_size] + - schedule [batch_size, num_machine_total, num_job+1] + - machine_wait_step [batch_size, num_machine_total] + - job_location [batch_size, num_job+1] + - job_wait_step [batch_size, num_job+1] + - job_duration [batch_size, num_job+1, num_machine * num_stage] + """ + device = td.device + + self.step_cnt = 0 + self.tables = IndexTables(self) + # reset tables to undo the augmentation + # self.tables._reset(device=self.device) + self.tables.set_bs(batch_size[0]) + + # Init index record tensor + time_idx = torch.zeros(size=(*batch_size,), dtype=torch.long, device=device) + sub_time_idx = torch.zeros(size=(*batch_size,), dtype=torch.long, device=device) + + # Scheduling status information + schedule = torch.full( + size=(*batch_size, self.num_machine_total, self.num_job + 1), + dtype=torch.long, + device=device, + fill_value=-999999, + ) + machine_wait_step = torch.zeros( + size=(*batch_size, self.num_machine_total), + dtype=torch.long, + device=device, + ) + job_location = torch.zeros( + size=(*batch_size, self.num_job + 1), + dtype=torch.long, + device=device, + ) + job_wait_step = torch.zeros( + size=(*batch_size, self.num_job + 1), + 
dtype=torch.long, + device=device, + ) + job_duration = torch.empty( + size=(*batch_size, self.num_job + 1, self.num_machine * self.num_stage), + dtype=torch.long, + device=device, + ) + job_duration[..., : self.num_job, :] = td["run_time"] + job_duration[..., self.num_job, :] = 0 + + # Finish status information + reward = torch.full( + size=(*batch_size,), + dtype=torch.float32, + device=device, + fill_value=float("-inf"), + ) + done = torch.full( + size=(*batch_size,), + dtype=torch.bool, + device=device, + fill_value=False, + ) + + action_mask = torch.ones( + size=(*batch_size, self.num_job + 1), dtype=bool, device=device + ) + action_mask[..., -1] = 0 + + batch_idx = torch.arange(*batch_size, dtype=torch.long, device=td.device) + stage_idx = self.tables.get_stage_index(sub_time_idx) + machine_idx = self.tables.get_machine_index(batch_idx, sub_time_idx) + stage_machine_idx = self.tables.get_stage_machine_index(batch_idx, sub_time_idx) + + return TensorDict( + { + # Index information + "stage_idx": stage_idx, + "time_idx": time_idx, + "sub_time_idx": sub_time_idx, + "machine_idx": machine_idx, + "stage_machine_idx": stage_machine_idx, + # Scheduling status information + "schedule": schedule, + "machine_wait_step": machine_wait_step, + "job_location": job_location, + "job_wait_step": job_wait_step, + "job_duration": job_duration, + # Finish status information + "reward": reward, + "done": done, + "action_mask": action_mask, + }, + batch_size=batch_size, + ) + + def _make_spec(self, generator: FFSPGenerator): + self.observation_spec = Composite( + time_idx=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + sub_time_idx=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + batch_idx=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + machine_idx=Unbounded( + shape=(1,), + dtype=torch.int64, + ), + schedule=Unbounded( + shape=(generator.num_machine_total, generator.num_job + 1), + dtype=torch.int64, + ), + machine_wait_step=Unbounded( + 
shape=(generator.num_machine_total), + dtype=torch.int64, + ), + job_location=Unbounded( + shape=(generator.num_job + 1), + dtype=torch.int64, + ), + job_wait_step=Unbounded( + shape=(generator.num_job + 1), + dtype=torch.int64, + ), + job_duration=Unbounded( + shape=( + generator.num_job + 1, + generator.num_machine * generator.num_stage, + ), + dtype=torch.int64, + ), + shape=(), + ) + self.action_spec = Bounded( + shape=(1,), + dtype=torch.int64, + low=0, + high=generator.num_machine_total, + ) + self.reward_spec = Unbounded(shape=(1,)) + self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) + + def _get_reward(self, td, actions) -> TensorDict: + return td["reward"] + + +class IndexTables: + def __init__(self, env: FFSPEnv): + self.stage_table = torch.arange( + env.num_stage, dtype=torch.long, device=env.device + ).repeat_interleave(env.num_machine) + + # determine the increment of machine ids between stages, i.e. [0,4,8] + # for instances with 4 machines and three stages + start_sub_ids = torch.tensor( + list(range(0, env.num_machine * env.num_stage, env.num_machine)), + dtype=torch.long, + device=env.device, + ).repeat_interleave(env.num_machine) + # generate all possible permutations of the machine ids and add the stage increment to it + # (num_permutations, total_machines) + permutations = torch.tensor( + list(itertools.permutations(list(range(env.num_machine)))), + dtype=torch.long, + device=env.device, + ).repeat(1, env.num_stage) + self.machine_table = permutations + start_sub_ids[None] + + if env.flatten_stages: + # when flatting stages, every machine in each stage is treated as a distinct entity (no shared embeddings) + # Therefore, all machine need a unique index which is the same as the machine table + self.stage_machine_table = self.machine_table + else: + # when we do not flatten the stages, machines of different stages with the same subtime index + # share an embedding. In this case, they need the same index (i.e. 
leave out the stage increment) + self.stage_machine_table = permutations + + def set_bs(self, bs): + self.bs = bs + + def get_stage_index(self, sub_time_idx): + return self.stage_table[sub_time_idx] + + def get_machine_index(self, idx, sub_time_idx): + pomo_idx = idx // self.bs + + return self.machine_table[pomo_idx, sub_time_idx] + + def get_stage_machine_index(self, idx, sub_time_idx): + pomo_idx = idx // self.bs + return self.stage_machine_table[pomo_idx, sub_time_idx] diff --git a/rl4co/envs/scheduling/ffsp/generator.py b/rl4co/envs/scheduling/ffsp/generator.py new file mode 100644 index 00000000..6b33b8b1 --- /dev/null +++ b/rl4co/envs/scheduling/ffsp/generator.py @@ -0,0 +1,65 @@ +import torch + +from tensordict.tensordict import TensorDict + +from rl4co.envs.common.utils import Generator +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class FFSPGenerator(Generator): + """Data generator for the Flow Shop Scheduling Problem (FFSP). + + Args: + num_stage: number of stages + num_machine: number of machines + num_job: number of jobs + min_time: minimum running time of each job on each machine + max_time: maximum running time of each job on each machine + flatten_stages: whether to flatten the stages + + Returns: + A TensorDict with the following key: + run_time [batch_size, num_job, num_machine, num_stage]: running time of each job on each machine + + Note: + - [IMPORTANT] This version of ffsp requires the number of machines in each stage to be the same + """ + + def __init__( + self, + num_stage: int = 2, + num_machine: int = 3, + num_job: int = 4, + min_time: int = 2, + max_time: int = 10, + flatten_stages: bool = True, + **unused_kwargs, + ): + self.num_stage = num_stage + self.num_machine = num_machine + self.num_machine_total = num_machine * num_stage + self.num_job = num_job + self.min_time = min_time + self.max_time = max_time + self.flatten_stages = flatten_stages + + # FFSP environment doen't have any other kwargs + if 
len(unused_kwargs) > 0: + log.error(f"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}") + + def _generate(self, batch_size) -> TensorDict: + # Init observation: running time of each job on each machine + run_time = torch.randint( + low=self.min_time, + high=self.max_time, + size=(*batch_size, self.num_job, self.num_machine_total), + ) + + return TensorDict( + { + "run_time": run_time, + }, + batch_size=batch_size, + ) diff --git a/rl4co/envs/scheduling/ffsp/render.py b/rl4co/envs/scheduling/ffsp/render.py new file mode 100644 index 00000000..992f3ad4 --- /dev/null +++ b/rl4co/envs/scheduling/ffsp/render.py @@ -0,0 +1,72 @@ +import torch +import numpy as np +import matplotlib.pyplot as plt + +from matplotlib import cm, colormaps +from tensordict.tensordict import TensorDict + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(td: TensorDict, idx: int): + import matplotlib.patches as patches + import matplotlib.pyplot as plt + + # TODO: fix this render function parameters + num_machine_total = td["num_machine_total"][idx].item() + num_job = td["num_job"][idx].item() + + job_durations = td["job_duration"][idx, :, :] + # shape: (job, machine) + schedule = td["schedule"][idx, :, :] + # shape: (machine, job) + + total_machine_cnt = num_machine_total + makespan = -td["reward"][idx].item() + + # Create figure and axes + fig, ax = plt.subplots(figsize=(makespan / 3, 5)) + cmap = _get_cmap(num_job) + + plt.xlim(0, makespan) + plt.ylim(0, total_machine_cnt) + ax.invert_yaxis() + + plt.plot([0, makespan], [4, 4], "black") + plt.plot([0, makespan], [8, 8], "black") + + for machine_idx in range(total_machine_cnt): + duration = job_durations[:, machine_idx] + # shape: (job) + machine_schedule = schedule[machine_idx, :] + # shape: (job) + + for job_idx in range(num_job): + job_length = duration[job_idx].item() + job_start_time = machine_schedule[job_idx].item() + if job_start_time >= 
0: + # Create a Rectangle patch + rect = patches.Rectangle( + (job_start_time, machine_idx), + job_length, + 1, + facecolor=cmap(job_idx), + ) + ax.add_patch(rect) + + ax.grid() + ax.set_axisbelow(True) + plt.show() + +def _get_cmap(color_cnt): + from random import shuffle + + from matplotlib.colors import CSS4_COLORS, ListedColormap + + color_list = list(CSS4_COLORS.keys()) + shuffle(color_list) + cmap = ListedColormap(color_list, N=color_cnt) + return cmap diff --git a/rl4co/envs/scheduling/fjsp/__init__.py b/rl4co/envs/scheduling/fjsp/__init__.py new file mode 100644 index 00000000..4eb6d9df --- /dev/null +++ b/rl4co/envs/scheduling/fjsp/__init__.py @@ -0,0 +1,2 @@ +NO_OP_ID = -1 +INIT_FINISH = 9999.0 diff --git a/rl4co/envs/scheduling/fjsp/env.py b/rl4co/envs/scheduling/fjsp/env.py new file mode 100644 index 00000000..060991b7 --- /dev/null +++ b/rl4co/envs/scheduling/fjsp/env.py @@ -0,0 +1,503 @@ +import torch + +from einops import rearrange, reduce +from tensordict.tensordict import TensorDict +from torchrl.data import Bounded, Composite, Unbounded + +from rl4co.envs.common.base import RL4COEnvBase as EnvBase +from rl4co.utils.ops import gather_by_index, sample_n_random_actions + +from . import INIT_FINISH, NO_OP_ID +from .generator import FJSPFileGenerator, FJSPGenerator +from .render import render +from .utils import calc_lower_bound, get_job_ops_mapping, op_is_ready + + +class FJSPEnv(EnvBase): + """Flexible Job-Shop Scheduling Problem (FJSP) environment + At each step, the agent chooses a job-machine combination. The operation to be processed next for the selected job is + then executed on the selected machine. The reward is 0 unless the agent scheduled all operations of all jobs. + In that case, the reward is (-)makespan of the schedule: maximizing the reward is equivalent to minimizing the makespan. 
+ + Observations: + - time: current time + - next_op: next operation per job + - proc_times: processing time of operation-machine pairs + - pad_mask: specifies padded operations + - start_op_per_job: id of first operation per job + - end_op_per_job: id of last operation per job + - start_times: start time of operation (defaults to 0 if not scheduled) + - finish_times: finish time of operation (defaults to INIT_FINISH if not scheduled) + - job_ops_adj: adjacency matrix specifying job-operation affiliation + - ops_job_map: same as above but using ids of jobs to indicate affiliation + - ops_sequence_order: specifies the order in which operations have to be processed + - ma_assignment: specifies which operation has been scheduled on which machine + - busy_until: specifies until when the machine will be busy + - num_eligible: number of machines that can process an operation + - job_in_process: whether job is currently being processed + - job_done: whether the job is done + + Constrains: + the agent may not select: + - machines that are currently busy + - jobs that are done already + - jobs that are currently processed + - job-machine combinations, where the machine cannot process the next operation of the job + + Finish condition: + - the agent has scheduled all operations of all jobs + + Reward: + - the negative makespan of the final schedule + + Args: + generator: FJSPGenerator instance as the data generator + generator_params: parameters for the generator + mask_no_ops: if True, agent may not select waiting operation (unless instance is done) + """ + + name = "fjsp" + + def __init__( + self, + generator: FJSPGenerator = None, + generator_params: dict = {}, + mask_no_ops: bool = True, + check_mask: bool = False, + stepwise_reward: bool = False, + **kwargs, + ): + super().__init__(check_solution=False, **kwargs) + if generator is None: + if generator_params.get("file_path", None) is not None: + generator = FJSPFileGenerator(**generator_params) + else: + generator = 
FJSPGenerator(**generator_params) + self.generator = generator + self._num_mas = generator.num_mas + self._num_jobs = generator.num_jobs + self._n_ops_max = generator.max_ops_per_job * self.num_jobs + + self.mask_no_ops = mask_no_ops + self.check_mask = check_mask + self.stepwise_reward = stepwise_reward + self._make_spec(self.generator) + + @property + def num_mas(self): + return self._num_mas + + @property + def num_jobs(self): + return self._num_jobs + + @property + def n_ops_max(self): + return self._n_ops_max + + def set_instance_params(self, td): + self._num_jobs = td["start_op_per_job"].size(1) + self._num_mas = td["proc_times"].size(1) + self._n_ops_max = td["proc_times"].size(2) + + def _decode_graph_structure(self, td: TensorDict): + batch_size = td.batch_size + start_op_per_job = td["start_op_per_job"] + end_op_per_job = td["end_op_per_job"] + pad_mask = td["pad_mask"] + n_ops_max = td["pad_mask"].size(-1) + + # here we will generate the operations-job mapping: + ops_job_map, ops_job_bin_map = get_job_ops_mapping( + start_op_per_job, end_op_per_job, n_ops_max + ) + + # mask invalid edges (caused by padding) + ops_job_bin_map[pad_mask.unsqueeze(1).expand_as(ops_job_bin_map)] = 0 + + # generate for each batch a sequence specifying the position of all operations in their respective jobs, + # e.g. 
[0,1,0,0,1,2,0,1,2,3,0,0] for jops with n_ops=[2,1,3,4,1,1] + # (bs, max_ops) + ops_seq_order = torch.sum( + ops_job_bin_map * (ops_job_bin_map.cumsum(2) - 1), dim=1 + ) + + # predecessor and successor adjacency matrices + pred = torch.diag_embed(torch.ones(n_ops_max - 1), offset=-1)[None].expand( + *batch_size, -1, -1 + ) + # the start of the sequence (of each job) does not have a predecessor, therefore we can + # mask all first ops of a job in the predecessor matrix + pred = pred * ops_seq_order.gt(0).unsqueeze(-1).expand_as(pred).to(pred) + succ = torch.diag_embed(torch.ones(n_ops_max - 1), offset=1)[None].expand( + *batch_size, -1, -1 + ) + # apply the same logic as above to mask the last op of a job, which does not have a successor. The last job of a job + # always comes before the 1st op of the next job, therefore performing a left shift of the ops seq tensor here + succ = succ * torch.cat( + (ops_seq_order[:, 1:], ops_seq_order.new_full((*batch_size, 1), 0)), dim=1 + ).gt(0).to(succ).unsqueeze(-1).expand_as(succ) + + # adjacency matrix = predecessors, successors and self loops + # (bs, max_ops, max_ops, 2) + ops_adj = torch.stack((pred, succ), dim=3) + + td = td.update( + { + "ops_adj": ops_adj, + "job_ops_adj": ops_job_bin_map, + "ops_job_map": ops_job_map, + # "op_spatial_enc": ops_spatial_enc, + "ops_sequence_order": ops_seq_order, + } + ) + + return td, n_ops_max + + def _reset(self, td: TensorDict = None, batch_size=None) -> TensorDict: + self.set_instance_params(td) + + td_reset = td.clone() + + td_reset, n_ops_max = self._decode_graph_structure(td_reset) + + # schedule + start_op_per_job = td_reset["start_op_per_job"] + start_times = torch.zeros((*batch_size, n_ops_max)) + finish_times = torch.full((*batch_size, n_ops_max), INIT_FINISH) + ma_assignment = torch.zeros((*batch_size, self.num_mas, n_ops_max)) + + # reset feature space + busy_until = torch.zeros((*batch_size, self.num_mas)) + # (bs, ma, ops) + ops_ma_adj = (td_reset["proc_times"] > 
0).to(torch.float32) + # (bs, ops) + num_eligible = torch.sum(ops_ma_adj, dim=1) + + td_reset = td_reset.update( + { + "start_times": start_times, + "finish_times": finish_times, + "ma_assignment": ma_assignment, + "busy_until": busy_until, + "num_eligible": num_eligible, + "next_op": start_op_per_job.clone().to(torch.int64), + "ops_ma_adj": ops_ma_adj, + "op_scheduled": torch.full((*batch_size, n_ops_max), False), + "job_in_process": torch.full((*batch_size, self.num_jobs), False), + "reward": torch.zeros((*batch_size,), dtype=torch.float32), + "time": torch.zeros((*batch_size,)), + "job_done": torch.full((*batch_size, self.num_jobs), False), + "done": torch.full((*batch_size, 1), False), + }, + ) + + td_reset.set("action_mask", self.get_action_mask(td_reset)) + # add additional features to tensordict + td_reset["lbs"] = calc_lower_bound(td_reset) + td_reset = self._get_features(td_reset) + + return td_reset + + def _get_job_machine_availability(self, td: TensorDict): + batch_size = td.size(0) + + # (bs, jobs, machines) + action_mask = torch.full((batch_size, self.num_jobs, self.num_mas), False).to( + td.device + ) + + # mask jobs that are done already + action_mask.add_(td["job_done"].unsqueeze(2)) + # as well as jobs that are currently processed + action_mask.add_(td["job_in_process"].unsqueeze(2)) + + # mask machines that are currently busy + action_mask.add_(td["busy_until"].gt(td["time"].unsqueeze(1)).unsqueeze(1)) + + # exclude job-machine combinations, where the machine cannot process the next op of the job + next_ops_proc_times = gather_by_index( + td["proc_times"], td["next_op"].unsqueeze(1), dim=2, squeeze=False + ).transpose(1, 2) + action_mask.add_(next_ops_proc_times == 0) + return action_mask + + def get_action_mask(self, td: TensorDict) -> torch.Tensor: + # 1 indicates machine or job is unavailable at current time step + action_mask = self._get_job_machine_availability(td) + if self.mask_no_ops: + # masking is only allowed if instance is finished + 
no_op_mask = td["done"] + else: + # if no job is currently processed and instance is not finished yet, waiting is not allowed + no_op_mask = ( + td["job_in_process"].any(1, keepdims=True) & (~td["done"]) + ) | td["done"] + # flatten action mask to correspond with logit shape + action_mask = rearrange(action_mask, "bs j m -> bs (j m)") + # NOTE: 1 means feasible action, 0 means infeasible action + mask = torch.cat((no_op_mask, ~action_mask), dim=1) + + return mask + + def _translate_action(self, td): + """This function translates an action into a machine, job tuple.""" + selected_job = td["action"] // self.num_mas + selected_op = td["next_op"].gather(1, selected_job[:, None]).squeeze(1) + selected_machine = td["action"] % self.num_mas + return selected_job, selected_op, selected_machine + + def _step(self, td: TensorDict): + # cloning required to avoid inplace operation which avoids gradient backtracking + td = td.clone() + td["action"].subtract_(1) + # (bs) + dones = td["done"].squeeze(1) + # specify which batch instances require which operation + no_op = td["action"].eq(NO_OP_ID) + no_op = no_op & ~dones + req_op = ~no_op & ~dones + + # transition to next time for no op instances + if no_op.any(): + td, dones = self._transit_to_next_time(no_op, td) + + # select only instances that perform a scheduling action + td_op = td.masked_select(req_op) + + td_op = self._make_step(td_op) + # update the tensordict + td[req_op] = td_op + + # action mask + td.set("action_mask", self.get_action_mask(td)) + + step_complete = self._check_step_complete(td, dones) + while step_complete.any(): + td, dones = self._transit_to_next_time(step_complete, td) + td.set("action_mask", self.get_action_mask(td)) + step_complete = self._check_step_complete(td, dones) + if self.check_mask: + assert reduce(td["action_mask"], "bs ... 
-> bs", "any").all() + + if self.stepwise_reward: + # if we require a stepwise reward, the change in the calculated lower bounds could serve as such + lbs = calc_lower_bound(td) + td["reward"] = -(lbs.max(1).values - td["lbs"].max(1).values) + td["lbs"] = lbs + else: + td["lbs"] = calc_lower_bound(td) + + # add additional features to tensordict + td = self._get_features(td) + + return td + + def _get_features(self, td): + # after we have transitioned to a next time step, we determine which operations are ready + td["is_ready"] = op_is_ready(td) + # td["lbs"] = calc_lower_bound(td) + + return td + + @staticmethod + def _check_step_complete(td, dones): + """check whether there a feasible actions left to be taken during the current + time step. If this is not the case (and the instance is not done), + we need to adance the timer of the repsective instance + """ + return ~reduce(td["action_mask"], "bs ... -> bs", "any") & ~dones + + def _make_step(self, td: TensorDict) -> TensorDict: + """ + Environment transition function + """ + + batch_idx = torch.arange(td.size(0)) + + # 3*(#req_op) + selected_job, selected_op, selected_machine = self._translate_action(td) + + # mark job as being processed + td["job_in_process"][batch_idx, selected_job] = 1 + + # mark op as schedules + td["op_scheduled"][batch_idx, selected_op] = True + + # update machine state + proc_time_of_action = td["proc_times"][batch_idx, selected_machine, selected_op] + # we may not select a machine that is busy + assert torch.all(td["busy_until"][batch_idx, selected_machine] <= td["time"]) + + # update schedule + td["start_times"][batch_idx, selected_op] = td["time"] + td["finish_times"][batch_idx, selected_op] = td["time"] + proc_time_of_action + td["ma_assignment"][batch_idx, selected_machine, selected_op] = 1 + # update the state of the selected machine + td["busy_until"][batch_idx, selected_machine] = td["time"] + proc_time_of_action + # update adjacency matrices (remove edges) + td["proc_times"] = 
td["proc_times"].scatter( + 2, + selected_op[:, None, None].expand(-1, self.num_mas, 1), + torch.zeros_like(td["proc_times"]), + ) + td["ops_ma_adj"] = td["proc_times"].contiguous().gt(0).to(torch.float32) + td["num_eligible"] = torch.sum(td["ops_ma_adj"], dim=1) + # update the positions of an operation in the job (subtract 1 from each operation of the selected job) + td["ops_sequence_order"] = ( + td["ops_sequence_order"] - gather_by_index(td["job_ops_adj"], selected_job, 1) + ).clip(0) + # some checks + # assert torch.allclose( + # td["proc_times"].sum(1).gt(0).sum(1), # num ops with eligible machine + # (~(td["op_scheduled"] + td["pad_mask"])).sum(1), # num unscheduled ops + # ) + + return td + + def _transit_to_next_time(self, step_complete, td: TensorDict) -> TensorDict: + """ + Transit to the next time + """ + + # we need a transition to a next time step if either + # 1.) all machines are busy + # 2.) all operations are already currently in process (can only happen if num_jobs < num_machines) + # 3.) idle machines can not process any of the not yet scheduled operations + # 4.) no_op is choosen + available_time_ma = td["busy_until"] + end_op_per_job = td["end_op_per_job"] + # we want to transition to the next time step where a machine becomes idle again. 
def _make_spec(self, generator: FJSPGenerator):
    """Declare the observation, action, reward and done specs of the environment.

    All shapes are per-instance (no batch dimension) and are derived from
    ``self.num_jobs``, ``self.num_mas`` and ``self.n_ops_max``.

    Args:
        generator: the data generator of the environment. It is not read here; the
            sizes are taken from the attributes of ``self``.
    """
    per_job = (self.num_jobs,)
    per_ma = (self.num_mas,)
    per_op = (self.n_ops_max,)
    ma_by_op = (self.num_mas, self.n_ops_max)
    job_by_op = (self.num_jobs, self.n_ops_max)

    self.observation_spec = Composite(
        time=Unbounded(shape=(1,), dtype=torch.int64),
        next_op=Unbounded(shape=per_job, dtype=torch.int64),
        proc_times=Unbounded(shape=ma_by_op, dtype=torch.float32),
        # the generators emit one padding flag per operation, not per machine-operation pair
        pad_mask=Unbounded(shape=per_op, dtype=torch.bool),
        # first / last operation of a job are operation ids, hence integers rather than flags
        start_op_per_job=Unbounded(shape=per_job, dtype=torch.int64),
        end_op_per_job=Unbounded(shape=per_job, dtype=torch.int64),
        start_times=Unbounded(shape=per_op, dtype=torch.int64),
        finish_times=Unbounded(shape=per_op, dtype=torch.int64),
        job_ops_adj=Unbounded(shape=job_by_op, dtype=torch.int64),
        ops_job_map=Unbounded(shape=per_op, dtype=torch.int64),
        ops_sequence_order=Unbounded(shape=per_op, dtype=torch.int64),
        ma_assignment=Unbounded(shape=ma_by_op, dtype=torch.int64),
        busy_until=Unbounded(shape=per_ma, dtype=torch.int64),
        num_eligible=Unbounded(shape=per_op, dtype=torch.int64),
        job_in_process=Unbounded(shape=per_job, dtype=torch.bool),
        job_done=Unbounded(shape=per_job, dtype=torch.bool),
        shape=(),
    )
    self.action_spec = Bounded(
        shape=(1,),
        dtype=torch.int64,
        low=-1,
        high=self.n_ops_max,
    )
    self.reward_spec = Unbounded(shape=(1,))
    self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)
def _simulate_processing_times(self, n_eligible_per_ops: torch.Tensor) -> torch.Tensor:
    """Sample processing times for every machine-operation pair.

    Args:
        n_eligible_per_ops: integer tensor of shape (bs, n_ops_max) holding the number
            of machines that may process each operation (0 for padded operations).

    Returns:
        Float tensor of shape (bs, num_mas, n_ops_max). Entries are zero where a
        machine cannot process an operation and a sampled processing time otherwise.
    """
    bs, n_ops_max = n_eligible_per_ops.shape

    # (bs, max_ops, machines)
    ma_seq_per_ops = torch.arange(1, self.num_mas + 1)[None, None].expand(
        bs, n_ops_max, self.num_mas
    )
    # generate a matrix of size (ops, mas) per batch, each row having as many ones as
    # the operation has eligible machines. E.g. n_eligible_per_ops=[1,3,2]; num_mas=4
    # [[1,0,0,0],
    #  [1,1,1,0],
    #  [1,1,0,0]]
    # This will be shuffled randomly to generate a machine-operation mapping
    ma_ops_edges_unshuffled = (ma_seq_per_ops <= n_eligible_per_ops[..., None]).float()
    # random shuffling of the machine axis, then transpose to (bs, machines, max_ops)
    idx = torch.rand_like(ma_ops_edges_unshuffled).argsort()
    ma_ops_edges = ma_ops_edges_unshuffled.gather(2, idx).transpose(1, 2)

    if self.same_mean_per_op:
        template = torch.ones((bs, self.num_mas, n_ops_max))
        proc_time_means = torch.randint(
            self.min_processing_time, self.max_processing_time, (bs, n_ops_max)
        )
        # sample within +-20% of the operation's mean, clipped to the global limits
        low_bounds = torch.maximum(
            torch.full_like(template, self.min_processing_time),
            (proc_time_means * (1 - 0.2)).round().unsqueeze(1),
        )
        high_bounds = (
            torch.minimum(
                torch.full_like(template, self.max_processing_time),
                (proc_time_means * (1 + 0.2)).round().unsqueeze(1),
            )
            + 1
        )
        # Take the modulo in integer arithmetic. Mixing the int64 draw with the float
        # bounds would first round the draw to float32, i.e. to a multiple of a large
        # power of two, so an even span would only ever produce even offsets.
        span = (high_bounds - low_bounds).to(torch.int64)
        offsets = torch.randint(2**63 - 1, size=span.shape) % span
        proc_times = offsets.to(low_bounds.dtype) + low_bounds
    else:
        proc_times = torch.randint(
            self.min_processing_time,
            self.max_processing_time + 1,
            size=(bs, self.num_mas, n_ops_max),
        )

    # remove proc_times for which there is no corresponding ma-ops connection
    return proc_times * ma_ops_edges
class FJSPFileGenerator(Generator):
    """Data generator for the Flexible Job-Shop Scheduling Problem (FJSP) using instance files

    Args:
        file_path: directory containing the instance files (every regular file in it is read)
        n_ops_max: optional total number of operations to pad each instance to. When
            several files are read, the padding size is at least the largest number
            of operations found in the files.

    Returns:
        A TensorDict with the following key:
            start_op_per_job [batch_size, num_jobs]: first operation of each job
            end_op_per_job [batch_size, num_jobs]: last operation of each job
            proc_times [batch_size, num_machines, total_n_ops]: processing time of ops on machines
            pad_mask [batch_size, total_n_ops]: not all instances have the same number of ops, so padding is used

    """

    def __init__(self, file_path: str, n_ops_max: int = None, **unused_kwargs):
        self.files = self.list_files(file_path)
        self.num_samples = len(self.files)

        if len(unused_kwargs) > 0:
            log.error(f"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}")

        if len(self.files) > 1:
            # all instances must be padded to a common size so they can be concatenated;
            # an explicitly requested larger size is kept instead of being discarded
            required = get_max_ops_from_files(self.files)
            n_ops_max = required if n_ops_max is None else max(n_ops_max, required)

        ret = map(partial(read, max_ops=n_ops_max), self.files)

        td_list, num_jobs, num_machines, max_ops_per_job = list(zip(*list(ret)))
        # the number of jobs / machines is taken from the first instance file
        num_jobs, num_machines = map(lambda x: x[0], (num_jobs, num_machines))
        max_ops_per_job = max(max_ops_per_job)

        self.td = torch.cat(td_list, dim=0)
        self.num_mas = num_machines
        self.num_jobs = num_jobs
        self.max_ops_per_job = max_ops_per_job
        self.n_ops_max = max_ops_per_job * num_jobs

        # position of the next instance to hand out
        self.start_idx = 0

    def _generate(self, batch_size: List[int]) -> TensorDict:
        """Return the next ``prod(batch_size)`` instances, restarting once all files were used."""
        # np.prod of an empty list is the float 1.0, which is not a valid slice bound
        batch_size = int(np.prod(batch_size))
        if batch_size > self.num_samples:
            log.warning(
                f"Only found {self.num_samples} instance files, but specified dataset size is {batch_size}"
            )
        end_idx = self.start_idx + batch_size
        td = self.td[self.start_idx : end_idx]
        self.start_idx += batch_size
        if self.start_idx >= self.num_samples:
            self.start_idx = 0
        return td

    @staticmethod
    def list_files(path):
        """Return the paths of all regular files directly inside ``path``, sorted by name."""
        import os

        # os.listdir returns entries in arbitrary order; sort for a reproducible dataset order
        files = sorted(
            os.path.join(path, f)
            for f in os.listdir(path)
            if os.path.isfile(os.path.join(path, f))
        )
        assert len(files) > 0
        return files
def read(loc: Path, max_ops=None):
    """
    Reads an FJSPLIB instance.

    Args:
        loc: location of instance file
        max_ops: optionally specify the maximum number of total operations (will be filled by padding)

    Returns:
        A tuple ``(td, num_jobs, num_machines, max_ops_per_job)`` where ``td`` is a
        TensorDict with batch size 1 holding ``start_op_per_job``, ``end_op_per_job``,
        ``proc_times`` (1, num_machines, max_ops) and ``pad_mask`` (1, max_ops).

    Raises:
        AssertionError: if the instance has more operations than ``max_ops``.
    """
    lines = file2lines(loc)

    # First line contains metadata.
    num_jobs, num_machines = lines[0][0], lines[0][1]

    # The remaining lines contain the job-operation data, where each line
    # represents a job and its operations.
    jobs = [parse_job_line(line) for line in lines[1:]]
    # operation counts and ids are integers; keep them integral (as the random
    # generator does) instead of going through the float default of torch.Tensor
    n_ope_per_job = torch.tensor([len(job) for job in jobs], dtype=torch.long).unsqueeze(0)
    total_ops = int(n_ope_per_job.sum())
    if max_ops is not None:
        assert total_ops <= max_ops, "got more operations then specified through max_ops"
    max_ops = max_ops or total_ops
    max_ops_per_job = int(n_ope_per_job.max())

    # ids of the last / first operation of every job in the flat operation sequence
    end_op_per_job = n_ope_per_job.cumsum(1) - 1
    start_op_per_job = torch.cat(
        (torch.zeros((1, 1), dtype=torch.long), end_op_per_job[:, :-1] + 1), dim=1
    )

    # everything beyond the real operations is padding
    pad_mask = torch.arange(max_ops).ge(total_ops).unsqueeze(0)

    proc_times = torch.zeros((num_machines, max_ops))
    op_cnt = 0
    for job in jobs:
        for op in job:
            for ma, dur in op:
                # subtract one to let indices start from zero
                proc_times[ma - 1, op_cnt] = dur
            op_cnt += 1
    proc_times = proc_times.unsqueeze(0)

    td = TensorDict(
        {
            "start_op_per_job": start_op_per_job,
            "end_op_per_job": end_op_per_job,
            "proc_times": proc_times,
            "pad_mask": pad_mask,
        },
        batch_size=[1],
    )

    return td, num_jobs, num_machines, max_ops_per_job
def render(td: TensorDict, idx: int):
    """Show a Gantt chart of the schedule stored in instance ``idx`` of ``td``.

    Every operation found in ``ma_assignment`` is drawn as a bar on the row of its
    machine, spanning its entry in ``start_times`` to its entry in ``finish_times``
    and coloured by its job.

    Args:
        td: batched state containing ``job_ops_adj``, ``ma_assignment``,
            ``start_times`` and ``finish_times``.
        idx: index of the instance to draw.
    """
    inst = td[idx]
    num_jobs = inst["job_ops_adj"].size(0)
    num_machines = inst["ma_assignment"].size(0)

    # Define a colormap with a color for each job
    colors = plt.cm.tab10(np.linspace(0, 1, num_jobs))
    cmap = ListedColormap(colors)

    # machine -> list of (operation, start, end)
    schedule = defaultdict(list)
    for machine, op in inst["ma_assignment"].nonzero().tolist():
        start = inst["start_times"][op].item()
        end = inst["finish_times"][op].item()
        schedule[machine].append((op, start, end))

    _, ax = plt.subplots()

    # Plot horizontal bars for each task
    for ma, ops in schedule.items():
        for op, start, end in ops:
            job = inst["job_ops_adj"][:, op].nonzero().item()
            ax.barh(
                ma,
                end - start,
                left=start,
                height=0.6,
                color=cmap(job),
                edgecolor="black",
                linewidth=1,
            )

            ax.text(
                start + (end - start) / 2,
                ma,
                str(op),
                ha="center",
                va="center",
                color="white",
            )

    # Set labels and title. Ticks cover every machine (not only those that received an
    # operation) so that a label always sits on the row of the machine it names.
    ax.set_yticks(range(num_machines))
    ax.set_yticklabels([f"Machine {i}" for i in range(num_machines)])
    ax.set_xlabel("Time")
    ax.set_title("Gantt Chart")

    # Add a legend for class labels
    handles = [plt.Rectangle((0, 0), 1, 1, color=cmap(i)) for i in range(num_jobs)]
    ax.legend(
        handles,
        [f"Job {label}" for label in range(num_jobs)],
        loc="center left",
        bbox_to_anchor=(1, 0.5),
    )

    plt.tight_layout()
    # Show the Gantt chart
    plt.show()
def get_job_op_view(
    td: TensorDict, keys: Union[List[str], None] = None, pad_value: Union[float, int] = 0
):
    """Reshape tensors of the tensordict from a flat operations-only view
    to a nested job-operation view and return them in a new dict.

    Args:
        td: tensordict providing ``job_ops_adj``, ``pad_mask``, ``ops_job_map``,
            ``ops_sequence_order`` and every entry named in ``keys``.
        keys: names of the entries to reshape. The padding mask is always added.
            The passed list is not modified.
        pad_value: fill value for positions without a corresponding operation.

    Returns:
        dict mapping each key to its (bs, jobs, ops_per_job, ...) view. ``proc_times``
        is returned as (bs, ma, jobs, ops_per_job) if it was requested.
    """
    # work on a copy: neither the caller's list nor a shared default may be mutated
    requested = list(keys) if keys is not None else []

    # ============= Prepare the new index =============
    bs, num_jobs, _ = td["job_ops_adj"].shape
    max_ops_per_job = int(td["job_ops_adj"].sum(-1).max())
    idx = _get_idx_for_job_op_view(td)
    base_shape = (bs, num_jobs, max_ops_per_job)
    pad_mask = td["pad_mask"]
    # ==============================================

    new_views = {}

    # due to special structure, processing times are treated separately
    if "proc_times" in requested:
        requested = [key for key in requested if key != "proc_times"]
        # move the operation axis in front of the machine axis: (bs, ma, ops) -> (bs, ops, ma)
        ops_first = td["proc_times"].permute(0, 2, 1)
        # the target needs the trailing machine axis as well: (bs, jobs, ops_per_job, ma)
        target_shape = Size((*base_shape, *ops_first.shape[2:]))
        # reshape processing times; (bs, ma, ops) -> (bs, ma, jobs, ops_per_job)
        new_views["proc_times"] = view(
            ops_first, idx, pad_mask, target_shape, pad_value
        ).permute(0, 3, 1, 2)

    # add padding mask if not in keys
    if "pad_mask" not in requested:
        requested.append("pad_mask")

    for key in requested:
        tensor = td[key]
        # keep optional trailing feature dimensions of the flat tensor
        target_shape = Size((*base_shape, *tensor.shape[2:]))
        # positions without an operation are padding, so the mask itself is filled with True
        fill_value = True if key == "pad_mask" else pad_value
        new_views[key] = view(tensor, idx, pad_mask, target_shape, fill_value)

    return new_views
def spatial_encoding(td: "TensorDict"):
    """Spatial encoding of operation pairs in the spirit of GraphFormer
    (https://arxiv.org/abs/2106.05234), which encodes the length of the shortest path
    between two nodes and uses a special value for pairs that are not connected.

    For two different, non-padded operations i and j of the same job, the entry is the
    number of steps between them in the job's operation sequence (e.g. i=1, j=3 -> 2;
    the matrix is symmetric, any sign handling is left to the consuming module).
    Operations of different jobs and pairs involving a padded operation get -1, the
    diagonal is 0.

    Args:
        td: provides ``job_ops_adj`` (bs, jobs, ops), ``ops_job_map`` (bs, ops) giving
            the job index of every operation, and the boolean ``pad_mask`` (bs, ops).

    Returns:
        Float tensor of shape (bs, ops, ops) with the encoding described above.
    """
    bs, _, n_total_ops = td["job_ops_adj"].shape
    max_ops_per_job = int(td["job_ops_adj"].sum(-1).max())
    ops_job_map = td["ops_job_map"]
    pad_mask = td["pad_mask"]

    same_job = (ops_job_map[:, None] == ops_job_map[..., None]).to(torch.int32)
    # mask padded
    same_job[pad_mask.unsqueeze(2).expand_as(same_job)] = 0
    same_job[pad_mask.unsqueeze(1).expand_as(same_job)] = 0
    # strictly upper triangular part of same_job (diagonal excluded for counting purposes).
    # Subtracting an identity instead would leave -1 on the diagonal of padded rows and
    # trip the sanity check below for small jobs.
    upper_tri = torch.triu(same_job, diagonal=1).to(torch.float32)
    # cumsum and masking of operations that do not belong to the same job
    num_jumps = upper_tri.cumsum(2) * upper_tri
    # mirror the matrix
    num_jumps = num_jumps + num_jumps.transpose(1, 2)
    # NOTE: shifted this logic into the spatial encoding module
    # num_jumps = num_jumps + (-num_jumps.transpose(1,2))
    assert not torch.any(num_jumps >= max_ops_per_job)
    # special value for ops of different jobs and self-loops
    num_jumps = torch.where(num_jumps == 0, -1, num_jumps)
    # build the diagonal mask on the device of the data it indexes
    self_mask = torch.eye(
        n_total_ops, dtype=torch.bool, device=num_jumps.device
    ).expand(bs, -1, -1)
    num_jumps[self_mask] = 0
    return num_jumps
+ We detect this offset by detecting ops-machine pairs, where the first possible start point of the operation is before + the machine becomes idle again - Therefore, we add this discrepancy to the proc_time of the respective ops-ma combination + + 2.) If an operation has been scheduled, we use its actual finishing time as lower bound. In this case, using the cumulative sum + of all peedecessors of a job does not make sense, since it is likely to differ from the real finishing time of its direct + predecessor (its only a lower bound). Therefore, we add the finish time to the cumulative sum of processing time of all + UNSCHEDULED operations, to obtain the lower bound. + Making this work is a bit hacky: We compute the first differences of finishing times of those operations scheduled and + add them to the matrix of processing times, where already processed operations are masked (with zero) + + + """ + + proc_times = td["proc_times"].clone() # (bs, ma, ops) + busy_until = td["busy_until"] # (bs, ma) + ops_adj = td["ops_adj"] # (bs, ops, ops, 2) + finish_times = td["finish_times"] # (bs, ops) + job_ops_adj = td["job_ops_adj"] # (bs, jobs, ops) + op_scheduled = td["op_scheduled"].to(torch.float32) # (bs, ops) + + ############## REGARDING POINT 1 OF DOCSTRING ############## + # for operations whose immidiate predecessor is scheduled, we can determine its earliest + # start time by the end time of the predecessor. 
+ # (bs, num_ops, 1) + maybe_start_at = torch.bmm(ops_adj[..., 0], finish_times[..., None]).squeeze(2) + # using the start_time, we can determine if and how long an op needs to wait for a machine to finish + wait_for_ma_offset = torch.clip(busy_until[..., None] - maybe_start_at[:, None], 0) + # we add this required waiting time to the respective processing time + proc_time_plus_wait = torch.where( + proc_times == 0, proc_times, proc_times + wait_for_ma_offset + ) + # NOTE get the mean processing time over all eligible machines for lb calulation + # ops_proc_times = torch.where(proc_times == 0, torch.inf, proc_time_plus_wait).min(1).values) + ops_proc_times = proc_time_plus_wait.sum(1) / (proc_times.gt(0).sum(1) + 1e-9) + # mask proc times for already scheduled ops + ops_proc_times[op_scheduled.to(torch.bool)] = 0 + + ############### REGARDING POINT 2 OF DOCSTRING ################### + # Now we determine all operations that are not scheduled yet (and thus have no finish_time). We will compute the cumulative + # sum over the processing time to determine the lower bound of unscheduled operations... + proc_matrix = job_ops_adj + ops_assigned = proc_matrix * op_scheduled[:, None] + proc_matrix_not_scheduled = proc_matrix * ( + torch.ones_like(proc_matrix) - op_scheduled[:, None] + ) + + # ...and add the finish_time of the last scheduled operation of the respective job to that. To make this work, using the cumsum logic, + # we calc the first differences of the finish times and seperate by job. 
def get_job_ops_mapping(
    start_op_per_job: torch.Tensor, end_op_per_job: torch.Tensor, n_ops_max: int
) -> Tuple[torch.Tensor, torch.Tensor]:
    """Map every operation to the job it belongs to.

    :param torch.Tensor start_op_per_job: (bs, num_jobs) index of first operation of each job
    :param torch.Tensor end_op_per_job: (bs, num_jobs) index of last operation of each job
        (left untouched, a copy is adjusted internally)
    :param int n_ops_max: number of operations per instance, padding included
    :return Tuple[torch.Tensor, torch.Tensor]:
        1.) index mapping (bs, num_ops): [0,0,1,1,1] means that first two operations belong to job 0
        2.) binary mapping (bs, num_jobs, num_ops): [[1,1,0], [0,0,1]] means that first two operations belong to job 0
    """
    last_op = end_op_per_job.clone()
    bs, num_jobs = last_op.shape

    # let the last job absorb all trailing (padded) operations, so that every instance
    # accounts for exactly n_ops_max operations
    last_op[:, -1] = n_ops_max - 1

    # (1, 1, max_ops) operation ids, broadcast against the (bs, jobs, 1) job boundaries
    op_ids = torch.arange(n_ops_max, device=last_op.device)[None, None]
    first_op = start_op_per_job[..., None]
    # (bs, jobs, max_ops): True where the operation lies within the job's id range
    in_job = (op_ids <= last_op[..., None]) & (op_ids >= first_op)

    # the rows of nonzero are (batch, job, op) triples; keeping the job column and
    # cutting it into rows of n_ops_max entries yields the job id of every operation
    job_of_op = torch.nonzero(in_job)[:, 1].reshape(-1, n_ops_max)

    # binary (bs, num_jobs, num_ops) job-operation adjacency, built by adding a one at
    # the job index of every operation
    zeros = job_of_op.new_zeros((bs, num_jobs, n_ops_max))
    ones = job_of_op.new_ones((bs, num_jobs, n_ops_max))
    job_op_adjacency = zeros.scatter_add(1, job_of_op.unsqueeze(1), ones)

    return job_of_op, job_op_adjacency
class JSSPEnv(FJSPEnv):
    """Job-Shop Scheduling Problem (JSSP) environment
    At each step, the agent chooses a job. The operation to be processed next for the selected job is
    then executed on the associated machine. The reward is 0 unless the agent scheduled all operations of all jobs.
    In that case, the reward is (-)makespan of the schedule: maximizing the reward is equivalent to minimizing the makespan.
    NOTE: The JSSP is a special case of the FJSP, when the number of eligible machines per operation is equal to one for all
    operations. Therefore, this environment is a subclass of the FJSP environment.

    Observations:
        - time: current time
        - next_op: next operation per job
        - proc_times: processing time of operation-machine pairs
        - pad_mask: specifies padded operations
        - start_op_per_job: id of first operation per job
        - end_op_per_job: id of last operation per job
        - start_times: start time of operation (defaults to 0 if not scheduled)
        - finish_times: finish time of operation (defaults to INIT_FINISH if not scheduled)
        - job_ops_adj: adjacency matrix specifying job-operation affiliation
        - ops_job_map: same as above but using ids of jobs to indicate affiliation
        - ops_sequence_order: specifies the order in which operations have to be processed
        - ma_assignment: specifies which operation has been scheduled on which machine
        - busy_until: specifies until when the machine will be busy
        - num_eligible: number of machines that can process an operation
        - job_in_process: whether job is currently being processed
        - job_done: whether the job is done

    Constraints:
        the agent may not select:
        - jobs that are done already
        - jobs that are currently processed

    Finish condition:
        - the agent has scheduled all operations of all jobs

    Reward:
        - the negative makespan of the final schedule

    Args:
        generator: JSSPGenerator instance as the data generator
        generator_params: parameters for the generator (an empty dict is used if omitted)
        mask_no_ops: if True, agent may not select waiting operation (unless instance is done)
    """

    name = "jssp"

    def __init__(
        self,
        generator: JSSPGenerator = None,
        generator_params: dict = None,
        mask_no_ops: bool = True,
        **kwargs,
    ):
        # build a fresh dict per call instead of sharing one mutable default object
        generator_params = {} if generator_params is None else generator_params
        if generator is None:
            # a "file_path" entry selects the file-based generator, otherwise instances are sampled
            if generator_params.get("file_path", None) is not None:
                generator = JSSPFileGenerator(**generator_params)
            else:
                generator = JSSPGenerator(**generator_params)

        super().__init__(generator, generator_params, mask_no_ops, **kwargs)

    def _get_features(self, td):
        """Extend the parent features with the next machine per job and an operation adjacency."""
        td = super()._get_features(td)
        # get the id of the machine that executes an operation:
        # (bs, ops, ma)
        ops_ma_adj = td["ops_ma_adj"].transpose(1, 2)
        # (bs, jobs, ma)
        ma_of_next_op = gather_by_index(ops_ma_adj, td["next_op"], dim=1)
        # (bs, jobs)
        td["next_ma"] = ma_of_next_op.argmax(-1)

        # adjacency matrix specifying neighbors of an operation, including its
        # predecessor and successor operations and operations on the same machine
        ops_on_same_ma_adj = einsum(
            td["ops_ma_adj"], td["ops_ma_adj"], "b m o1, b m o2 -> b o1 o2 "
        )
        # concat pred, succ and ops on same machine
        adj = torch.cat((td["ops_adj"], ops_on_same_ma_adj.unsqueeze(-1)), dim=-1).sum(-1)
        # mask padded operations and those scheduled
        mask = td["pad_mask"] + td["op_scheduled"]
        adj.masked_fill_(mask.unsqueeze(1), 0)
        td["adjacency"] = adj

        return td

    def get_action_mask(self, td: TensorDict) -> Tensor:
        """Return the mask over [wait, job_1, ..., job_n]; the waiting action comes first."""
        action_mask = self._get_job_machine_availability(td)
        if self.mask_no_ops:
            # waiting is only allowed if instance is finished
            no_op_mask = td["done"]
        else:
            # if no job is currently processed and instance is not finished yet, waiting is not allowed
            no_op_mask = (
                td["job_in_process"].any(1, keepdims=True) & (~td["done"])
            ) | td["done"]
        # reduce action mask to correspond with logit shape
        action_mask = reduce(action_mask, "bs j m -> bs j", reduction="all")
        # NOTE: 1 means feasible action, 0 means infeasible action
        # (bs, 1 + n_j)
        mask = torch.cat((no_op_mask, ~action_mask), dim=1)
        return mask

    def _translate_action(self, td):
        """Translate the selected job into its next operation and the machine processing it."""
        job = td["action"]
        op = gather_by_index(td["next_op"], job, dim=1)
        # get the machine that corresponds to the selected operation
        ma = gather_by_index(td["ops_ma_adj"], op.unsqueeze(1), dim=2).nonzero()[:, 1]
        return job, op, ma

    @staticmethod
    def load_data(fpath, batch_size=None):
        """Load JSSP instances from ``fpath`` through :class:`JSSPFileGenerator`."""
        # None stands in for the former mutable ``[]`` default
        batch_size = [] if batch_size is None else batch_size
        g = JSSPFileGenerator(fpath)
        return g(batch_size=batch_size)
machines + pad_mask [batch_size, total_n_ops]: not all instances have the same number of ops, so padding is used + + """ + + def __init__( + self, + num_jobs: int = 6, + num_machines: int = 6, + min_ops_per_job: int = None, + max_ops_per_job: int = None, + min_processing_time: int = 1, + max_processing_time: int = 99, + one2one_ma_map: bool = True, + **unused_kwargs, + ): + self.num_jobs = num_jobs + self.num_mas = num_machines + # quite common in jssp to have as many ops per job as there are machines + self.min_ops_per_job = min_ops_per_job or self.num_mas + self.max_ops_per_job = max_ops_per_job or self.num_mas + self.min_processing_time = min_processing_time + self.max_processing_time = max_processing_time + self.one2one_ma_map = one2one_ma_map + if self.one2one_ma_map: + assert self.min_ops_per_job == self.max_ops_per_job == self.num_mas + + # determines whether to use a fixed number of total operations or let it vary between instances + # NOTE: due to the way rl4co builds datasets, we need a fixed size here + self.n_ops_max = self.max_ops_per_job * self.num_jobs + + # FFSP environment doen't have any other kwargs + if len(unused_kwargs) > 0: + log.error(f"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}") + + def _simulate_processing_times(self, bs, n_ops_max) -> torch.Tensor: + if self.one2one_ma_map: + ops_machine_ids = ( + torch.rand((*bs, self.num_jobs, self.num_mas)) + .argsort(dim=-1) + .flatten(1, 2) + ) + else: + ops_machine_ids = torch.randint( + low=0, + high=self.num_mas, + size=(*bs, n_ops_max), + ) + ops_machine_adj = one_hot(ops_machine_ids, num_classes=self.num_mas) + + # (bs, max_ops, machines) + proc_times = torch.ones((*bs, n_ops_max, self.num_mas)) + proc_times = torch.randint( + self.min_processing_time, + self.max_processing_time + 1, + size=(*bs, self.num_mas, n_ops_max), + ) + + # remove proc_times for which there is no corresponding ma-ops connection + proc_times = proc_times * ops_machine_adj.transpose(1, 2) + # in JSSP there 
is only one machine capable to process an operation + assert (proc_times > 0).sum(1).eq(1).all() + return proc_times.to(torch.float32) + + def _generate(self, batch_size) -> TensorDict: + # simulate how many operations each job has + n_ope_per_job = torch.randint( + self.min_ops_per_job, + self.max_ops_per_job + 1, + size=(*batch_size, self.num_jobs), + ) + + # determine the total number of operations per batch instance (which may differ) + n_ops_batch = n_ope_per_job.sum(1) # (bs) + # determine the maximum total number of operations over all batch instances + n_ops_max = self.n_ops_max or n_ops_batch.max() + + # generate a mask, specifying which operations are padded + pad_mask = torch.arange(n_ops_max).unsqueeze(0).expand(*batch_size, -1) + pad_mask = pad_mask.ge(n_ops_batch[:, None].expand_as(pad_mask)) + + # determine the id of the end operation for each job + end_op_per_job = n_ope_per_job.cumsum(1) - 1 + + # determine the id of the starting operation for each job + # (bs, num_jobs) + start_op_per_job = torch.cat( + ( + torch.zeros((*batch_size, 1)).to(end_op_per_job), + end_op_per_job[:, :-1] + 1, + ), + dim=1, + ) + + # simulate processing times for machine-operation pairs + # (bs, num_mas, n_ops_max) + proc_times = self._simulate_processing_times(batch_size, n_ops_max) + + td = TensorDict( + { + "start_op_per_job": start_op_per_job, + "end_op_per_job": end_op_per_job, + "proc_times": proc_times, + "pad_mask": pad_mask, + }, + batch_size=batch_size, + ) + + return td + + +class JSSPFileGenerator(Generator): + """Data generator for the Job-Shop Scheduling Problem (JSSP) using instance files + + Args: + path: path to files + + Returns: + A TensorDict with the following key: + start_op_per_job [batch_size, num_jobs]: first operation of each job + end_op_per_job [batch_size, num_jobs]: last operation of each job + proc_times [batch_size, num_machines, total_n_ops]: processing time of ops on machines + pad_mask [batch_size, total_n_ops]: not all instances have 
def parse_job_line(line: Tuple[int]) -> List[Tuple[int, int]]:
    """
    Parses a JSSP job data line of the following form:

        n_ops * (<machine> <processing_time>)

    In words, a line consists of n_ops pairs of values, where the first value is the
    machine identifier and the second value is the processing time of the corresponding
    operation-machine combination.

    Note that the machine identifiers are returned exactly as they appear in the line.
    No index shift is applied here; converting them to zero-based indices is left to
    the caller.

    Args:
        line: flat sequence of values, alternating machine identifier and processing time

    Returns:
        list of (machine, duration) tuples, one per operation, in line order

    Raises:
        ValueError: if the line holds an odd number of values, i.e. a pair is incomplete
    """
    if len(line) % 2 != 0:
        # fail with a clear message instead of an IndexError on the dangling value
        raise ValueError(
            f"Expected an even number of values (machine, duration pairs), got {len(line)}"
        )

    return [(int(line[i]), int(line[i + 1])) for i in range(0, len(line), 2)]
+ jobs = [parse_job_line(line) for line in lines[1:]] + n_ope_per_job = torch.Tensor([len(x) for x in jobs]).unsqueeze(0) + total_ops = int(n_ope_per_job.sum()) + if max_ops is not None: + assert total_ops <= max_ops, "got more operations then specified through max_ops" + max_ops = max_ops or total_ops + max_ops_per_job = int(n_ope_per_job.max()) + + end_op_per_job = n_ope_per_job.cumsum(1) - 1 + start_op_per_job = torch.cat((torch.zeros((1, 1)), end_op_per_job[:, :-1] + 1), dim=1) + + pad_mask = torch.arange(max_ops) + pad_mask = pad_mask.ge(total_ops).unsqueeze(0) + + proc_times = torch.zeros((num_machines, max_ops)) + op_cnt = 0 + for job in jobs: + for ma, dur in job: + # subtract one to let indices start from zero + proc_times[ma - 1, op_cnt] = dur + op_cnt += 1 + proc_times = proc_times.unsqueeze(0) + + td = TensorDict( + { + "start_op_per_job": start_op_per_job, + "end_op_per_job": end_op_per_job, + "proc_times": proc_times, + "pad_mask": pad_mask, + }, + batch_size=[1], + ) + + return td, num_jobs, num_machines, max_ops_per_job + + +def file2lines(loc: Union[Path, str]) -> List[List[int]]: + with open(loc, "r") as fh: + lines = [line for line in fh.readlines() if line.strip()] + + def parse_num(word: str): + return int(word) if "." 
class SMTWTPEnv(RL4COEnvBase):
    """
    Single Machine Total Weighted Tardiness Problem environment as described in DeepACO (https://arxiv.org/pdf/2309.14032.pdf)
    SMTWTP is a scheduling problem in which a set of jobs must be processed on a single machine.
    Each job i has a processing time, a weight, and a due date. The objective is to minimize the sum of the weighted tardiness of all jobs,
    where the weighted tardiness of a job is defined as the product of its weight and the duration by which its completion time exceeds its due date.
    At each step, the agent chooses a job to process. The reward is 0 unless the agent processes all the jobs.
    In that case, the reward is (-)objective value of the processing order: maximizing the reward is equivalent to minimizing the objective.

    Observation:
        - job_due_time: the due time of each job
        - job_weight: the weight of each job
        - job_process_time: the process time of each job
        - current_job: the job selected last
        - action_mask: a mask of available actions
        - current_time: the current time

    Constants:
        - num_job: number of jobs
        - min_time_span: lower bound of jobs' due time. By default, jobs' due time is uniformly sampled from (min_time_span, max_time_span)
        - max_time_span: upper bound of jobs' due time. By default, it will be set to num_job / 2
        - min_job_weight: lower bound of jobs' weights. By default, jobs' weights are uniformly sampled from (min_job_weight, max_job_weight)
        - max_job_weight: upper bound of jobs' weights
        - min_process_time: lower bound of jobs' process time. By default, jobs' process time is uniformly sampled from (min_process_time, max_process_time)
        - max_process_time: upper bound of jobs' process time

    Finishing condition:
        - All jobs are processed

    Reward:
        - The reward is 0 unless the agent processes all the jobs.
        - In that case, the reward is (-)objective value of the processing order: maximizing the reward is equivalent to minimizing the objective.

    Args:
        generator: SMTWTPGenerator instance as the data generator
        generator_params: parameters for the generator (an empty dict is used if omitted)
    """

    name = "smtwtp"

    def __init__(
        self,
        generator: SMTWTPGenerator = None,
        generator_params: dict = None,
        **kwargs,
    ):
        super().__init__(**kwargs)
        if generator is None:
            # None replaces the former shared mutable ``{}`` default
            generator = SMTWTPGenerator(**(generator_params or {}))
        self.generator = generator
        self._make_spec(self.generator)

    @staticmethod
    def _step(td: TensorDict) -> TensorDict:
        """Process the selected job: mask it out and advance the clock by its process time."""
        current_job = td["action"]

        # Set not visited to 0 (i.e., we visited the node)
        available = td["action_mask"].scatter(
            -1, current_job.unsqueeze(-1).expand_as(td["action_mask"]), 0
        )

        # Increase used time
        selected_process_time = td["job_process_time"][
            torch.arange(current_job.size(0)), current_job
        ]
        current_time = td["current_time"] + selected_process_time.unsqueeze(-1)

        # We are done if there are no unprocessed jobs left
        done = torch.count_nonzero(available, dim=-1) <= 0

        # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here
        reward = torch.zeros_like(done)

        td.update(
            {
                "current_job": current_job,
                "current_time": current_time,
                "action_mask": available,
                "reward": reward,
                "done": done,
            }
        )
        return td

    def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict:
        """Build the initial state from the instance data in ``td``."""
        device = td.device

        init_job_due_time = td["job_due_time"]
        init_job_process_time = td["job_process_time"]
        init_job_weight = td["job_weight"]

        # Other variables
        current_job = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device)
        # float32 matches the observation spec; process times added in _step are not integers
        current_time = torch.zeros((*batch_size, 1), dtype=torch.float32, device=device)
        available = torch.ones(
            (*batch_size, self.generator.num_job + 1), dtype=torch.bool, device=device
        )
        available[:, 0] = 0  # mask the starting dummy node

        return TensorDict(
            {
                "job_due_time": init_job_due_time,
                "job_weight": init_job_weight,
                "job_process_time": init_job_process_time,
                "current_job": current_job,
                "current_time": current_time,
                "action_mask": available,
            },
            batch_size=batch_size,
        )

    def _make_spec(self, generator: SMTWTPGenerator) -> None:
        """Declare observation, action, reward and done specs from the generator bounds."""
        self.observation_spec = Composite(
            job_due_time=Bounded(
                low=generator.min_time_span,
                high=generator.max_time_span,
                shape=(generator.num_job + 1,),
                dtype=torch.float32,
            ),
            job_weight=Bounded(
                low=generator.min_job_weight,
                high=generator.max_job_weight,
                shape=(generator.num_job + 1,),
                dtype=torch.float32,
            ),
            job_process_time=Bounded(
                low=generator.min_process_time,
                high=generator.max_process_time,
                shape=(generator.num_job + 1,),
                dtype=torch.float32,
            ),
            # named after the key that _reset and _step actually write
            current_job=Unbounded(
                shape=(1,),
                dtype=torch.int64,
            ),
            action_mask=Unbounded(
                shape=(generator.num_job + 1,),
                dtype=torch.bool,
            ),
            current_time=Unbounded(
                shape=(1,),
                dtype=torch.float32,
            ),
            shape=(),
        )
        self.action_spec = Bounded(
            shape=(1,),
            dtype=torch.int64,
            low=0,
            high=generator.num_job + 1,
        )
        self.reward_spec = Unbounded(shape=(1,))
        self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)

    def _get_reward(self, td, actions) -> torch.Tensor:
        """Return the negative total weighted tardiness of the job order given by ``actions``."""
        job_due_time = td["job_due_time"]
        job_weight = td["job_weight"]
        job_process_time = td["job_process_time"]

        batch_idx = torch.arange(
            job_process_time.shape[0], device=job_process_time.device
        ).unsqueeze(1)

        # reorder the per-job data into processing order
        ordered_process_time = job_process_time[batch_idx, actions]
        ordered_due_time = job_due_time[batch_idx, actions]
        ordered_job_weight = job_weight[batch_idx, actions]
        presum_process_time = torch.cumsum(
            ordered_process_time, dim=1
        )  # ending time of each job
        job_tardiness = presum_process_time - ordered_due_time
        # jobs finished before their due time incur no tardiness
        job_tardiness[job_tardiness < 0] = 0
        job_weighted_tardiness = ordered_job_weight * job_tardiness

        return -job_weighted_tardiness.sum(-1)

    def check_solution_validity(self, td, actions):
        log.warning("Checking solution validity is not implemented for SMTWTP")

    @staticmethod
    def render(td, actions=None, ax=None):
        # delegate to the module-level render helper and hand back its result
        return render(td, actions, ax)
By default, it will be set to num_job / 2 + min_job_weight: lower bound of jobs' weights. By default, jobs' weights are uniformly sampled from (min_job_weight, max_job_weight) + max_job_weight: upper bound of jobs' weights + min_process_time: lower bound of jobs' process time. By default, jobs' process time is uniformly sampled from (min_process_time, max_process_time) + max_process_time: upper bound of jobs' process time + + Returns: + A TensorDict with the following key: + job_due_time [batch_size, num_job + 1]: the due time of each job + job_weight [batch_size, num_job + 1]: the weight of each job + job_process_time [batch_size, num_job + 1]: the process time of each job + """ + def __init__( + self, + num_job: int = 10, + min_time_span: float = 0, + max_time_span: float = None, # will be set to num_job / 2 by default. In DeepACO, it is set to num_job, which would be too simple + min_job_weight: float = 0, + max_job_weight: float = 1, + min_process_time: float = 0, + max_process_time: float = 1, + **unused_kwargs + ): + self.num_job = num_job + self.min_time_span = min_time_span + self.max_time_span = num_job / 2 if max_time_span is None else max_time_span + self.min_job_weight = min_job_weight + self.max_job_weight = max_job_weight + self.min_process_time = min_process_time + self.max_process_time = max_process_time + + # SMTWTP environment doen't have any other kwargs + if len(unused_kwargs) > 0: + log.error(f"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}") + + def _generate(self, batch_size) -> TensorDict: + batch_size = [batch_size] if isinstance(batch_size, int) else batch_size + # Sampling according to Ye et al. 
(2023) + job_due_time = ( + torch.FloatTensor(*batch_size, self.num_job + 1) + .uniform_(self.min_time_span, self.max_time_span) + ) + job_weight = ( + torch.FloatTensor(*batch_size, self.num_job + 1) + .uniform_(self.min_job_weight, self.max_job_weight) + ) + job_process_time = ( + torch.FloatTensor(*batch_size, self.num_job + 1) + .uniform_(self.min_process_time, self.max_process_time) + ) + + # Rollouts begin at dummy node 0, whose features are set to 0 + job_due_time[:, 0] = 0 + job_weight[:, 0] = 0 + job_process_time[:, 0] = 0 + + return TensorDict( + { + "job_due_time": job_due_time, + "job_weight": job_weight, + "job_process_time": job_process_time, + }, + batch_size=batch_size, + ) diff --git a/rl4co/envs/scheduling/smtwtp/render.py b/rl4co/envs/scheduling/smtwtp/render.py new file mode 100644 index 00000000..9f8eedf0 --- /dev/null +++ b/rl4co/envs/scheduling/smtwtp/render.py @@ -0,0 +1,15 @@ +import torch +import numpy as np +import matplotlib.pyplot as plt + +from matplotlib import cm, colormaps +from tensordict.tensordict import TensorDict + +from rl4co.utils.ops import gather_by_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def render(td: TensorDict, actions=None, ax=None): + raise NotImplementedError diff --git a/rl4co/models/__init__.py b/rl4co/models/__init__.py new file mode 100644 index 00000000..339c3b01 --- /dev/null +++ b/rl4co/models/__init__.py @@ -0,0 +1,49 @@ +from rl4co.models.common.constructive.autoregressive import ( + AutoregressiveDecoder, + AutoregressiveEncoder, + AutoregressivePolicy, +) +from rl4co.models.common.constructive.base import ( + ConstructiveDecoder, + ConstructiveEncoder, + ConstructivePolicy, +) +from rl4co.models.common.constructive.nonautoregressive import ( + NonAutoregressiveDecoder, + NonAutoregressiveEncoder, + NonAutoregressivePolicy, +) +from rl4co.models.common.transductive import TransductiveModel +from rl4co.models.rl import StepwisePPO +from 
rl4co.models.rl.a2c.a2c import A2C +from rl4co.models.rl.common.base import RL4COLitModule +from rl4co.models.rl.ppo.ppo import PPO +from rl4co.models.rl.reinforce.baselines import REINFORCEBaseline, get_reinforce_baseline +from rl4co.models.rl.reinforce.reinforce import REINFORCE +from rl4co.models.zoo.active_search import ActiveSearch +from rl4co.models.zoo.am import AttentionModel, AttentionModelPolicy +from rl4co.models.zoo.amppo import AMPPO +from rl4co.models.zoo.dact import DACT, DACTPolicy +from rl4co.models.zoo.deepaco import DeepACO, DeepACOPolicy +from rl4co.models.zoo.eas import EAS, EASEmb, EASLay +from rl4co.models.zoo.ham import ( + HeterogeneousAttentionModel, + HeterogeneousAttentionModelPolicy, +) +from rl4co.models.zoo.l2d import ( + L2DAttnPolicy, + L2DModel, + L2DPolicy, + L2DPolicy4PPO, + L2DPPOModel, +) +from rl4co.models.zoo.matnet import MatNet, MatNetPolicy +from rl4co.models.zoo.mdam import MDAM, MDAMPolicy +from rl4co.models.zoo.mvmoe import MVMoE_AM, MVMoE_POMO +from rl4co.models.zoo.n2s import N2S, N2SPolicy +from rl4co.models.zoo.nargnn import NARGNNPolicy +from rl4co.models.zoo.neuopt import NeuOpt, NeuOptPolicy +from rl4co.models.zoo.polynet import PolyNet +from rl4co.models.zoo.pomo import POMO +from rl4co.models.zoo.ptrnet import PointerNetwork, PointerNetworkPolicy +from rl4co.models.zoo.symnco import SymNCO, SymNCOPolicy diff --git a/rl4co/models/common/__init__.py b/rl4co/models/common/__init__.py new file mode 100644 index 00000000..57eea304 --- /dev/null +++ b/rl4co/models/common/__init__.py @@ -0,0 +1,21 @@ +from rl4co.models.common.constructive.autoregressive import ( + AutoregressiveDecoder, + AutoregressiveEncoder, + AutoregressivePolicy, +) +from rl4co.models.common.constructive.base import ( + ConstructiveDecoder, + ConstructiveEncoder, + ConstructivePolicy, +) +from rl4co.models.common.constructive.nonautoregressive import ( + NonAutoregressiveDecoder, + NonAutoregressiveEncoder, + NonAutoregressivePolicy, +) +from 
class AutoregressiveDecoder(ConstructiveDecoder, metaclass=abc.ABCMeta):
    """Template class for an autoregressive decoder, simple wrapper around
    :class:`rl4co.models.common.constructive.base.ConstructiveDecoder`.

    Tip:
        This class will not work as it is and is just a template.
        An example for autoregressive decoder can be found as :class:`rl4co.models.zoo.am.decoder.AttentionModelDecoder`.
    """
class ConstructiveDecoder(nn.Module, metaclass=abc.ABCMeta):
    """Base decoder model for constructive models. The decoder is responsible for generating the logits for the action"""

    @abc.abstractmethod
    def forward(
        self, td: TensorDict, hidden: Any = None, num_starts: int = 0
    ) -> Tuple[Tensor, Tensor]:
        """Obtain logits for current action to the next ones

        Args:
            td: TensorDict containing the input data
            hidden: Hidden state from the encoder. Can be any type
            num_starts: Number of starts for multistart decoding

        Returns:
            Tuple containing the logits and the action mask
        """
        raise NotImplementedError("Implement me in subclass!")

    def pre_decoder_hook(
        self, td: TensorDict, env: RL4COEnvBase, hidden: Any = None, num_starts: int = 0
    ) -> Tuple[TensorDict, RL4COEnvBase, Any]:
        """By default, we don't need to do anything here.

        Args:
            td: TensorDict containing the input data
            env: Environment for decoding
            hidden: Hidden state from the encoder
            num_starts: Number of starts for multistart decoding

        Returns:
            Tuple containing, in this order, the TensorDict, the environment and the hidden state
        """
        # all three arguments are passed through unchanged
        return td, env, hidden
Update the environment state with the action. Repeat 3-4 until all sequences are done + 5. Obtain log likelihood, rewards etc. + + Note that an encoder is not strictly needed (see :class:`NoEncoder`).). A decoder however is always needed either in the form of a + network or a function. + + Note: + There are major differences between this decoding and most RL problems. The most important one is + that reward may not defined for partial solutions, hence we have to wait for the environment to reach a terminal + state before we can compute the reward with `env.get_reward()`. + + Warning: + We suppose environments in the `done` state are still available for sampling. This is because in NCO we need to + wait for all the environments to reach a terminal state before we can stop the decoding process. This is in + contrast with the TorchRL framework (at the moment) where the `env.rollout` function automatically resets. + You may follow tighter integration with TorchRL here: https://github.com/ai4co/rl4co/issues/72. + + Args: + encoder: Encoder to use + decoder: Decoder to use + env_name: Environment name to solve (used for automatically instantiating networks) + temperature: Temperature for the softmax during decoding + tanh_clipping: Clipping value for the tanh activation (see Bello et al. 
2016) during decoding + mask_logits: Whether to mask the logits or not during decoding + train_decode_type: Decoding strategy for training + val_decode_type: Decoding strategy for validation + test_decode_type: Decoding strategy for testing + """ + + def __init__( + self, + encoder: Union[ConstructiveEncoder, Callable], + decoder: Union[ConstructiveDecoder, Callable], + env_name: str = "tsp", + temperature: float = 1.0, + tanh_clipping: float = 0, + mask_logits: bool = True, + train_decode_type: str = "sampling", + val_decode_type: str = "greedy", + test_decode_type: str = "greedy", + **unused_kw, + ): + super(ConstructivePolicy, self).__init__() + + if len(unused_kw) > 0: + log.error(f"Found {len(unused_kw)} unused kwargs: {unused_kw}") + + self.env_name = env_name + + # Encoder and decoder + if encoder is None: + log.warning("`None` was provided as encoder. Using `NoEncoder`.") + encoder = NoEncoder() + self.encoder = encoder + self.decoder = decoder + + # Decoding strategies + self.temperature = temperature + self.tanh_clipping = tanh_clipping + self.mask_logits = mask_logits + self.train_decode_type = train_decode_type + self.val_decode_type = val_decode_type + self.test_decode_type = test_decode_type + + def forward( + self, + td: TensorDict, + env: Optional[Union[str, RL4COEnvBase]] = None, + phase: str = "train", + calc_reward: bool = True, + return_actions: bool = True, + return_entropy: bool = False, + return_hidden: bool = False, + return_init_embeds: bool = False, + return_sum_log_likelihood: bool = True, + actions=None, + max_steps=1_000_000, + **decoding_kwargs, + ) -> dict: + """Forward pass of the policy. + + Args: + td: TensorDict containing the environment state + env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. 
Note that + it is more efficient to pass an already instantiated environment each time for fine-grained control + phase: Phase of the algorithm (train, val, test) + calc_reward: Whether to calculate the reward + return_actions: Whether to return the actions + return_entropy: Whether to return the entropy + return_hidden: Whether to return the hidden state + return_init_embeds: Whether to return the initial embeddings + return_sum_log_likelihood: Whether to return the sum of the log likelihood + actions: Actions to use for evaluating the policy. + If passed, use these actions instead of sampling from the policy to calculate log likelihood + max_steps: Maximum number of decoding steps for sanity check to avoid infinite loops if envs are buggy (i.e. do not reach `done`) + decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information. + + Returns: + out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy + """ + + # Encoder: get encoder output and initial embeddings from initial state + hidden, init_embeds = self.encoder(td) + + # Instantiate environment if needed + if isinstance(env, str) or env is None: + env_name = self.env_name if env is None else env + log.info(f"Instantiated environment not provided; instantiating {env_name}") + env = get_env(env_name) + + # Get decode type depending on phase and whether actions are passed for evaluation + decode_type = decoding_kwargs.pop("decode_type", None) + if actions is not None: + decode_type = "evaluate" + elif decode_type is None: + decode_type = getattr(self, f"{phase}_decode_type") + + # Setup decoding strategy + # we pop arguments that are not part of the decoding strategy + decode_strategy: DecodingStrategy = get_decoding_strategy( + decode_type, + temperature=decoding_kwargs.pop("temperature", self.temperature), + tanh_clipping=decoding_kwargs.pop("tanh_clipping", self.tanh_clipping), + 
mask_logits=decoding_kwargs.pop("mask_logits", self.mask_logits), + store_all_logp=decoding_kwargs.pop("store_all_logp", return_entropy), + **decoding_kwargs, + ) + + # Pre-decoding hook: used for the initial step(s) of the decoding strategy + td, env, num_starts = decode_strategy.pre_decoder_hook(td, env) + + # Additionally call a decoder hook if needed before main decoding + td, env, hidden = self.decoder.pre_decoder_hook(td, env, hidden, num_starts) + + # Main decoding: loop until all sequences are done + step = 0 + while not td["done"].all(): + logits, mask = self.decoder(td, hidden, num_starts) + td = decode_strategy.step( + logits, + mask, + td, + action=actions[..., step] if actions is not None else None, + ) + td = env.step(td)["next"] + step += 1 + if step > max_steps: + log.error( + f"Exceeded maximum number of steps ({max_steps}) duing decoding" + ) + break + + # Post-decoding hook: used for the final step(s) of the decoding strategy + logprobs, actions, td, env = decode_strategy.post_decoder_hook(td, env) + + # Output dictionary construction + if calc_reward: + td.set("reward", env.get_reward(td, actions)) + + outdict = { + "reward": td["reward"], + "log_likelihood": get_log_likelihood( + logprobs, actions, td.get("mask", None), return_sum_log_likelihood + ), + } + + if return_actions: + outdict["actions"] = actions + if return_entropy: + outdict["entropy"] = calculate_entropy(logprobs) + if return_hidden: + outdict["hidden"] = hidden + if return_init_embeds: + outdict["init_embeds"] = init_embeds + + return outdict diff --git a/rl4co/models/common/constructive/nonautoregressive/__init__.py b/rl4co/models/common/constructive/nonautoregressive/__init__.py new file mode 100644 index 00000000..f170d079 --- /dev/null +++ b/rl4co/models/common/constructive/nonautoregressive/__init__.py @@ -0,0 +1,9 @@ +from rl4co.models.common.constructive.nonautoregressive.decoder import ( + NonAutoregressiveDecoder, +) +from 
rl4co.models.common.constructive.nonautoregressive.encoder import ( + NonAutoregressiveEncoder, +) +from rl4co.models.common.constructive.nonautoregressive.policy import ( + NonAutoregressivePolicy, +) diff --git a/rl4co/models/common/constructive/nonautoregressive/decoder.py b/rl4co/models/common/constructive/nonautoregressive/decoder.py new file mode 100644 index 00000000..a649121e --- /dev/null +++ b/rl4co/models/common/constructive/nonautoregressive/decoder.py @@ -0,0 +1,40 @@ +from functools import lru_cache + +import torch + +from tensordict import TensorDict + +from rl4co.models.common.constructive.base import ConstructiveDecoder +from rl4co.utils.ops import batchify + + +@lru_cache(10) +def _multistart_batched_index(batch_size: int, num_starts: int): + """Create a batched index for multistart decoding""" + arr = torch.arange(batch_size) + if num_starts <= 1: + return arr + else: + return batchify(arr, num_starts) + + +class NonAutoregressiveDecoder(ConstructiveDecoder): + """The nonautoregressive decoder is a simple callable class that + takes the tensor dictionary and the heatmaps logits and returns the logits for the current + action logits and the action mask. 
+ """ + + def forward(self, td: TensorDict, heatmaps_logits: torch.Tensor, num_starts: int): + return self.heatmap_to_logits(td, heatmaps_logits, num_starts) + + @staticmethod + def heatmap_to_logits(td: TensorDict, heatmaps_logits: torch.Tensor, num_starts: int): + """Obtain heatmap logits for current action to the next ones""" + current_action = td.get("action", None) + if current_action is None: + logits = heatmaps_logits.mean(-1) + else: + batch_size = heatmaps_logits.shape[0] + _indexer = _multistart_batched_index(batch_size, num_starts) + logits = heatmaps_logits[_indexer, current_action, :] + return logits, td["action_mask"] diff --git a/rl4co/models/common/constructive/nonautoregressive/encoder.py b/rl4co/models/common/constructive/nonautoregressive/encoder.py new file mode 100644 index 00000000..cfaf5392 --- /dev/null +++ b/rl4co/models/common/constructive/nonautoregressive/encoder.py @@ -0,0 +1,13 @@ +import abc + +from rl4co.models.common.constructive.base import ConstructiveEncoder + + +class NonAutoregressiveEncoder(ConstructiveEncoder, metaclass=abc.ABCMeta): + """Template class for an autoregressive encoder, simple wrapper around + :class:`rl4co.models.common.constructive.base.ConstructiveEncoder`. + + Tip: + This class will not work as it is and is just a template. + An example for autoregressive encoder can be found as :class:`rl4co.models.zoo.am.encoder.AttentionModelEncoder`. 
+ """ diff --git a/rl4co/models/common/constructive/nonautoregressive/policy.py b/rl4co/models/common/constructive/nonautoregressive/policy.py new file mode 100644 index 00000000..ad5b724c --- /dev/null +++ b/rl4co/models/common/constructive/nonautoregressive/policy.py @@ -0,0 +1,40 @@ +from rl4co.models.common.constructive.base import ConstructivePolicy + +from .decoder import NonAutoregressiveDecoder +from .encoder import NonAutoregressiveEncoder + + +class NonAutoregressivePolicy(ConstructivePolicy): + """Template class for an nonautoregressive policy, simple wrapper around + :class:`rl4co.models.common.constructive.base.ConstructivePolicy`. + """ + + def __init__( + self, + encoder: NonAutoregressiveEncoder, + decoder: NonAutoregressiveDecoder = None, + env_name: str = "tsp", + temperature: float = 1.0, + tanh_clipping: float = 0, + mask_logits: bool = True, + train_decode_type: str = "sampling", + val_decode_type: str = "greedy", + test_decode_type: str = "greedy", + **unused_kw, + ): + # If decoder is not passed, we default to the non-autoregressive decoder that decodes the heatmap + if decoder is None: + decoder = NonAutoregressiveDecoder() + + super(NonAutoregressivePolicy, self).__init__( + encoder=encoder, + decoder=decoder, + env_name=env_name, + temperature=temperature, + tanh_clipping=tanh_clipping, + mask_logits=mask_logits, + train_decode_type=train_decode_type, + val_decode_type=val_decode_type, + test_decode_type=test_decode_type, + **unused_kw, + ) diff --git a/rl4co/models/common/improvement/__init__.py b/rl4co/models/common/improvement/__init__.py new file mode 100644 index 00000000..3eb4a954 --- /dev/null +++ b/rl4co/models/common/improvement/__init__.py @@ -0,0 +1 @@ +from rl4co.models.common.improvement.base import ImprovementDecoder, ImprovementEncoder, ImprovementPolicy \ No newline at end of file diff --git a/rl4co/models/common/improvement/base.py b/rl4co/models/common/improvement/base.py new file mode 100644 index 00000000..9012fc70 --- 
/dev/null +++ b/rl4co/models/common/improvement/base.py @@ -0,0 +1,146 @@ +import abc + +from typing import Tuple, Union + +import torch.nn as nn + +from tensordict import TensorDict +from torch import Tensor + +from rl4co.envs import RL4COEnvBase +from rl4co.models.nn.env_embeddings import env_init_embedding +from rl4co.models.nn.pos_embeddings import pos_init_embedding +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class ImprovementEncoder(nn.Module): + """Base class for the encoder of improvement models""" + + def __init__( + self, + embed_dim: int = 128, + init_embedding: nn.Module = None, + pos_embedding: nn.Module = None, + env_name: str = "pdp_ruin_repair", + pos_type: str = "CPE", + num_heads: int = 4, + num_layers: int = 3, + normalization: str = "layer", + feedforward_hidden: int = 128, + linear_bias: bool = False, + ): + super(ImprovementEncoder, self).__init__() + + if isinstance(env_name, RL4COEnvBase): + env_name = env_name.name + self.env_name = env_name + self.init_embedding = ( + env_init_embedding( + self.env_name, {"embed_dim": embed_dim, "linear_bias": linear_bias} + ) + if init_embedding is None + else init_embedding + ) + + self.pos_type = pos_type + self.pos_embedding = ( + pos_init_embedding(self.pos_type, {"embed_dim": embed_dim}) + if pos_embedding is None + else pos_embedding + ) + + @abc.abstractmethod + def _encoder_forward(self, init_h: Tensor, init_p: Tensor) -> Tuple[Tensor, Tensor]: + """Process the node embeddings and positional embeddings to the final embeddings + + Args: + init_h: initialized node embeddings + init_p: initialized positional embeddings + + Returns: + Tuple containing the final node embeddings and final positional embeddings (if any) + """ + raise NotImplementedError("Implement me in subclass!") + + def forward(self, td: TensorDict) -> Tuple[Tensor, Tensor]: + """Forward pass of the encoder. + Transform the input TensorDict into a latent representation. 
+ + Args: + td: Input TensorDict containing the environment state + + Returns: + h: Latent representation of the input + init_h: Initial embedding of the input + """ + # Transfer to embedding space (node) + init_h = self.init_embedding(td) + + # Transfer to embedding space (solution) + init_p = self.pos_embedding(td) + + # Process embedding + final_h, final_p = self._encoder_forward(init_h, init_p) + + # Return latent representation and initial embedding + return final_h, final_p + + +class ImprovementDecoder(nn.Module, metaclass=abc.ABCMeta): + """Base decoder model for improvement models. The decoder is responsible for generating the logits of the action""" + + @abc.abstractmethod + def forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> Tensor: + """Obtain logits to perform operators that improve the current solution to the next ones + + Args: + td: TensorDict with the current environment state + final_h: final node embeddings + final_p: final positional embeddings + + Returns: + Tuple containing the logits + """ + raise NotImplementedError("Implement me in subclass!") + + +class ImprovementPolicy(nn.Module): + """ + Base class for improvement policies. Improvement policies take an instance + a solution as input and output a specific operator that changes the current solution to a new one. + + "Improvement" means that a solution is (potentially) improved to a new one by the model. + + """ + + @abc.abstractmethod + def forward( + self, + td: TensorDict, + env: Union[str, RL4COEnvBase] = None, + phase: str = "train", + return_actions: bool = True, + return_entropy: bool = False, + return_init_embeds: bool = False, + actions=None, + **decoding_kwargs, + ) -> dict: + """Forward pass of the policy. + + Args: + td: TensorDict containing the environment state + env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. 
Note that + it is more efficient to pass an already instantiated environment each time for fine-grained control + phase: Phase of the algorithm (train, val, test) + return_actions: Whether to return the actions + return_entropy: Whether to return the entropy + return_init_embeds: Whether to return the initial embeddings + actions: Actions to use for evaluating the policy. + If passed, use these actions instead of sampling from the policy to calculate log likelihood + decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information. + + Returns: + out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy + """ + raise NotImplementedError("Implement me in subclass!") diff --git a/rl4co/models/common/transductive/__init__.py b/rl4co/models/common/transductive/__init__.py new file mode 100644 index 00000000..961db6ff --- /dev/null +++ b/rl4co/models/common/transductive/__init__.py @@ -0,0 +1 @@ +from rl4co.models.common.transductive.base import TransductiveModel diff --git a/rl4co/models/common/transductive/base.py b/rl4co/models/common/transductive/base.py new file mode 100644 index 00000000..1ba42082 --- /dev/null +++ b/rl4co/models/common/transductive/base.py @@ -0,0 +1,93 @@ +import abc + +from typing import Any, Optional, Union + +from lightning.pytorch.utilities.types import STEP_OUTPUT +from torch.utils.data import Dataset + +from rl4co.models.rl.common.base import RL4COLitModule + + +class TransductiveModel(RL4COLitModule, metaclass=abc.ABCMeta): + """Base class for transductive algorithms (i.e. that optimize policy parameters for + specific instances, see https://en.wikipedia.org/wiki/Transduction_(machine_learning)). + Transductive algorithms are used online to find better solutions for a given dataset, i.e. + given a policy, improve (a part of) its parameters such that + the policy performs better on the given dataset. 
+ + Note: + By default, we use manual optimization to handle the search. + + Args: + env: RL4CO environment + policy: policy network + dataset: dataset to use for training + batch_size: batch size + max_iters: maximum number of iterations + max_runtime: maximum runtime in seconds + save_path: path to save the model + **kwargs: additional arguments + """ + + def __init__( + self, + env, + policy, + dataset: Union[Dataset, str], + batch_size: int = 1, + max_iters: int = 100, + max_runtime: Optional[int] = 86_400, + save_path: Optional[str] = None, + **kwargs, + ): + self.save_hyperparameters(logger=False) + super().__init__(env, policy, **kwargs) + self.dataset = dataset + self.automatic_optimization = False # we optimize manually + + def setup(self, stage="fit"): + """Setup the dataset and attributes. + The RL4COLitModulebase class automatically loads the data. + """ + if isinstance(self.dataset, str): + # load from file + self.dataset = self.env.dataset(filename=self.dataset) + + # Set all datasets and batch size as the same + for split in ["train", "val", "test"]: + setattr(self, f"{split}_dataset", self.dataset) + setattr(self, f"{split}_batch_size", self.hparams.batch_size) + + # Setup loggers + self.setup_loggers() + + def on_train_batch_start(self, batch: Any, batch_idx: int): + """Called before training (i.e. search) for a new batch begins. + This can be used to perform changes to the model or optimizer at the start of each batch. + """ + pass # Implement in subclass + + @abc.abstractmethod + def training_step(self, batch, batch_idx): + """Main search loop. We use the training step to effectively adapt to a `batch` of instances.""" + raise NotImplementedError("Implement in subclass") + + def on_train_batch_end( + self, outputs: STEP_OUTPUT, batch: Any, batch_idx: int + ) -> None: + """Called when the train batch ends. This can be used for + instance for logging or clearing cache. 
+ """ + pass # Implement in subclass + + def on_train_epoch_end(self) -> None: + """Called when the train ends.""" + pass # Implement in subclass + + def validation_step(self, batch: Any, batch_idx: int): + """Not used during search""" + pass + + def test_step(self, batch: Any, batch_idx: int): + """Not used during search""" + pass diff --git a/rl4co/models/nn/__init__.py b/rl4co/models/nn/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/models/nn/attention.py b/rl4co/models/nn/attention.py new file mode 100644 index 00000000..0dfa5973 --- /dev/null +++ b/rl4co/models/nn/attention.py @@ -0,0 +1,538 @@ +import itertools +import math +import warnings + +from typing import Callable, Optional, Union + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from einops import rearrange + +from rl4co.models.nn.moe import MoE +from rl4co.utils import get_pylogger + +log = get_pylogger(__name__) + + +def scaled_dot_product_attention_simple( + q, k, v, attn_mask=None, dropout_p=0.0, is_causal=False +): + """Simple (exact) Scaled Dot-Product Attention in RL4CO without customized kernels (i.e. 
no Flash Attention).""" + + # Check for causal and attn_mask conflict + if is_causal and attn_mask is not None: + raise ValueError("Cannot set both is_causal and attn_mask") + + # Calculate scaled dot product + scores = torch.matmul(q, k.transpose(-2, -1)) / (k.size(-1) ** 0.5) + + # Apply the provided attention mask + if attn_mask is not None: + if attn_mask.dtype == torch.bool: + scores.masked_fill_(~attn_mask, float("-inf")) + else: + scores += attn_mask + + # Apply causal mask + if is_causal: + s, l_ = scores.size(-2), scores.size(-1) + mask = torch.triu(torch.ones((s, l_), device=scores.device), diagonal=1) + scores.masked_fill_(mask.bool(), float("-inf")) + + # Softmax to get attention weights + attn_weights = F.softmax(scores, dim=-1) + + # Apply dropout + if dropout_p > 0.0: + attn_weights = F.dropout(attn_weights, p=dropout_p) + + # Compute the weighted sum of values + return torch.matmul(attn_weights, v) + + +try: + from torch.nn.functional import scaled_dot_product_attention +except ImportError: + log.warning( + "torch.nn.functional.scaled_dot_product_attention not found. Make sure you are using PyTorch >= 2.0.0." + "Alternatively, install Flash Attention https://github.com/HazyResearch/flash-attention ." + "Using custom implementation of scaled_dot_product_attention without Flash Attention. " + ) + scaled_dot_product_attention = scaled_dot_product_attention_simple + + +class MultiHeadAttention(nn.Module): + """PyTorch native implementation of Flash Multi-Head Attention with automatic mixed precision support. + Uses PyTorch's native `scaled_dot_product_attention` implementation, available from 2.0 + + Note: + If `scaled_dot_product_attention` is not available, use custom implementation of `scaled_dot_product_attention` without Flash Attention. 
+ + Args: + embed_dim: total dimension of the model + num_heads: number of heads + bias: whether to use bias + attention_dropout: dropout rate for attention weights + causal: whether to apply causal mask to attention scores + device: torch device + dtype: torch dtype + sdpa_fn: scaled dot product attention function (SDPA) implementation + """ + + def __init__( + self, + embed_dim: int, + num_heads: int, + bias: bool = True, + attention_dropout: float = 0.0, + causal: bool = False, + device: str = None, + dtype: torch.dtype = None, + sdpa_fn: Optional[Callable] = None, + ) -> None: + factory_kwargs = {"device": device, "dtype": dtype} + super().__init__() + self.embed_dim = embed_dim + self.causal = causal + self.attention_dropout = attention_dropout + self.sdpa_fn = sdpa_fn if sdpa_fn is not None else scaled_dot_product_attention + + self.num_heads = num_heads + assert self.embed_dim % num_heads == 0, "self.kdim must be divisible by num_heads" + self.head_dim = self.embed_dim // num_heads + assert ( + self.head_dim % 8 == 0 and self.head_dim <= 128 + ), "Only support head_dim <= 128 and divisible by 8" + + self.Wqkv = nn.Linear(embed_dim, 3 * embed_dim, bias=bias, **factory_kwargs) + self.out_proj = nn.Linear(embed_dim, embed_dim, bias=bias, **factory_kwargs) + + def forward(self, x, attn_mask=None): + """x: (batch, seqlen, hidden_dim) (where hidden_dim = num heads * head dim) + attn_mask: bool tensor of shape (batch, seqlen) + """ + # Project query, key, value + q, k, v = rearrange( + self.Wqkv(x), "b s (three h d) -> three b h s d", three=3, h=self.num_heads + ).unbind(dim=0) + + if attn_mask is not None: + attn_mask = ( + attn_mask.unsqueeze(1) + if attn_mask.ndim == 3 + else attn_mask.unsqueeze(1).unsqueeze(2) + ) + + # Scaled dot product attention + out = self.sdpa_fn( + q, + k, + v, + attn_mask=attn_mask, + dropout_p=self.attention_dropout, + ) + return self.out_proj(rearrange(out, "b h s d -> b s (h d)")) + + +def sdpa_fn_wrapper(q, k, v, attn_mask=None, 
dmat=None, dropout_p=0.0, is_causal=False): + if dmat is not None: + log.warning( + "Edge weights passed to simple attention-fn, which is not supported. Weights will be ignored..." + ) + return scaled_dot_product_attention( + q, k, v, attn_mask=attn_mask, dropout_p=dropout_p, is_causal=is_causal + ) + + +class MultiHeadCrossAttention(nn.Module): + """PyTorch native implementation of Flash Multi-Head Cross Attention with automatic mixed precision support. + Uses PyTorch's native `scaled_dot_product_attention` implementation, available from 2.0 + + Note: + If `scaled_dot_product_attention` is not available, use custom implementation of `scaled_dot_product_attention` without Flash Attention. + + Args: + embed_dim: total dimension of the model + num_heads: number of heads + bias: whether to use bias + attention_dropout: dropout rate for attention weights + device: torch device + dtype: torch dtype + sdpa_fn: scaled dot product attention function (SDPA) + """ + + def __init__( + self, + embed_dim: int, + num_heads: int, + bias: bool = False, + attention_dropout: float = 0.0, + device: str = None, + dtype: torch.dtype = None, + sdpa_fn: Optional[Union[Callable, nn.Module]] = None, + ) -> None: + factory_kwargs = {"device": device, "dtype": dtype} + super().__init__() + self.embed_dim = embed_dim + self.attention_dropout = attention_dropout + + # Default to `scaled_dot_product_attention` if `sdpa_fn` is not provided + if sdpa_fn is None: + sdpa_fn = sdpa_fn_wrapper + self.sdpa_fn = sdpa_fn + + self.num_heads = num_heads + assert self.embed_dim % num_heads == 0, "self.kdim must be divisible by num_heads" + self.head_dim = self.embed_dim // num_heads + assert ( + self.head_dim % 8 == 0 and self.head_dim <= 128 + ), "Only support head_dim <= 128 and divisible by 8" + + self.Wq = nn.Linear(embed_dim, embed_dim, bias=bias, **factory_kwargs) + self.Wkv = nn.Linear(embed_dim, 2 * embed_dim, bias=bias, **factory_kwargs) + self.out_proj = nn.Linear(embed_dim, embed_dim, bias=bias, 
**factory_kwargs) + + def forward(self, q_input, kv_input, cross_attn_mask=None, dmat=None): + # Project query, key, value + q = rearrange( + self.Wq(q_input), "b m (h d) -> b h m d", h=self.num_heads + ) # [b, h, m, d] + k, v = rearrange( + self.Wkv(kv_input), "b n (two h d) -> two b h n d", two=2, h=self.num_heads + ).unbind( + dim=0 + ) # [b, h, n, d] + + if cross_attn_mask is not None: + # add head dim + cross_attn_mask = cross_attn_mask.unsqueeze(1) + + # Scaled dot product attention + out = self.sdpa_fn( + q, + k, + v, + attn_mask=cross_attn_mask, + dmat=dmat, + dropout_p=self.attention_dropout, + ) + return self.out_proj(rearrange(out, "b h s d -> b s (h d)")) + + +class PointerAttention(nn.Module): + """Calculate logits given query, key and value and logit key. + This follows the pointer mechanism of Vinyals et al. (2015) (https://arxiv.org/abs/1506.03134). + + Note: + With Flash Attention, masking is not supported + + Performs the following: + 1. Apply cross attention to get the heads + 2. Project heads to get glimpse + 3. 
Compute attention score between glimpse and logit key + + Args: + embed_dim: total dimension of the model + num_heads: number of heads + mask_inner: whether to mask inner attention + linear_bias: whether to use bias in linear projection + check_nan: whether to check for NaNs in logits + sdpa_fn: scaled dot product attention function (SDPA) implementation + """ + + def __init__( + self, + embed_dim: int, + num_heads: int, + mask_inner: bool = True, + out_bias: bool = False, + check_nan: bool = True, + sdpa_fn: Optional[Callable] = None, + **kwargs, + ): + super(PointerAttention, self).__init__() + self.num_heads = num_heads + self.mask_inner = mask_inner + + # Projection - query, key, value already include projections + self.project_out = nn.Linear(embed_dim, embed_dim, bias=out_bias) + self.sdpa_fn = sdpa_fn if sdpa_fn is not None else scaled_dot_product_attention + self.check_nan = check_nan + + def forward(self, query, key, value, logit_key, attn_mask=None): + """Compute attention logits given query, key, value, logit key and attention mask. + + Args: + query: query tensor of shape [B, ..., L, E] + key: key tensor of shape [B, ..., S, E] + value: value tensor of shape [B, ..., S, E] + logit_key: logit key tensor of shape [B, ..., S, E] + attn_mask: attention mask tensor of shape [B, ..., S]. Note that `True` means that the value _should_ take part in attention + as described in the [PyTorch Documentation](https://pytorch.org/docs/stable/generated/torch.nn.functional.scaled_dot_product_attention.html) + """ + # Compute inner multi-head attention with no projections. 
+ heads = self._inner_mha(query, key, value, attn_mask) + glimpse = self._project_out(heads, attn_mask) + + # Batch matrix multiplication to compute logits (batch_size, num_steps, graph_size) + # bmm is slightly faster than einsum and matmul + logits = (torch.bmm(glimpse, logit_key.squeeze(-2).transpose(-2, -1))).squeeze( + -2 + ) / math.sqrt(glimpse.size(-1)) + + if self.check_nan: + assert not torch.isnan(logits).any(), "Logits contain NaNs" + + return logits + + def _inner_mha(self, query, key, value, attn_mask): + q = self._make_heads(query) + k = self._make_heads(key) + v = self._make_heads(value) + if self.mask_inner: + # make mask the same number of dimensions as q + attn_mask = ( + attn_mask.unsqueeze(1) + if attn_mask.ndim == 3 + else attn_mask.unsqueeze(1).unsqueeze(2) + ) + else: + attn_mask = None + heads = self.sdpa_fn(q, k, v, attn_mask=attn_mask) + return rearrange(heads, "... h n g -> ... n (h g)", h=self.num_heads) + + def _make_heads(self, v): + return rearrange(v, "... g (h s) -> ... h g s", h=self.num_heads) + + def _project_out(self, out, *kwargs): + return self.project_out(out) + + +class PointerAttnMoE(PointerAttention): + """Calculate logits given query, key and value and logit key. + This follows the pointer mechanism of Vinyals et al. (2015) , + and the MoE gating mechanism of Zhou et al. (2024) . + + Note: + With Flash Attention, masking is not supported + + Performs the following: + 1. Apply cross attention to get the heads + 2. Project heads to get glimpse + 3. 
def __init__(
    self,
    embed_dim: int,
    num_heads: int,
    mask_inner: bool = True,
    out_bias: bool = False,
    check_nan: bool = True,
    sdpa_fn: Optional[Callable] = None,
    moe_kwargs: Optional[dict] = None,
):
    """Build the pointer attention with an MoE output projection.

    Args:
        embed_dim: total dimension of the model
        num_heads: number of heads
        mask_inner: whether to mask inner attention
        out_bias: whether the output projections use a bias term
        check_nan: whether to check for NaNs in logits
        sdpa_fn: scaled dot product attention function (SDPA) implementation
        moe_kwargs: Keyword arguments for MoE. May be omitted; a missing
            "light_version" entry is treated as False.
    """
    super(PointerAttnMoE, self).__init__(
        embed_dim, num_heads, mask_inner, out_bias, check_nan, sdpa_fn
    )
    # The declared default is None, which can neither be unpacked with ** nor
    # indexed; normalise it to a dict and copy so the caller's dict is untouched.
    user_moe_kwargs = dict(moe_kwargs) if moe_kwargs is not None else {}
    # `_project_out` indexes "light_version", so make sure the key always exists.
    self.moe_kwargs = {"light_version": False, **user_moe_kwargs}

    # Drop the dense projection created by the parent; it is only re-created
    # below for the light version.
    self.project_out = None
    self.project_out_moe = MoE(
        embed_dim, embed_dim, num_neurons=[], out_bias=out_bias, **user_moe_kwargs
    )
    if self.moe_kwargs["light_version"]:
        # Two-way gate choosing between the dense and the MoE projection
        self.dense_or_moe = nn.Linear(embed_dim, 2, bias=False)
        self.project_out = nn.Linear(embed_dim, embed_dim, bias=out_bias)
class MultiHeadCompat(nn.Module):
    """Multi-head compatibility scores between queries and data nodes.

    Only the query/key projections are learned; the module returns the raw
    (unnormalised, unmasked) dot products per head.

    Args:
        n_heads: number of heads
        input_dim: feature dimension of the queries and of the data
        embed_dim: used to derive `val_dim` as `embed_dim // n_heads` when
            `val_dim` is not given
        val_dim: per-head value dimension (only stored, and used as the
            default for `key_dim`)
        key_dim: per-head key/query dimension; defaults to `val_dim`
    """

    def __init__(self, n_heads, input_dim, embed_dim=None, val_dim=None, key_dim=None):
        super(MultiHeadCompat, self).__init__()

        if val_dim is None and embed_dim is not None:
            val_dim = embed_dim // n_heads
        if key_dim is None:
            if val_dim is None:
                # Previously this surfaced as an opaque TypeError from `None // n_heads`
                raise ValueError("Provide at least one of embed_dim, val_dim or key_dim")
            key_dim = val_dim

        self.n_heads = n_heads
        self.input_dim = input_dim
        self.embed_dim = embed_dim
        self.val_dim = val_dim
        self.key_dim = key_dim

        self.W_query = nn.Parameter(torch.Tensor(n_heads, input_dim, key_dim))
        self.W_key = nn.Parameter(torch.Tensor(n_heads, input_dim, key_dim))

        self.init_parameters()

    # used for init nn.Parameter
    def init_parameters(self):
        """Fill every parameter uniformly in +-1/sqrt(size of its last dimension)."""
        for param in self.parameters():
            stdv = 1.0 / math.sqrt(param.size(-1))
            param.data.uniform_(-stdv, stdv)

    def forward(self, q, h=None, mask=None):
        """Compute per-head compatibility between queries and data.

        :param q: queries (batch_size, n_query, input_dim)
        :param h: data (batch_size, graph_size, input_dim); defaults to `q` (self-attention)
        :param mask: accepted for interface compatibility; it is not applied by this method
        :return: compatibility tensor (n_heads, batch_size, n_query, graph_size)
        """

        if h is None:
            h = q  # compute self-attention

        # h should be (batch_size, graph_size, input_dim)
        batch_size, graph_size, input_dim = h.size()
        n_query = q.size(1)

        # Flatten batch and node axes so one matmul broadcasts over the head axis
        hflat = h.contiguous().view(-1, input_dim)
        qflat = q.contiguous().view(-1, input_dim)

        shp = (self.n_heads, batch_size, graph_size, -1)
        shp_q = (self.n_heads, batch_size, n_query, -1)

        # Projected queries (n_heads, batch_size, n_query, key_dim)
        # and keys (n_heads, batch_size, graph_size, key_dim)
        Q = torch.matmul(qflat, self.W_query).view(shp_q)
        K = torch.matmul(hflat, self.W_key).view(shp)

        # Calculate compatibility (n_heads, batch_size, n_query, graph_size)
        compatibility_s2n = torch.matmul(Q, K.transpose(2, 3))

        return compatibility_s2n
def forward(self, query, key, value, logit_key, attn_mask=None):
    """Compute attention logits given query, key, value, logit key and attention mask.

    Args:
        query: query tensor of shape [B, ..., L, E]
        key: key tensor of shape [B, ..., S, E]
        value: value tensor of shape [B, ..., S, E]
        logit_key: logit key tensor of shape [B, ..., S, E]
        attn_mask: attention mask tensor of shape [B, ..., S]. Note that `True` means that the value _should_ take part in attention
            as described in the [PyTorch Documentation](https://pytorch.org/docs/stable/generated/torch.nn.functional.scaled_dot_product_attention.html)
    """
    # Inner multi-head attention (no input projections) followed by the output projection
    heads = self._inner_mha(query, key, value, attn_mask)
    glimpse = self.project_out(heads)

    batch_size, num_solutions = glimpse.shape[0], glimpse.shape[1]
    # Tile the k binary vectors until every solution slot has one, then trim the excess
    repeats = math.ceil(num_solutions / self.k)
    z = self.binary_vectors.repeat(repeats, 1)[:num_solutions]
    z = z.unsqueeze(0).expand(batch_size, num_solutions, self.binary_vector_dim)

    # PolyNet layers: residual MLP conditioned on the binary vector
    hidden = F.relu(self.poly_layer_1(torch.cat((glimpse, z), dim=2)))
    glimpse += self.poly_layer_2(hidden)

    # Batch matrix multiplication to compute logits (batch_size, num_steps, graph_size)
    scale = math.sqrt(glimpse.size(-1))
    scores = torch.bmm(glimpse, logit_key.squeeze(-2).transpose(-2, -1))
    logits = scores.squeeze(-2) / scale

    if self.check_nan:
        assert not torch.isnan(logits).any(), "Logits contain NaNs"

    return logits
class EnvContext(nn.Module):
    """Base class for environment context embeddings.

    The context embedding modifies the query embedding of the problem node of
    the current partial solution. It concatenates the current node embedding
    with an environment-specific state embedding and applies a linear projection
    to the embedding space.

    Args:
        embed_dim: output dimension of the projection
        step_context_dim: input dimension of the projection; defaults to `embed_dim`
        linear_bias: whether the projection uses a bias term
    """

    def __init__(self, embed_dim, step_context_dim=None, linear_bias=False):
        super(EnvContext, self).__init__()
        self.embed_dim = embed_dim
        if step_context_dim is None:
            step_context_dim = embed_dim
        self.project_context = nn.Linear(step_context_dim, embed_dim, bias=linear_bias)

    def _cur_node_embedding(self, embeddings, td):
        """Get embedding of current node"""
        return gather_by_index(embeddings, td["current_node"])

    def _state_embedding(self, embeddings, td):
        """Get state embedding"""
        raise NotImplementedError("Implement for each environment")

    def forward(self, embeddings, td):
        """Project the concatenation [current node embedding, state embedding]."""
        parts = [
            self._cur_node_embedding(embeddings, td),
            self._state_embedding(embeddings, td),
        ]
        return self.project_context(torch.cat(parts, -1))
class TSPContext(EnvContext):
    """Context embedding for the Traveling Salesman Problem (TSP).
    Project the following to the embedding space:
        - first node embedding
        - current node embedding
    While the step counter `td["i"]` is below 1, a learned placeholder vector
    is projected instead of gathered node embeddings.
    """

    def __init__(self, embed_dim):
        super(TSPContext, self).__init__(embed_dim, 2 * embed_dim)
        # Stand-in for the (first, current) embedding pair at the initial step
        placeholder = torch.Tensor(2 * self.embed_dim).uniform_(-1, 1)
        self.W_placeholder = nn.Parameter(placeholder)

    def forward(self, embeddings, td):
        batch_size = embeddings.size(0)
        first_node = td["first_node"]
        # Trailing shape used when folding the two gathered embeddings together.
        # By default (1-D `first_node`) there is a single context vector per batch entry.
        if first_node.dim() == 1:
            node_dim = (-1,)
        else:
            node_dim = (first_node.size(-1), -1)

        step = td["i"]
        # Only the very first entry of the step counter is inspected (fast path)
        at_initial_step = step[(0,) * step.dim()].item() < 1

        if not at_initial_step:
            pair_index = torch.stack([first_node, td["current_node"]], -1)
            gathered = gather_by_index(embeddings, pair_index.view(batch_size, -1))
            return self.project_context(gathered.view(batch_size, *node_dim))

        placeholder_dim = self.W_placeholder.size(-1)
        if len(td.batch_size) < 2:
            context_embedding = self.W_placeholder[None, :].expand(
                batch_size, placeholder_dim
            )
        else:
            context_embedding = self.W_placeholder[None, None, :].expand(
                batch_size, td.batch_size[1], placeholder_dim
            )
        return self.project_context(context_embedding)
class PCTSPContext(EnvContext):
    """Context embedding for the Prize Collecting TSP (PCTSP).
    Project the following to the embedding space:
        - current node embedding
        - remaining prize (prize_required - cur_total_prize), floored at zero
    """

    def __init__(self, embed_dim):
        # One extra input feature for the scalar remaining prize
        super(PCTSPContext, self).__init__(embed_dim, embed_dim + 1)

    def _state_embedding(self, embeddings, td):
        remaining_prize = td["prize_required"] - td["cur_total_prize"]
        # Add a trailing feature axis so it can be concatenated with the node embedding
        return remaining_prize.clamp(min=0).unsqueeze(-1)
class DPPContext(EnvContext):
    """Context embedding for the Decap Placement Problem (DPP), EDA (electronic design automation).

    The context is an all-zero vector: it cannot be defined by a single node
    embedding for DPP, and placed items are captured by the dynamic embedding instead.
    """

    def __init__(self, embed_dim):
        super(DPPContext, self).__init__(embed_dim)

    def forward(self, embeddings, td):
        """Return zeros of shape (embeddings.size(0), embed_dim) matching `embeddings`' dtype and device."""
        batch_size = embeddings.size(0)
        return embeddings.new_zeros((batch_size, self.embed_dim))
class SMTWTPContext(EnvContext):
    """Context embedding for the Single Machine Total Weighted Tardiness Problem (SMTWTP).
    Project the following to the embedding space:
        - current node embedding (looked up via `td["current_job"]`)
        - current time
    """

    def __init__(self, embed_dim):
        # One extra input feature for the current time
        super(SMTWTPContext, self).__init__(embed_dim, embed_dim + 1)

    def _cur_node_embedding(self, embeddings, td):
        return gather_by_index(embeddings, td["current_job"])

    def _state_embedding(self, embeddings, td):
        return td["current_time"]
class SchedulingContext(nn.Module):
    """Add a projection of each machine's remaining busy time to its embedding.

    Args:
        embed_dim: dimension of the embeddings the projection is added to
        scaling_factor: divisor applied to the remaining busy time before projection
    """

    def __init__(self, embed_dim: int, scaling_factor: int = 1000):
        super().__init__()
        self.scaling_factor = scaling_factor
        self.proj_busy = nn.Linear(1, embed_dim, bias=False)

    def forward(self, h, td):
        # Time left until each entry of `busy_until`, relative to the current time
        remaining = td["busy_until"] - td["time"][:, None]
        remaining = remaining / self.scaling_factor
        # (b m e)
        return h + self.proj_busy(remaining[..., None])
def env_dynamic_embedding(env_name: str, config: dict) -> nn.Module:
    """Get environment dynamic embedding. The dynamic embedding is used to modify query, key and value vectors of the attention mechanism
    based on the current state of the environment (which is changing during the rollout).

    Environments without an entry in the registry fall back to `StaticEmbedding`
    after a warning is logged.

    Args:
        env_name: Name of the environment.
        config: A dictionary of configuration options, passed as keyword arguments to the embedding class.
    """
    embedding_registry = {
        "tsp": StaticEmbedding,
        "atsp": StaticEmbedding,
        "cvrp": StaticEmbedding,
        "cvrptw": StaticEmbedding,
        "ffsp": StaticEmbedding,
        "svrp": StaticEmbedding,
        "sdvrp": SDVRPDynamicEmbedding,
        "pctsp": StaticEmbedding,
        "spctsp": StaticEmbedding,
        "op": StaticEmbedding,
        "dpp": StaticEmbedding,
        "mdpp": StaticEmbedding,
        "pdp": StaticEmbedding,
        "mtsp": StaticEmbedding,
        "smtwtp": StaticEmbedding,
        "jssp": JSSPDynamicEmbedding,
        "fjsp": JSSPDynamicEmbedding,
        "mtvrp": StaticEmbedding,
    }

    embedding_cls = embedding_registry.get(env_name)
    if embedding_cls is None:
        log.warning(
            f"Unknown environment name '{env_name}'. Available dynamic embeddings: {embedding_registry.keys()}. Defaulting to StaticEmbedding."
        )
        embedding_cls = StaticEmbedding
    return embedding_cls(**config)
class SDVRPDynamicEmbedding(nn.Module):
    """Dynamic embedding for the Split Delivery Vehicle Routing Problem (SDVRP).
    Embed the following node features to the embedding space:
        - demand_with_depot: demand of the customers and the depot
    The projected demand is split into three equal chunks that modify the glimpse key,
    glimpse value and logit key of the attention mechanism during the rollout.
    """

    def __init__(self, embed_dim, linear_bias=False):
        super(SDVRPDynamicEmbedding, self).__init__()
        # A single linear layer produces all three updates at once
        self.projection = nn.Linear(1, 3 * embed_dim, bias=linear_bias)

    def forward(self, td):
        # Work on a copy so the demand stored in `td` is left untouched
        demand = td["demand_with_depot"].unsqueeze(-1).clone()
        # The entry at index 0 of the node axis (the depot) is zeroed before projecting
        demand[..., 0, :] = 0
        projected = self.projection(demand)
        glimpse_key_dynamic, glimpse_val_dynamic, logit_key_dynamic = torch.chunk(
            projected, 3, dim=-1
        )
        return glimpse_key_dynamic, glimpse_val_dynamic, logit_key_dynamic
def env_edge_embedding(env_name: str, config: dict) -> nn.Module:
    """Retrieve the edge embedding module specific to the environment. Edge embeddings are crucial for
    transforming the raw edge features into a format suitable for the neural network, especially in
    graph neural networks where edge features can significantly impact the model's performance.

    Args:
        env_name: Name of the environment.
        config: A dictionary of configuration options, passed as keyword arguments to the embedding class.

    Raises:
        ValueError: if `env_name` has no registered edge embedding.
    """
    embedding_registry = {
        "tsp": TSPEdgeEmbedding,
        "atsp": ATSPEdgeEmbedding,
        "cvrp": TSPEdgeEmbedding,
        "sdvrp": TSPEdgeEmbedding,
        "pctsp": TSPEdgeEmbedding,
        "spctsp": TSPEdgeEmbedding,
        "op": TSPEdgeEmbedding,
        "dpp": TSPEdgeEmbedding,
        "mdpp": TSPEdgeEmbedding,
        "pdp": TSPEdgeEmbedding,
        "mtsp": TSPEdgeEmbedding,
        "smtwtp": NoEdgeEmbedding,
    }

    if env_name not in embedding_registry:
        # The message used to say "init embeddings", which pointed at the wrong registry
        raise ValueError(
            f"Unknown environment name '{env_name}'. Available edge embeddings: {embedding_registry.keys()}"
        )

    return embedding_registry[env_name](**config)
class NoEdgeEmbedding(nn.Module):
    """A module for environments that do not require edge embeddings, or where edge features
    are not used. Every graph gets the full edge index and all-zero edge attributes.

    Args:
        embed_dim: width of the zero edge attributes
        self_loop: whether the full edge index includes self loops
        **kwargs: accepted and ignored
    """

    def __init__(self, embed_dim, self_loop=False, **kwargs):
        assert Batch is not None, (
            "torch_geometric not found. Please install torch_geometric using instructions from "
            "https://pytorch-geometric.readthedocs.io/en/latest/install/installation.html."
        )

        super(NoEdgeEmbedding, self).__init__()
        self.embed_dim = embed_dim
        self.self_loop = self_loop

    def forward(self, td, init_embeddings: Tensor):
        device = init_embeddings.device
        num_nodes = init_embeddings.shape[1]
        # One edge index shared by every graph in the batch
        edge_index = get_full_graph_edge_index(num_nodes, self_loop=self.self_loop).to(
            device
        )
        num_edges = edge_index.shape[1]

        # Each graph receives its own freshly allocated zero edge attributes
        graphs = [
            Data(
                x=node_embed,
                edge_index=edge_index,
                edge_attr=torch.zeros((num_edges, self.embed_dim), device=device),
            )
            for node_embed in init_embeddings
        ]
        return Batch.from_data_list(graphs)
class MatNetInitEmbedding(nn.Module):
    """
    Preparing the initial row and column embeddings for MatNet.

    Reference:
    https://github.com/yd-kwon/MatNet/blob/782698b60979effe2e7b61283cca155b7cdb727f/ATSP/ATSP_MatNet/ATSPModel.py#L51

    Args:
        embed_dim: size of the last dimension of the row and column embeddings
        mode: "RandomOneHot" gives every column a one-hot vector at a random,
            per-instance distinct position; "Random" fills the column
            embeddings with uniform random values
    """

    def __init__(self, embed_dim: int, mode: str = "RandomOneHot") -> None:
        super().__init__()

        self.embed_dim = embed_dim
        assert mode in {
            "RandomOneHot",
            "Random",
        }, "mode must be one of ['RandomOneHot', 'Random']"
        self.mode = mode

    def forward(self, td: "TensorDict"):
        """Build the embeddings for the cost matrix stored under `td["cost_matrix"]`.

        Returns:
            Tuple `(row_emb, col_emb, dmat)`: zero row embeddings of shape
            [b, r, embed_dim], column embeddings of shape [b, c, embed_dim] and
            the unchanged cost matrix.

        Raises:
            ValueError: in "RandomOneHot" mode when there are more columns than
                `embed_dim`, since distinct one-hot positions would not fit.
        """
        dmat = td["cost_matrix"]
        b, r, c = dmat.shape
        device = dmat.device

        row_emb = torch.zeros(b, r, self.embed_dim, device=device)

        if self.mode == "RandomOneHot":
            # MatNet uses one-hot encoding for column embeddings
            # https://github.com/yd-kwon/MatNet/blob/782698b60979effe2e7b61283cca155b7cdb727f/ATSP/ATSP_MatNet/ATSPModel.py#L60
            if c > self.embed_dim:
                # Positions range over [0, c); fail clearly instead of indexing out of bounds
                raise ValueError(
                    f"RandomOneHot mode needs embed_dim >= number of columns, got embed_dim={self.embed_dim} and {c} columns"
                )
            col_emb = torch.zeros(b, c, self.embed_dim, device=device)
            # Random permutation of 0..c-1 per instance, created on the same device
            # as the embeddings so no CPU index tensors are involved.
            rand_idx = torch.rand(b, c, device=device).argsort(dim=1)
            col_emb.scatter_(2, rand_idx.unsqueeze(-1), 1.0)

        elif self.mode == "Random":
            col_emb = torch.rand(b, c, self.embed_dim, device=device)
        else:
            raise NotImplementedError

        return row_emb, col_emb, dmat
+ Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (depot and customers separately) + - demand: demand of the customers + """ + + def __init__(self, embed_dim, linear_bias=True, node_dim: int = 3): + super(VRPInitEmbedding, self).__init__() + node_dim = node_dim # 3: x, y, demand + self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) + self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias) # depot embedding + + def forward(self, td): + # [batch, 1, 2]-> [batch, 1, embed_dim] + depot, cities = td["locs"][:, :1, :], td["locs"][:, 1:, :] + depot_embedding = self.init_embed_depot(depot) + # [batch, n_city, 2, batch, n_city, 1] -> [batch, n_city, embed_dim] + node_embeddings = self.init_embed( + torch.cat((cities, td["demand"][..., None]), -1) + ) + # [batch, n_city+1, embed_dim] + out = torch.cat((depot_embedding, node_embeddings), -2) + return out + + +class VRPTWInitEmbedding(VRPInitEmbedding): + def __init__(self, embed_dim, linear_bias=True, node_dim: int = 6): + # node_dim = 6: x, y, demand, tw start, tw end, service time + super(VRPTWInitEmbedding, self).__init__(embed_dim, linear_bias, node_dim) + + def forward(self, td): + depot, cities = td["locs"][:, :1, :], td["locs"][:, 1:, :] + durations = td["durations"][..., 1:] + time_windows = td["time_windows"][..., 1:, :] + # embeddings + depot_embedding = self.init_embed_depot(depot) + node_embeddings = self.init_embed( + torch.cat( + (cities, td["demand"][..., None], time_windows, durations[..., None]), -1 + ) + ) + return torch.cat((depot_embedding, node_embeddings), -2) + + +class SVRPInitEmbedding(nn.Module): + def __init__(self, embed_dim, linear_bias=True, node_dim: int = 3): + super(SVRPInitEmbedding, self).__init__() + node_dim = node_dim # 3: x, y, skill + self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) + self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias) # depot embedding + + def forward(self, td): + # [batch, 1, 2]-> 
[batch, 1, embed_dim] + depot, cities = td["locs"][:, :1, :], td["locs"][:, 1:, :] + depot_embedding = self.init_embed_depot(depot) + # [batch, n_city, 2, batch, n_city, 1] -> [batch, n_city, embed_dim] + node_embeddings = self.init_embed(torch.cat((cities, td["skills"]), -1)) + # [batch, n_city+1, embed_dim] + out = torch.cat((depot_embedding, node_embeddings), -2) + return out + + +class PCTSPInitEmbedding(nn.Module): + """Initial embedding for the Prize Collecting Traveling Salesman Problems (PCTSP). + Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (depot and customers separately) + - expected_prize: expected prize for visiting the customers. + In PCTSP, this is the actual prize. In SPCTSP, this is the expected prize. + - penalty: penalty for not visiting the customers + """ + + def __init__(self, embed_dim, linear_bias=True): + super(PCTSPInitEmbedding, self).__init__() + node_dim = 4 # x, y, prize, penalty + self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) + self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias) + + def forward(self, td): + depot, cities = td["locs"][:, :1, :], td["locs"][:, 1:, :] + depot_embedding = self.init_embed_depot(depot) + node_embeddings = self.init_embed( + torch.cat( + ( + cities, + td["expected_prize"][..., None], + td["penalty"][..., 1:, None], + ), + -1, + ) + ) + # batch, n_city+1, embed_dim + out = torch.cat((depot_embedding, node_embeddings), -2) + return out + + +class OPInitEmbedding(nn.Module): + """Initial embedding for the Orienteering Problems (OP). 
+ Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (depot and customers separately) + - prize: prize for visiting the customers + """ + + def __init__(self, embed_dim, linear_bias=True): + super(OPInitEmbedding, self).__init__() + node_dim = 3 # x, y, prize + self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) + self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias) # depot embedding + + def forward(self, td): + depot, cities = td["locs"][:, :1, :], td["locs"][:, 1:, :] + depot_embedding = self.init_embed_depot(depot) + node_embeddings = self.init_embed( + torch.cat( + ( + cities, + td["prize"][..., 1:, None], # exclude depot + ), + -1, + ) + ) + out = torch.cat((depot_embedding, node_embeddings), -2) + return out + + +class DPPInitEmbedding(nn.Module): + """Initial embedding for the Decap Placement Problem (DPP), EDA (electronic design automation). + Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (cells) + - probe: index of the (single) probe cell. We embed the euclidean distance from the probe to all cells. 
+ """ + + def __init__(self, embed_dim, linear_bias=True): + super(DPPInitEmbedding, self).__init__() + node_dim = 2 # x, y + self.init_embed = nn.Linear(node_dim, embed_dim // 2, linear_bias) # locs + self.init_embed_probe = nn.Linear(1, embed_dim // 2, linear_bias) # probe + + def forward(self, td): + node_embeddings = self.init_embed(td["locs"]) + probe_embedding = self.init_embed_probe( + self._distance_probe(td["locs"], td["probe"]) + ) + return torch.cat([node_embeddings, probe_embedding], -1) + + def _distance_probe(self, locs, probe): + # Euclidean distance from probe to all locations + probe_loc = torch.gather(locs, 1, probe.unsqueeze(-1).expand(-1, -1, 2)) + return torch.norm(locs - probe_loc, dim=-1).unsqueeze(-1) + + +class MDPPInitEmbedding(nn.Module): + """Initial embedding for the Multi-port Placement Problem (MDPP), EDA (electronic design automation). + Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (cells) + - probe: indexes of the probe cells (multiple). We embed the euclidean distance of each cell to the closest probe. 
+ """ + + def __init__(self, embed_dim, linear_bias=True): + super(MDPPInitEmbedding, self).__init__() + node_dim = 2 # x, y + self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) # locs + self.init_embed_probe_distance = nn.Linear( + 1, embed_dim, linear_bias + ) # probe_distance + self.project_out = nn.Linear(embed_dim * 2, embed_dim, linear_bias) + + def forward(self, td): + probes = td["probe"] + locs = td["locs"] + node_embeddings = self.init_embed(locs) + + # Get the shortest distance from any probe + dist = torch.cdist(locs, locs, p=2) + dist[~probes] = float("inf") + min_dist, _ = torch.min(dist, dim=1) + min_probe_dist_embedding = self.init_embed_probe_distance(min_dist[..., None]) + + return self.project_out( + torch.cat([node_embeddings, min_probe_dist_embedding], -1) + ) + + +class PDPInitEmbedding(nn.Module): + """Initial embedding for the Pickup and Delivery Problem (PDP). + Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (depot, pickups and deliveries separately) + Note that pickups and deliveries are interleaved in the input. 
+ """ + + def __init__(self, embed_dim, linear_bias=True): + super(PDPInitEmbedding, self).__init__() + node_dim = 2 # x, y + self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias) + self.init_embed_pick = nn.Linear(node_dim * 2, embed_dim, linear_bias) + self.init_embed_delivery = nn.Linear(node_dim, embed_dim, linear_bias) + + def forward(self, td): + depot, locs = td["locs"][..., 0:1, :], td["locs"][..., 1:, :] + num_locs = locs.size(-2) + pick_feats = torch.cat( + [locs[:, : num_locs // 2, :], locs[:, num_locs // 2 :, :]], -1 + ) # [batch_size, graph_size//2, 4] + delivery_feats = locs[:, num_locs // 2 :, :] # [batch_size, graph_size//2, 2] + depot_embeddings = self.init_embed_depot(depot) + pick_embeddings = self.init_embed_pick(pick_feats) + delivery_embeddings = self.init_embed_delivery(delivery_feats) + # concatenate on graph size dimension + return torch.cat([depot_embeddings, pick_embeddings, delivery_embeddings], -2) + + +class MTSPInitEmbedding(nn.Module): + """Initial embedding for the Multiple Traveling Salesman Problem (mTSP). + Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (depot, cities) + """ + + def __init__(self, embed_dim, linear_bias=True): + """NOTE: new made by Fede. May need to be checked""" + super(MTSPInitEmbedding, self).__init__() + node_dim = 2 # x, y + self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) + self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias) # depot embedding + + def forward(self, td): + depot_embedding = self.init_embed_depot(td["locs"][..., 0:1, :]) + node_embedding = self.init_embed(td["locs"][..., 1:, :]) + return torch.cat([depot_embedding, node_embedding], -2) + + +class SMTWTPInitEmbedding(nn.Module): + """Initial embedding for the Single Machine Total Weighted Tardiness Problem (SMTWTP). 
+ Embed the following node features to the embedding space: + - job_due_time: due time of the jobs + - job_weight: weights of the jobs + - job_process_time: the processing time of jobs + """ + + def __init__(self, embed_dim, linear_bias=True): + super(SMTWTPInitEmbedding, self).__init__() + node_dim = 3 # job_due_time, job_weight, job_process_time + self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) + + def forward(self, td): + job_due_time = td["job_due_time"] + job_weight = td["job_weight"] + job_process_time = td["job_process_time"] + feat = torch.stack((job_due_time, job_weight, job_process_time), dim=-1) + out = self.init_embed(feat) + return out + + +class MDCPDPInitEmbedding(nn.Module): + """Initial embedding for the MDCPDP environment + Embed the following node features to the embedding space: + - locs: x, y coordinates of the nodes (depot, pickups and deliveries separately) + Note that pickups and deliveries are interleaved in the input. + """ + + def __init__(self, embed_dim, linear_bias=True): + super(MDCPDPInitEmbedding, self).__init__() + node_dim = 2 # x, y + self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias) + self.init_embed_pick = nn.Linear(node_dim * 2, embed_dim, linear_bias) + self.init_embed_delivery = nn.Linear(node_dim, embed_dim, linear_bias) + + def forward(self, td): + num_depots = td["capacity"].size(-1) + depot, locs = td["locs"][..., 0:num_depots, :], td["locs"][..., num_depots:, :] + num_locs = locs.size(-2) + pick_feats = torch.cat( + [locs[:, : num_locs // 2, :], locs[:, num_locs // 2 :, :]], -1 + ) # [batch_size, graph_size//2, 4] + delivery_feats = locs[:, num_locs // 2 :, :] # [batch_size, graph_size//2, 2] + depot_embeddings = self.init_embed_depot(depot) + pick_embeddings = self.init_embed_pick(pick_feats) + delivery_embeddings = self.init_embed_delivery(delivery_feats) + # concatenate on graph size dimension + return torch.cat([depot_embeddings, pick_embeddings, delivery_embeddings], -2) + + +class 
JSSPInitEmbedding(nn.Module): + def __init__( + self, + embed_dim, + linear_bias: bool = True, + scaling_factor: int = 1000, + num_op_feats=5, + ): + super(JSSPInitEmbedding, self).__init__() + self.embed_dim = embed_dim + self.scaling_factor = scaling_factor + self.init_ops_embed = nn.Linear(num_op_feats, embed_dim, linear_bias) + self.pos_encoder = PositionalEncoding(embed_dim, dropout=0.0) + + def _op_features(self, td): + proc_times = td["proc_times"] + mean_durations = proc_times.sum(1) / (proc_times.gt(0).sum(1) + 1e-9) + feats = [ + mean_durations / self.scaling_factor, + # td["lbs"] / self.scaling_factor, + td["is_ready"], + td["num_eligible"], + td["ops_job_map"], + td["op_scheduled"], + ] + return torch.stack(feats, dim=-1) + + def _init_ops_embed(self, td: TensorDict): + ops_feat = self._op_features(td) + ops_emb = self.init_ops_embed(ops_feat) + ops_emb = self.pos_encoder(ops_emb, td["ops_sequence_order"]) + + # zero out padded and finished ops + mask = td["pad_mask"] # NOTE dont mask scheduled - leads to instable training + ops_emb[mask.unsqueeze(-1).expand_as(ops_emb)] = 0 + return ops_emb + + def forward(self, td): + return self._init_ops_embed(td) + + +class FJSPInitEmbedding(JSSPInitEmbedding): + def __init__(self, embed_dim, linear_bias=False, scaling_factor: int = 100): + super().__init__(embed_dim, linear_bias, scaling_factor) + self.init_ma_embed = nn.Linear(1, self.embed_dim, bias=linear_bias) + self.edge_embed = nn.Linear(1, embed_dim, bias=linear_bias) + + def forward(self, td: TensorDict): + ops_emb = self._init_ops_embed(td) + ma_emb = self._init_machine_embed(td) + edge_emb = self._init_edge_embed(td) + # get edges between operations and machines + # (bs, ops, ma) + edges = td["ops_ma_adj"].transpose(1, 2) + return ops_emb, ma_emb, edge_emb, edges + + def _init_edge_embed(self, td: TensorDict): + proc_times = td["proc_times"].transpose(1, 2) / self.scaling_factor + edge_embed = self.edge_embed(proc_times.unsqueeze(-1)) + return edge_embed 
+ + def _init_machine_embed(self, td: TensorDict): + busy_for = (td["busy_until"] - td["time"].unsqueeze(1)) / self.scaling_factor + ma_embeddings = self.init_ma_embed(busy_for.unsqueeze(2)) + return ma_embeddings + + +class FJSPMatNetInitEmbedding(JSSPInitEmbedding): + def __init__( + self, + embed_dim, + linear_bias: bool = False, + scaling_factor: int = 1000, + ): + super().__init__(embed_dim, linear_bias, scaling_factor) + self.init_ma_embed = nn.Linear(1, self.embed_dim, bias=linear_bias) + + def _init_machine_embed(self, td: TensorDict): + busy_for = (td["busy_until"] - td["time"].unsqueeze(1)) / self.scaling_factor + ma_embeddings = self.init_ma_embed(busy_for.unsqueeze(2)) + return ma_embeddings + + def forward(self, td: TensorDict): + proc_times = td["proc_times"] + ops_emb = self._init_ops_embed(td) + # encoding machines + ma_emb = self._init_machine_embed(td) + # edgeweights for matnet + matnet_edge_weights = proc_times.transpose(1, 2) / self.scaling_factor + return ops_emb, ma_emb, matnet_edge_weights + + +class MTVRPInitEmbedding(VRPInitEmbedding): + def __init__(self, embed_dim, linear_bias=True, node_dim: int = 7): + # node_dim = 7: x, y, demand_linehaul, demand_backhaul, tw start, tw end, service time + super(MTVRPInitEmbedding, self).__init__(embed_dim, linear_bias, node_dim) + + def forward(self, td): + depot, cities = td["locs"][:, :1, :], td["locs"][:, 1:, :] + demand_linehaul, demand_backhaul = ( + td["demand_linehaul"][..., 1:], + td["demand_backhaul"][..., 1:], + ) + service_time = td["service_time"][..., 1:] + time_windows = td["time_windows"][..., 1:, :] + # [!] 
convert [0, inf] -> [0, 0] if a problem does not include the time window constraint, do not modify in-place + time_windows = torch.nan_to_num(time_windows, posinf=0.0) + # embeddings + depot_embedding = self.init_embed_depot(depot) + node_embeddings = self.init_embed( + torch.cat( + ( + cities, + demand_linehaul[..., None], + demand_backhaul[..., None], + time_windows, + service_time[..., None], + ), + -1, + ) + ) + return torch.cat((depot_embedding, node_embeddings), -2) diff --git a/rl4co/models/nn/flash_attention.py b/rl4co/models/nn/flash_attention.py new file mode 100644 index 00000000..28dff562 --- /dev/null +++ b/rl4co/models/nn/flash_attention.py @@ -0,0 +1,64 @@ +import torch + +try: + # from fla.ops.linear_attn.chunk_fuse import fused_chunk_linear_attn + from fla.ops.linear_attn.chunk import chunk_linear_attn as fused_chunk_linear_attn +except ImportError: + fused_chunk_linear_attn = None + +try: + from flash_attn import flash_attn_func +except ImportError: + flash_attn_func = None + + +def fused_chunk_linear_attn_wrapper( + q: torch.Tensor, + k: torch.Tensor, + v: torch.Tensor, + scale: float = -1, + initial_state: torch.Tensor = None, + output_final_state: bool = False, + normalize: bool = True, + **kwargs, +): + assert ( + fused_chunk_linear_attn is not None + ), "fused_chunk_linear_attn not found. Install Flash Linear Attention using instructions from https://github.com/sustcsonglin/flash-linear-attention" + assert ( + kwargs.get("attn_mask", None) is None + ), "attn_mask is not supported in Flash Linear Attention" + return fused_chunk_linear_attn( + q, k, v, scale, initial_state, output_final_state, normalize + )[0] + + +def scaled_dot_product_attention_flash_attn( + q, k, v, attn_mask=None, dropout_p=0.0, is_causal=False +): + """ + Flash Attention 2 wrapper (https://github.com/Dao-AILab/flash-attention) around `flash_attn_func` to obtain the same behavior as + `torch.nn.functional.scaled_dot_product_attention`. 
+ We need to permute the query, key, and value tensors before calling the scaled dot product attention function + Reference: https://github.com/Dao-AILab/flash-attention/issues/383 + + Note: + Flash Attention does not support masking except for causal masking. + + Args: + q (torch.Tensor): Query tensor of shape `(batch_size, num_heads, seq_len_q, head_dim)` + k (torch.Tensor): Key tensor of shape `(batch_size, num_heads, seq_len_k, head_dim)` + v (torch.Tensor): Value tensor of shape `(batch_size, num_heads, seq_len_v, head_dim)` + attn_mask (torch.Tensor): Attention mask of shape `(batch_size, seq_len_q, seq_len_k)` + dropout_p (float): Dropout probability + is_causal (bool): Whether to apply causal mask to attention scores + """ + assert attn_mask is None, "`attn_mask` is not supported in Flash Attention" + assert flash_attn_func is not None, ( + "Flash Attention not found. Install Flash Attention using instructions from " + "https://github.com/Dao-AILab/flash-attention . " + "Alternatively, use `torch.nn.functional.scaled_dot_product_attention` available from PyTorch 2.0.0" + ) + q, k, v = q.transpose(-2, -3), k.transpose(-2, -3), v.transpose(-2, -3) + out = flash_attn_func(q, k, v, dropout_p=dropout_p, causal=is_causal) + return out.transpose(-2, -3) diff --git a/rl4co/models/nn/graph/__init__.py b/rl4co/models/nn/graph/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/models/nn/graph/attnnet.py b/rl4co/models/nn/graph/attnnet.py new file mode 100644 index 00000000..9bfc29c6 --- /dev/null +++ b/rl4co/models/nn/graph/attnnet.py @@ -0,0 +1,103 @@ +from typing import Callable, Optional + +import torch.nn as nn + +from torch import Tensor + +from rl4co.models.nn.mlp import MLP +from rl4co.models.nn.moe import MoE +from rl4co.models.nn.attention import MultiHeadAttention +from rl4co.models.nn.ops import Normalization, SkipConnection +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class 
MultiHeadAttentionLayer(nn.Sequential): + """Multi-Head Attention Layer with normalization and feed-forward layer + + Args: + embed_dim: dimension of the embeddings + num_heads: number of heads in the MHA + feedforward_hidden: dimension of the hidden layer in the feed-forward layer + normalization: type of normalization to use (batch, layer, none) + sdpa_fn: scaled dot product attention function (SDPA) + moe_kwargs: Keyword arguments for MoE + """ + + def __init__( + self, + embed_dim: int, + num_heads: int = 8, + feedforward_hidden: int = 512, + normalization: Optional[str] = "batch", + bias: bool = True, + sdpa_fn: Optional[Callable] = None, + moe_kwargs: Optional[dict] = None, + ): + num_neurons = [feedforward_hidden] if feedforward_hidden > 0 else [] + if moe_kwargs is not None: + ffn = MoE(embed_dim, embed_dim, num_neurons=num_neurons, **moe_kwargs) + else: + ffn = MLP(input_dim=embed_dim, output_dim=embed_dim, num_neurons=num_neurons, hidden_act="ReLU") + + super(MultiHeadAttentionLayer, self).__init__( + SkipConnection( + MultiHeadAttention(embed_dim, num_heads, bias=bias, sdpa_fn=sdpa_fn) + ), + Normalization(embed_dim, normalization), + SkipConnection(ffn), + Normalization(embed_dim, normalization), + ) + + +class GraphAttentionNetwork(nn.Module): + """Graph Attention Network to encode embeddings with a series of MHA layers consisting of a MHA layer, + normalization, feed-forward layer, and normalization. Similar to Transformer encoder, as used in Kool et al. (2019). 
+ + Args: + num_heads: number of heads in the MHA + embed_dim: dimension of the embeddings + num_layers: number of MHA layers + normalization: type of normalization to use (batch, layer, none) + feedforward_hidden: dimension of the hidden layer in the feed-forward layer + sdpa_fn: scaled dot product attention function (SDPA) + moe_kwargs: Keyword arguments for MoE + """ + + def __init__( + self, + num_heads: int, + embed_dim: int, + num_layers: int, + normalization: str = "batch", + feedforward_hidden: int = 512, + sdpa_fn: Optional[Callable] = None, + moe_kwargs: Optional[dict] = None, + ): + super(GraphAttentionNetwork, self).__init__() + + self.layers = nn.Sequential( + *( + MultiHeadAttentionLayer( + embed_dim, + num_heads, + feedforward_hidden=feedforward_hidden, + normalization=normalization, + sdpa_fn=sdpa_fn, + moe_kwargs=moe_kwargs, + ) + for _ in range(num_layers) + ) + ) + + def forward(self, x: Tensor, mask: Optional[Tensor] = None) -> Tensor: + """Forward pass of the encoder + + Args: + x: [batch_size, graph_size, embed_dim] initial embeddings to process + mask: [batch_size, graph_size, graph_size] mask for the input embeddings. Unused for now. + """ + assert mask is None, "Mask not yet supported!" 
+ h = self.layers(x) + return h diff --git a/rl4co/models/nn/graph/gcn.py b/rl4co/models/nn/graph/gcn.py new file mode 100644 index 00000000..348c6b21 --- /dev/null +++ b/rl4co/models/nn/graph/gcn.py @@ -0,0 +1,114 @@ +from typing import Callable, Tuple, Union + +import torch.nn as nn +import torch.nn.functional as F + +from tensordict import TensorDict +from torch import Tensor + +try: + from torch_geometric.nn import GCNConv +except ImportError: + GCNConv = None +from rl4co.models.nn.env_embeddings import env_init_embedding +from rl4co.utils.ops import get_full_graph_edge_index +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +EdgeIndexFnSignature = Callable[[TensorDict, int], Tensor] + + +def edge_idx_fn_wrapper(td: TensorDict, num_nodes: int): + # self-loop is added by GCNConv layer + return get_full_graph_edge_index(num_nodes, self_loop=False).to(td.device) + + +class GCNEncoder(nn.Module): + """Graph Convolutional Network to encode embeddings with a series of GCN + layers from the pytorch geometric package + + Args: + embed_dim: dimension of the embeddings + num_nodes: number of nodes in the graph + num_gcn_layer: number of GCN layers + self_loop: whether to add self loop in the graph + residual: whether to use residual connection + """ + + def __init__( + self, + env_name: str, + embed_dim: int, + num_layers: int, + init_embedding: nn.Module = None, + residual: bool = True, + edge_idx_fn: EdgeIndexFnSignature = None, + dropout: float = 0.5, + bias: bool = True, + ): + super().__init__() + + self.env_name = env_name + self.embed_dim = embed_dim + self.residual = residual + self.dropout = dropout + + self.init_embedding = ( + env_init_embedding(self.env_name, {"embed_dim": embed_dim}) + if init_embedding is None + else init_embedding + ) + + if edge_idx_fn is None: + log.warning("No edge indices passed. 
Assume a fully connected graph") + edge_idx_fn = edge_idx_fn_wrapper + + self.edge_idx_fn = edge_idx_fn + + # Define the GCN layers + self.gcn_layers = nn.ModuleList( + [GCNConv(embed_dim, embed_dim, bias=bias) for _ in range(num_layers)] + ) + + def forward( + self, td: TensorDict, mask: Union[Tensor, None] = None + ) -> Tuple[Tensor, Tensor]: + """Forward pass of the encoder. + Transform the input TensorDict into a latent representation. + + Args: + td: Input TensorDict containing the environment state + mask: Mask to apply to the attention + + Returns: + h: Latent representation of the input + init_h: Initial embedding of the input + """ + # Transfer to embedding space + init_h = self.init_embedding(td) + bs, num_nodes, emb_dim = init_h.shape + # (bs*num_nodes, emb_dim) + update_node_feature = init_h.reshape(-1, emb_dim) + # shape=(2, num_edges) + edge_index = self.edge_idx_fn(td, num_nodes) + + for layer in self.gcn_layers[:-1]: + update_node_feature = layer(update_node_feature, edge_index) + update_node_feature = F.relu(update_node_feature) + update_node_feature = F.dropout( + update_node_feature, training=self.training, p=self.dropout + ) + + # last layer without relu activation and dropout + update_node_feature = self.gcn_layers[-1](update_node_feature, edge_index) + + # De-batch the graph + update_node_feature = update_node_feature.view(bs, num_nodes, emb_dim) + + # Residual + if self.residual: + update_node_feature = update_node_feature + init_h + + return update_node_feature, init_h diff --git a/rl4co/models/nn/graph/gnn.py b/rl4co/models/nn/graph/gnn.py new file mode 100644 index 00000000..91e84ffe --- /dev/null +++ b/rl4co/models/nn/graph/gnn.py @@ -0,0 +1,99 @@ +import torch +import torch.nn as nn + +try: + import torch_geometric.nn as gnn +except ImportError: + gnn = None + +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class GNNLayer(nn.Module): + """Graph Neural Network Layer for processing graph structures. 
+ + Args: + units: The number of units in each linear transformation layer. + act_fn: The name of the activation function to use after each linear layer. Defaults to 'silu'. + agg_fn: The name of the global aggregation function to use for pooling features across the graph. Defaults to 'mean'. + """ + + def __init__(self, units: int, act_fn: str = "silu", agg_fn: str = "mean"): + assert gnn is not None, ( + "torch_geometric not found. Please install torch_geometric using instructions from " + "https://pytorch-geometric.readthedocs.io/en/latest/install/installation.html." + ) + + super(GNNLayer, self).__init__() + self.units = units + self.act_fn = getattr(nn.functional, act_fn) + self.agg_fn = getattr(gnn, f"global_{agg_fn}_pool") + + # Vertex updates + self.v_lin1 = nn.Linear(units, units) + self.v_lin2 = nn.Linear(units, units) + self.v_lin3 = nn.Linear(units, units) + self.v_lin4 = nn.Linear(units, units) + self.v_bn = gnn.BatchNorm(units) + + # Edge updates + self.e_lin = nn.Linear(units, units) + self.e_bn = gnn.BatchNorm(units) + + def forward(self, x, edge_index, edge_attr): + x0 = x + w0 = w = edge_attr + + # Vertex updates + x1 = self.v_lin1(x0) + x2 = self.v_lin2(x0) + x3 = self.v_lin3(x0) + x4 = self.v_lin4(x0) + x = x0 + self.act_fn( + self.v_bn( + x1 + self.agg_fn(torch.sigmoid(w0) * x2[edge_index[1]], edge_index[0]) + ) + ) + + # Edge updates + w1 = self.e_lin(w0) + w = w0 + self.act_fn(self.e_bn(w1 + x3[edge_index[0]] + x4[edge_index[1]])) + return x, w + + +class GNNEncoder(nn.Module): + """Anisotropic Graph Neural Network encoder with edge-gating mechanism as in Joshi et al. (2022) + + Args: + num_layers: The number of GNN layers to stack in the network. + embed_dim: The dimensionality of the embeddings for each node in the graph. + act_fn: The activation function to use in each GNNLayer, see https://pytorch.org/docs/stable/nn.functional.html#non-linear-activation-functions for available options. Defaults to 'silu'. 
+ agg_fn: The aggregation function to use in each GNNLayer for pooling features. Options: 'add', 'mean', 'max'. Defaults to 'mean'. + """ + + def __init__(self, num_layers: int, embed_dim: int, act_fn="silu", agg_fn="mean"): + super(GNNEncoder, self).__init__() + self.act_fn = getattr(nn.functional, act_fn) + self.agg_fn = agg_fn + + # Stack of GNN layers + self.layers = nn.ModuleList( + [GNNLayer(embed_dim, act_fn, agg_fn) for _ in range(num_layers)] + ) + + def forward(self, x, edge_index, w): + """Sequentially passes the input graph data through the stacked GNN layers, + applying specified transformations and aggregations to learn graph representations. + + Args: + x: The node features of the graph with shape [num_nodes, embed_dim]. + edge_index: The edge indices of the graph with shape [2, num_edges]. + w: The edge attributes or weights with shape [num_edges, embed_dim]. + """ + x = self.act_fn(x) + w = self.act_fn(w) + for layer in self.layers: + x, w = layer(x, edge_index, w) + return x, w diff --git a/rl4co/models/nn/graph/hgnn.py b/rl4co/models/nn/graph/hgnn.py new file mode 100644 index 00000000..bd4ce0d2 --- /dev/null +++ b/rl4co/models/nn/graph/hgnn.py @@ -0,0 +1,133 @@ +import math + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from einops import einsum +from torch import Tensor + +from rl4co.models.nn.env_embeddings import env_init_embedding +from rl4co.models.nn.ops import TransformerFFN + + +class HetGNNLayer(nn.Module): + def __init__( + self, + embed_dim: int, + ) -> None: + super().__init__() + + self.self_attn = nn.Parameter(torch.rand(size=(embed_dim, 1), dtype=torch.float)) + self.cross_attn = nn.Parameter(torch.rand(size=(embed_dim, 1), dtype=torch.float)) + self.edge_attn = nn.Parameter(torch.rand(size=(embed_dim, 1), dtype=torch.float)) + self.activation = nn.ReLU() + self.scale = 1 / math.sqrt(embed_dim) + + def forward( + self, self_emb: Tensor, other_emb: Tensor, edge_emb: Tensor, edges: Tensor + ): + bs, 
n_rows, _ = self_emb.shape + + # concat operation embeddings and o-m edge features (proc times) + # Calculate attention coefficients + er = einsum(self_emb, self.self_attn, "b m e, e one -> b m") * self.scale + ec = einsum(other_emb, self.cross_attn, "b o e, e one -> b o") * self.scale + ee = einsum(edge_emb, self.edge_attn, "b m o e, e one -> b m o") * self.scale + + # element wise multiplication similar to broadcast column logits over rows with masking + ec_expanded = einsum(edges, ec, "b m o, b o -> b m o") + # element wise multiplication similar to broadcast row logits over cols with masking + er_expanded = einsum(edges, er, "b m o, b m -> b m o") + + # adding the projections of different node types and edges together (equivalent to first concat and then project) + # (bs, n_rows, n_cols) + cross_logits = self.activation(ec_expanded + ee + er_expanded) + + # (bs, n_rows, 1) + self_logits = self.activation(er + er).unsqueeze(-1) + + # (bs, n_ma, n_ops + 1) + mask = torch.cat( + ( + edges == 1, + torch.full( + size=(bs, n_rows, 1), + dtype=torch.bool, + fill_value=True, + device=edges.device, + ), + ), + dim=-1, + ) + + # (bs, n_ma, n_ops + 1) + all_logits = torch.cat((cross_logits, self_logits), dim=-1) + all_logits[~mask] = -torch.inf + attn_scores = F.softmax(all_logits, dim=-1) + # (bs, n_ma, n_ops) + cross_attn_scores = attn_scores[..., :-1] + # (bs, n_ma, 1) + self_attn_scores = attn_scores[..., -1].unsqueeze(-1) + + # augment column embeddings with edge features, (bs, r, c, e) + other_emb_aug = edge_emb + other_emb.unsqueeze(-3) + cross_emb = einsum(cross_attn_scores, other_emb_aug, "b m o, b m o e -> b m e") + self_emb = self_emb * self_attn_scores + # (bs, n_ma, emb_dim) + hidden = cross_emb + self_emb + return hidden + + +class HetGNNBlock(nn.Module): + def __init__(self, embed_dim, normalization: str = "batch") -> None: + super().__init__() + self.hgnn1 = HetGNNLayer(embed_dim) + self.hgnn2 = HetGNNLayer(embed_dim) + self.ffn1 = 
class HetGNNEncoder(nn.Module):
    """Stack of ``HetGNNBlock`` layers applied after an initial embedding.

    Args:
        embed_dim: embedding size passed to the init embedding and each block.
        num_layers: number of ``HetGNNBlock`` layers.
        normalization: normalization name forwarded to each block.
        init_embedding: module mapping ``td`` to
            ``(row_emb, col_emb, edge_emb, edges)``. When ``None`` it is built
            with ``env_init_embedding(env_name, init_embedding_kwargs)``.
        env_name: environment name used to build the default init embedding.
        **init_embedding_kwargs: extra options for the default init embedding.
    """

    def __init__(
        self,
        embed_dim: int,
        num_layers: int = 2,
        normalization: str = "batch",
        init_embedding=None,
        env_name: str = "fjsp",
        **init_embedding_kwargs,
    ) -> None:
        super().__init__()

        if init_embedding is None:
            # The default embedding always uses the encoder's embed_dim.
            init_embedding_kwargs.update(embed_dim=embed_dim)
            init_embedding = env_init_embedding(env_name, init_embedding_kwargs)
        self.init_embedding = init_embedding

        self.num_layers = num_layers
        blocks = []
        for _ in range(num_layers):
            blocks.append(HetGNNBlock(embed_dim, normalization))
        self.layers = nn.ModuleList(blocks)

    def forward(self, td):
        """Encode ``td`` into row and column embeddings.

        Returns:
            ``((row_emb, col_emb), None)``.
        """
        rows, cols, edge_emb, edges = self.init_embedding(td)

        # Sanity check: embeddings must line up with the two edge dimensions.
        n_rows, n_cols = edges.shape[1:]
        assert rows.size(1) == n_rows, "incorrect number of row embeddings"
        assert cols.size(1) == n_cols, "incorrect number of column embeddings"

        for block in self.layers:
            rows, cols = block(rows, cols, edge_emb, edges)

        return (rows, cols), None
get_pylogger + +log = get_pylogger(__name__) + + +class MessagePassingLayer(MessagePassing): + def __init__( + self, + node_indim, + node_outdim, + edge_indim, + edge_outdim, + aggregation="add", + residual=False, + **mlp_params, + ): + super(MessagePassingLayer, self).__init__(aggr=aggregation) + # Init message passing models + self.edge_model = MLP( + input_dim=edge_indim + 2 * node_indim, output_dim=edge_outdim, **mlp_params + ) + self.node_model = MLP( + input_dim=edge_outdim + node_indim, output_dim=node_outdim, **mlp_params + ) + self.residual = residual + + def forward(self, node_feature, edge_feature, edge_index, mask=None): + # Message passing + update_edge_feature = self.edge_update(node_feature, edge_feature, edge_index) + update_node_feature = self.propagate( + edge_index, x=node_feature, edge_features=update_edge_feature + ) + + # Update with residual connection + if self.residual: + update_node_feature = update_node_feature + node_feature + + return update_node_feature, update_edge_feature + + def edge_update(self, nf, ef, edge_index): + row, col = edge_index + x_i, x_j = nf[row], nf[col] + uef = self.edge_model(torch.cat([x_i, x_j, ef], dim=-1)) + return uef + + def message(self, edge_features: torch.tensor): + return edge_features + + def update(self, aggr_msg: torch.tensor, x: torch.tensor): + unf = self.node_model(torch.cat([x, aggr_msg], dim=-1)) + return unf + + +class MessagePassingEncoder(nn.Module): + def __init__( + self, + env_name: str, + embed_dim: int, + num_nodes: int, + num_layers: int, + init_embedding: nn.Module = None, + aggregation: str = "add", + self_loop: bool = False, + residual: bool = True, + ): + """ + Note: + - Support fully connected graph for now. 
+ """ + super(MessagePassingEncoder, self).__init__() + + self.env_name = env_name + + self.init_embedding = ( + env_init_embedding(self.env_name, {"embed_dim": embed_dim}) + if init_embedding is None + else init_embedding + ) + + # Generate edge index for a fully connected graph + adj_matrix = torch.ones(num_nodes, num_nodes) + if self_loop: + adj_matrix.fill_diagonal_(0) # No self-loops + self.edge_index = torch.permute(torch.nonzero(adj_matrix), (1, 0)) + + # Init message passing models + self.mpnn_layers = nn.ModuleList( + [ + MessagePassingLayer( + node_indim=embed_dim, + node_outdim=embed_dim, + edge_indim=1, + edge_outdim=1, + aggregation=aggregation, + residual=residual, + ) + for _ in range(num_layers) + ] + ) + + # Record parameters + self.self_loop = self_loop + + # def forward(self, x, mask=None): + def forward( + self, td: TensorDict, mask: Union[Tensor, None] = None + ) -> Tuple[Tensor, Tensor]: + init_h = self.init_embedding(td) + num_node = init_h.size(-2) + + # Check to update the edge index with different number of node + if num_node != self.edge_index.max().item() + 1: + adj_matrix = torch.ones(num_node, num_node) + if self.self_loop: + adj_matrix.fill_diagonal_(0) + edge_index = torch.permute(torch.nonzero(adj_matrix), (1, 0)) + edge_index = edge_index.to(init_h.device) + else: + edge_index = self.edge_index.to(init_h.device) + + # Generate edge features: distance + edge_feature = torch.norm( + init_h[..., edge_index[0], :] - init_h[..., edge_index[1], :], + dim=-1, + keepdim=True, + ) + + # Create the batched graph + data_list = [ + Data(x=x, edge_index=edge_index, edge_attr=edge_attr) + for x, edge_attr in zip(init_h, edge_feature) + ] + data_batch = Batch.from_data_list(data_list) + update_node_feature = data_batch.x + update_edge_feature = data_batch.edge_attr + edge_index = data_batch.edge_index + + # Message passing + for layer in self.mpnn_layers: + update_node_feature, update_edge_feature = layer( + update_node_feature, 
class MLP(nn.Module):
    """Configurable multi-layer perceptron.

    The network is ``input_norm -> [Linear -> hidden_act -> Dropout] * H ->
    Linear -> out_act -> output_norm`` where ``H = len(num_neurons)``.

    Args:
        input_dim: size of the input features.
        output_dim: size of the output features.
        num_neurons: hidden layer widths. Defaults to ``[64, 32]``.
        dropout_probs: dropout probability after each hidden layer. ``None``
            (or a list whose length differs from ``num_neurons``) disables
            dropout.
        hidden_act: name of the ``torch.nn`` activation used after hidden layers.
        out_act: name of the ``torch.nn`` activation used after the last layer.
        input_norm: ``"Batch"``, ``"Layer"`` or ``"None"``.
        output_norm: ``"Batch"``, ``"Layer"`` or ``"None"``.
    """

    def __init__(
        self,
        input_dim: int,
        output_dim: int,
        num_neurons: Union[None, List[int]] = None,
        dropout_probs: Union[None, List[float]] = None,
        hidden_act: str = "ReLU",
        out_act: str = "Identity",
        input_norm: str = "None",
        output_norm: str = "None",
    ):
        super(MLP, self).__init__()

        assert input_norm in ["Batch", "Layer", "None"]
        assert output_norm in ["Batch", "Layer", "None"]

        # Avoid a shared mutable default and always work on a private copy.
        num_neurons = [64, 32] if num_neurons is None else list(num_neurons)

        if dropout_probs is None:
            dropout_probs = [0.0] * len(num_neurons)
        elif len(dropout_probs) != len(num_neurons):
            log.info(
                "dropout_probs List length should match the num_neurons List length for MLP, dropouts set to False instead"
            )
            dropout_probs = [0.0] * len(num_neurons)

        self.input_dim = input_dim
        self.output_dim = output_dim
        self.num_neurons = num_neurons
        self.hidden_act = getattr(nn, hidden_act)()
        self.out_act = getattr(nn, out_act)()

        # Must be a ModuleList: with a plain Python list the dropout layers are
        # not registered as submodules, so `.eval()` would never switch them
        # off and dropout would stay active at inference time.
        self.dropouts = nn.ModuleList([nn.Dropout(p=p) for p in dropout_probs])

        input_dims = [input_dim] + num_neurons
        output_dims = num_neurons + [output_dim]
        self.lins = nn.ModuleList(
            [nn.Linear(in_dim, out_dim) for in_dim, out_dim in zip(input_dims, output_dims)]
        )

        self.input_norm = self._get_norm_layer(input_norm, input_dim)
        self.output_norm = self._get_norm_layer(output_norm, output_dim)

    def forward(self, xs):
        """Apply the network to ``xs`` (features on the last dimension)."""
        xs = self.input_norm(xs)
        # Hidden layers: there is exactly one dropout per hidden layer.
        for lin, dropout in zip(self.lins[:-1], self.dropouts):
            xs = dropout(self.hidden_act(lin(xs)))
        xs = self.lins[-1](xs)
        xs = self.out_act(xs)
        xs = self.output_norm(xs)
        return xs

    @staticmethod
    def _get_norm_layer(norm_method, dim):
        """Return the normalization module for ``norm_method``.

        Raises:
            RuntimeError: if ``norm_method`` is not a supported name.
        """
        if norm_method == "Batch":
            in_norm = nn.BatchNorm1d(dim)
        elif norm_method == "Layer":
            in_norm = nn.LayerNorm(dim)
        elif norm_method == "None":
            in_norm = nn.Identity()  # kinda placeholder
        else:
            raise RuntimeError(
                "Not implemented normalization layer type {}".format(norm_method)
            )
        return in_norm

    def _get_act(self, is_last):
        """Return the output activation if ``is_last`` else the hidden one."""
        return self.out_act if is_last else self.hidden_act
+ + The class is initialized with a "gates" Tensor, which specifies which + batch elements go to which experts, and the weights to use when combining + the outputs. Batch element b is sent to expert e iff gates[b, e] != 0. + The inputs and outputs are all two-dimensional [batch, depth]. + Caller is responsible for collapsing additional dimensions prior to + calling this class and reshaping the output to the original shape. + See common_layers.reshape_like(). + + Example use: + gates: a float32 `Tensor` with shape `[batch_size, num_experts]` + inputs: a float32 `Tensor` with shape `[batch_size, input_size]` + experts: a list of length `num_experts` containing sub-networks. + dispatcher = SparseDispatcher(num_experts, gates) + expert_inputs = dispatcher.dispatch(inputs) + expert_outputs = [experts[i](expert_inputs[i]) for i in range(num_experts)] + outputs = dispatcher.combine(expert_outputs) + The preceding code sets the output for a particular example b to: + output[b] = Sum_i(gates[b, i] * experts[i](inputs[b])) + This class takes advantage of sparsity in the gate matrix by including in the + `Tensor`s for expert i only the batch elements for which `gates[b, i] > 0`. + """ + + def __init__(self, num_experts, gates): + """Create a SparseDispatcher.""" + + self._gates = gates + self._num_experts = num_experts + # sort experts + sorted_experts, index_sorted_experts = torch.nonzero(gates).sort(0) + # drop indices + _, self._expert_index = sorted_experts.split(1, dim=1) + # get according batch index for each expert + self._batch_index = torch.nonzero(gates)[index_sorted_experts[:, 1], 0] + # calculate num samples that each expert gets + self._part_sizes = (gates > 0).sum(0).tolist() + # expand gates to match with self._batch_index + gates_exp = gates[self._batch_index.flatten()] + self._nonzero_gates = torch.gather(gates_exp, 1, self._expert_index) + + def dispatch(self, inp): + """Create one input Tensor for each expert. 
class MoE(nn.Module):
    """Sparsely gated mixture-of-experts layer with noisy top-k routing.

    Each input row is routed to the ``k`` experts with the highest gate
    probability; the expert outputs are summed, weighted by the re-normalised
    gate values.

    Args:
        input_size: integer - size of the input
        output_size: integer - size of the output
        num_neurons: a list - hidden dimensions of each expert. ``None`` or an
            empty list makes every expert a single ``nn.Linear`` layer.
        hidden_act: activation name used inside ``MLP`` experts.
        out_bias: whether the ``nn.Linear`` experts use a bias.
        num_experts: an integer - number of experts
        k: an integer - how many experts to use for each batch element
        noisy_gating: a boolean - add learned noise to the gate logits in training
        **kwargs: accepted and ignored.
    """

    def __init__(
        self,
        input_size,
        output_size,
        num_neurons=None,
        hidden_act="ReLU",
        out_bias=True,
        num_experts=4,
        k=2,
        noisy_gating=True,
        **kwargs,
    ):
        super(MoE, self).__init__()
        self.noisy_gating = noisy_gating
        self.num_experts = num_experts
        self.output_size = output_size
        self.input_size = input_size
        self.k = k

        # instantiate experts
        if num_neurons:
            self.experts = nn.ModuleList(
                [
                    MLP(
                        input_dim=input_size,
                        output_dim=output_size,
                        num_neurons=num_neurons,
                        hidden_act=hidden_act,
                    )
                    for _ in range(self.num_experts)
                ]
            )
        else:
            self.experts = nn.ModuleList(
                [
                    nn.Linear(self.input_size, self.output_size, bias=out_bias)
                    for _ in range(self.num_experts)
                ]
            )
        self.w_gate = nn.Parameter(torch.zeros(input_size, num_experts), requires_grad=True)
        self.w_noise = nn.Parameter(torch.zeros(input_size, num_experts), requires_grad=True)

        self.softplus = nn.Softplus()
        self.softmax = nn.Softmax(-1)
        # Parameters of the standard normal used by `_prob_in_top_k`; stored as
        # buffers so they follow the module across devices.
        self.register_buffer("mean", torch.tensor([0.0]))
        self.register_buffer("std", torch.tensor([1.0]))
        assert self.k <= self.num_experts, "k must not exceed num_experts"

    def cv_squared(self, x):
        """The squared coefficient of variation of a sample.

        Useful as a loss to encourage a positive distribution to be more uniform.
        An epsilon is added for numerical stability.

        Args:
            x: a `Tensor`.
        Returns:
            ``var(x) / (mean(x)**2 + eps)``, or a one-element zero tensor when
            ``x`` has a single entry along its first dimension.
        """
        eps = 1e-10
        # if only num_experts = 1
        if x.shape[0] == 1:
            return torch.tensor([0], device=x.device, dtype=x.dtype)
        return x.float().var() / (x.float().mean() ** 2 + eps)

    def _gates_to_load(self, gates):
        """Compute the true load per expert, given the gates.

        The load is the number of examples for which the corresponding gate is >0.

        Args:
            gates: a `Tensor` of shape [batch_size, n]
        Returns:
            a `Tensor` of shape [n]
        """
        return (gates > 0).sum(0)

    def _prob_in_top_k(self, clean_values, noisy_values, noise_stddev, noisy_top_values):
        """Probability that each value is in the top k under fresh noise.

        This gives a differentiable estimate of how often each expert is among
        the top k experts per example.

        Args:
            clean_values: a `Tensor` of shape [batch, n].
            noisy_values: a `Tensor` of shape [batch, n]. Equal to clean values plus
                normally distributed noise with standard deviation noise_stddev.
            noise_stddev: a `Tensor` of shape [batch, n].
            noisy_top_values: a `Tensor` of shape [batch, m], the m largest
                entries of each row of ``noisy_values`` in descending order,
                with m >= k + 1. Must be on the same scale as ``noisy_values``.
        Returns:
            a `Tensor` of shape [batch, n].
        """
        batch = clean_values.size(0)
        m = noisy_top_values.size(1)
        top_values_flat = noisy_top_values.flatten()

        # Flat index of the (k+1)-th largest value of every row: the value an
        # expert currently in the top k has to beat to stay there.
        threshold_positions_if_in = torch.arange(batch, device=clean_values.device) * m + self.k
        threshold_if_in = torch.unsqueeze(
            torch.gather(top_values_flat, 0, threshold_positions_if_in), 1
        )
        is_in = torch.gt(noisy_values, threshold_if_in)
        # The k-th largest value: what an expert outside the top k has to beat.
        threshold_positions_if_out = threshold_positions_if_in - 1
        threshold_if_out = torch.unsqueeze(
            torch.gather(top_values_flat, 0, threshold_positions_if_out), 1
        )
        normal = Normal(self.mean, self.std)
        prob_if_in = normal.cdf((clean_values - threshold_if_in) / noise_stddev)
        prob_if_out = normal.cdf((clean_values - threshold_if_out) / noise_stddev)
        return torch.where(is_in, prob_if_in, prob_if_out)

    def noisy_top_k_gating(self, x, train, noise_epsilon=1e-2):
        """Noisy top-k gating.

        Args:
            x: input Tensor with shape [batch_size, input_size]
            train: a boolean - we only add noise at training time.
            noise_epsilon: a float added to the noise standard deviation.
        Returns:
            gates: a Tensor with shape [batch_size, num_experts]
            load: a Tensor with shape [num_experts]
        """
        clean_logits = x @ self.w_gate
        add_noise = self.noisy_gating and train
        if add_noise:
            raw_noise_stddev = x @ self.w_noise
            noise_stddev = self.softplus(raw_noise_stddev) + noise_epsilon
            noisy_logits = clean_logits + (torch.randn_like(clean_logits) * noise_stddev)
            logits = noisy_logits
        else:
            logits = clean_logits

        # Take top k + 1: the extra entry is needed for the load estimate.
        probs = self.softmax(logits)
        top_probs, top_indices = probs.topk(min(self.k + 1, self.num_experts), dim=-1)
        top_k_probs = top_probs[:, : self.k]
        top_k_indices = top_indices[:, : self.k]
        top_k_gates = top_k_probs / (top_k_probs.sum(1, keepdim=True) + 1e-6)  # normalization

        zeros = torch.zeros_like(probs, requires_grad=True)
        gates = zeros.scatter(-1, top_k_indices, top_k_gates)  # non-topk elements will be 0

        if add_noise and self.k < self.num_experts:
            # `_prob_in_top_k` compares thresholds against the raw noisy
            # logits, so the thresholds must be raw logits too, not the
            # softmax probabilities that were used for ranking.
            noisy_top_values = noisy_logits.gather(-1, top_indices)
            load = self._prob_in_top_k(
                clean_logits, noisy_logits, noise_stddev, noisy_top_values
            ).sum(0)
        else:
            load = self._gates_to_load(gates)
        return gates, load

    def forward(self, x, loss_coef=0.0):
        """Token/node-level gating: every token/node chooses its top-k experts.

        No auxiliary load-balancing loss is returned, so none is computed here.
        The original authors note that empirically it may conflict with the
        reinforcement loss (Zhou et al., 2024).

        Args:
            x: tensor shape [batch_size, problem_size, input_size]
            loss_coef: kept for interface compatibility; currently has no
                effect because the load-balancing loss is not returned.

        Returns:
            y: a tensor with shape [batch_size, problem_size, output_size].
        """
        output_shape = list(x.size()[:-1]) + [self.output_size]
        x = x.reshape(-1, self.input_size) if x.dim() != 2 else x

        gates, _ = self.noisy_top_k_gating(x, self.training)

        dispatcher = SparseDispatcher(self.num_experts, gates)
        expert_inputs = dispatcher.dispatch(x)
        expert_outputs = [self.experts[i](expert_inputs[i]) for i in range(self.num_experts)]
        y = dispatcher.combine(expert_outputs)

        return y.reshape(output_shape)
class PositionalEncoding(nn.Module):
    """Sinusoidal positional encoding looked up by explicit position indices.

    Args:
        embed_dim: size of the embedding dimension (odd values are supported).
        dropout: dropout probability applied to the encoded output.
        max_len: number of positions in the precomputed table.
    """

    def __init__(self, embed_dim: int, dropout: float = 0.1, max_len: int = 1000):
        super().__init__()
        self.dropout = nn.Dropout(p=dropout)
        self.d_model = embed_dim
        position = torch.arange(max_len).unsqueeze(1)
        div_term = torch.exp(
            torch.arange(0, self.d_model, 2) * (-math.log(10000.0) / self.d_model)
        )
        pe = torch.zeros(max_len, 1, self.d_model)
        pe[:, 0, 0::2] = torch.sin(position * div_term)
        # For odd d_model there is one cosine column fewer than sine columns,
        # so the frequency vector is truncated to the number of odd indices.
        pe[:, 0, 1::2] = torch.cos(position * div_term[: self.d_model // 2])
        pe = pe.transpose(0, 1)  # [1, max_len, d_model]
        self.register_buffer("pe", pe)

    def forward(self, hidden: torch.Tensor, seq_pos) -> torch.Tensor:
        """Add the encoding of ``seq_pos`` to ``hidden`` and apply dropout.

        Arguments:
            hidden: Tensor, shape ``[batch_size, seq_len, embedding_dim]``
            seq_pos: integer Tensor, shape ``[batch_size, seq_len]``, with
                values in ``[0, max_len)``
        """
        # Pick, for every (batch, step), the table row given by seq_pos.
        gather_index = seq_pos.unsqueeze(-1).expand(-1, -1, self.d_model)
        pes = self.pe.expand(hidden.size(0), -1, -1).gather(1, gather_index)
        hidden = hidden + pes
        return self.dropout(hidden)
RandomEncoding(nn.Module): + """This is like torch.nn.Embedding but with rows of embeddings are randomly + permuted in each forward pass before lookup operation. This might be useful + in cases where classes have no fixed meaning but rather indicate a connection + between different elements in a sequence. Reference is the MatNet model. + """ + + def __init__(self, embed_dim: int, max_classes: int = 100): + super().__init__() + self.embed_dim = embed_dim + self.max_classes = max_classes + rand_emb = torch.rand(max_classes, self.embed_dim) + self.register_buffer("emb", rand_emb) + + def forward(self, hidden: torch.Tensor, classes=None) -> torch.Tensor: + b, s, _ = hidden.shape + if classes is None: + classes = torch.eye(s).unsqueeze(0).expand(b, s) + assert ( + classes.max() < self.max_classes + ), "number of classes larger than embedding table" + classes = classes.unsqueeze(-1).expand(-1, -1, self.embed_dim) + rand_idx = torch.rand(b, self.max_classes).argsort(dim=1) + embs_permuted = self.emb[rand_idx] + rand_emb = gather_by_index(embs_permuted, classes, dim=1) + hidden = hidden + rand_emb + return hidden diff --git a/rl4co/models/nn/pos_embeddings.py b/rl4co/models/nn/pos_embeddings.py new file mode 100644 index 00000000..9d217e63 --- /dev/null +++ b/rl4co/models/nn/pos_embeddings.py @@ -0,0 +1,159 @@ +import numpy as np +import torch +import torch.nn as nn + + +def pos_init_embedding(pos_name: str, config: dict) -> nn.Module: + """Get positional embedding. The positional embedding is used for improvement methods to encode current solutions. + + Args: + pos_name: Positional embeding method name. + config: A dictionary of configuration options for the initlization. + """ + embedding_registry = { + "APE": AbsolutePositionalEmbedding, + "CPE": CyclicPositionalEmbedding, + } + + if pos_name not in embedding_registry: + raise ValueError( + f"Unknown positional embedding name '{pos_name}'. 
class AbsolutePositionalEmbedding(nn.Module):
    """Absolute Positional Embedding in the original Transformer.

    The sinusoidal table is built lazily on the first forward pass and is
    rebuilt whenever the sequence length changes.
    """

    def __init__(self, embed_dim):
        super().__init__()
        self.embed_dim = embed_dim
        self.pattern = None  # cached (seq_length, embed_dim) table

    def _init(self, n_position, emb_dim):
        """Build the ``(n_position, emb_dim)`` table for positions 1..n_position."""
        # Per-dimension wavelength; consecutive dimension pairs share one.
        denominators = [np.power(10000, 2 * (j // 2) / emb_dim) for j in range(emb_dim)]
        angles = []
        for pos in range(1, n_position + 1):
            angles.append([pos / denominator for denominator in denominators])
        table = torch.tensor(angles, dtype=torch.float32)

        # NOTE(review): the slices start at row 1, so row 0 keeps the raw
        # angles instead of their sin/cos. This mirrors the existing
        # behaviour; confirm whether it is intended.
        table[1:, 0::2] = torch.sin(table[1:, 0::2])  # dim 2i
        table[1:, 1::2] = torch.cos(table[1:, 1::2])  # dim 2i+1

        return table

    def forward(self, td):
        """Return the embedding of every node's visiting time.

        Reads ``td["rec_current"]`` (only for its ``(batch, seq)`` size) and
        ``td["visited_time"]``; visiting times are wrapped modulo the sequence
        length before the lookup.
        """
        batch_size, seq_length = td["rec_current"].size()
        visited_time = td["visited_time"]
        dim = self.embed_dim
        full_shape = (batch_size, seq_length, dim)

        # (Re)build the cached table when missing or of the wrong length.
        if self.pattern is None or self.pattern.size(0) != seq_length:
            self.pattern = self._init(seq_length, self.embed_dim)

        # One copy of the table per batch element, on the input's device.
        table = self.pattern.expand(*full_shape).clone().to(visited_time.device)
        wrapped = (visited_time % seq_length).long()
        lookup = wrapped.unsqueeze(-1).expand(*full_shape)

        return torch.gather(table, 1, lookup)
// 2)), + n_position, + emb_dim // 2, + dtype="int", + ) + x = np.zeros((n_position, emb_dim)) + + for i in range(emb_dim): + Td = ( + Td_set[i // 3 * 3 + 1] + if (i // 3 * 3 + 1) < (emb_dim // 2) + else Td_set[-1] + ) + fai = ( + 0 + if i <= (emb_dim // 2) + else 2 * np.pi * ((-i + (emb_dim // 2)) / (emb_dim // 2)) + ) + longer_pattern = np.arange(0, np.ceil((n_position) / Td) * Td, 0.01) + if i % 2 == 1: + x[:, i] = self._basecos(longer_pattern, Td, fai)[ + np.linspace( + 0, len(longer_pattern), n_position, dtype="int", endpoint=False + ) + ] + else: + x[:, i] = self._basesin(longer_pattern, Td, fai)[ + np.linspace( + 0, len(longer_pattern), n_position, dtype="int", endpoint=False + ) + ] + + pattern = torch.from_numpy(x).type(torch.FloatTensor) + pattern_sum = torch.zeros_like(pattern) + + # averaging the adjacient embeddings if needed (optional, almost the same performance) + arange = torch.arange(n_position) + pooling = [0] if not mean_pooling else [-2, -1, 0, 1, 2] + time = 0 + for i in pooling: + time += 1 + index = (arange + i + n_position) % n_position + pattern_sum += pattern.gather(0, index.view(-1, 1).expand_as(pattern)) + pattern = 1.0 / time * pattern_sum - pattern.mean(0) + + return pattern + + def forward(self, td): + batch_size, seq_length = td["rec_current"].size() + visited_time = td["visited_time"] + embedding_dim = self.embed_dim + + # expand for every batch + if self.pattern is None or self.pattern.size(0) != seq_length: + self.pattern = self._init(seq_length, self.embed_dim, self.mean_pooling) + + batch_vector = ( + self.pattern.expand(batch_size, seq_length, embedding_dim) + .clone() + .to(visited_time.device) + ) + index = ( + (visited_time % seq_length) + .long() + .unsqueeze(-1) + .expand(batch_size, seq_length, embedding_dim) + ) + + return torch.gather(batch_vector, 1, index) diff --git a/rl4co/models/rl/__init__.py b/rl4co/models/rl/__init__.py new file mode 100644 index 00000000..1a3bf7e2 --- /dev/null +++ 
class A2C(REINFORCE):
    """Advantage Actor Critic (A2C) algorithm.
    A2C is a variant of REINFORCE where a baseline is provided by a critic network.
    Here we additionally support different optimizers for the actor and the critic.

    Args:
        env: Environment to use for the algorithm
        policy: Policy to use for the algorithm
        critic: Critic network to use for the algorithm. If None, one is created
            from the policy with `create_critic_from_actor`
        critic_kwargs: Keyword arguments to pass to the critic network
        actor_optimizer_kwargs: Keyword arguments for the policy (=actor) optimizer
        critic_optimizer_kwargs: Keyword arguments for the critic optimizer.
            If None, use the same as actor_optimizer_kwargs
        **kwargs: Keyword arguments passed to the superclass. A `baseline` entry,
            if present, is discarded
    """

    def __init__(
        self,
        env: RL4COEnvBase,
        policy: nn.Module,
        critic: CriticNetwork = None,
        critic_kwargs: dict = {},
        actor_optimizer_kwargs: dict = {"lr": 1e-4},
        critic_optimizer_kwargs: dict = None,
        **kwargs,
    ):
        if critic is None:
            log.info("Creating critic network for {}".format(env.name))
            critic = create_critic_from_actor(policy, **critic_kwargs)

        # The baseline is directly created here, so we eliminate the baseline argument
        kwargs.pop("baseline", None)

        super().__init__(env, policy, baseline=CriticBaseline(critic), **kwargs)

        # Store copies: the signature defaults are module-level dict objects shared
        # by every instance, so keeping a reference would let a later in-place
        # edit on one model leak into all others (and into the default itself).
        self.actor_optimizer_kwargs = dict(actor_optimizer_kwargs)
        self.critic_optimizer_kwargs = dict(
            actor_optimizer_kwargs
            if critic_optimizer_kwargs is None
            else critic_optimizer_kwargs
        )

    def configure_optimizers(self):
        """Configure the optimizers for the policy and the critic network (=baseline)"""
        # One parameter group per network so each can carry its own optimizer options.
        parameters = [
            {"params": self.policy.parameters(), **self.actor_optimizer_kwargs},
            {"params": self.baseline.parameters(), **self.critic_optimizer_kwargs},
        ]

        return super().configure_optimizers(parameters)
get_pylogger(__name__) + + +class RL4COLitModule(LightningModule, metaclass=abc.ABCMeta): + """Base class for Lightning modules for RL4CO. This defines the general training loop in terms of + RL algorithms. Subclasses should implement mainly the `shared_step` to define the specific + loss functions and optimization routines. + + Args: + env: RL4CO environment + policy: policy network (actor) + batch_size: batch size (general one, default used for training) + val_batch_size: specific batch size for validation. If None, will use `batch_size`. If list, will use one for each dataset + test_batch_size: specific batch size for testing. If None, will use `val_batch_size`. If list, will use one for each dataset + train_data_size: size of training dataset for one epoch + val_data_size: size of validation dataset for one epoch + test_data_size: size of testing dataset for one epoch + optimizer: optimizer or optimizer name + optimizer_kwargs: optimizer kwargs + lr_scheduler: learning rate scheduler or learning rate scheduler name + lr_scheduler_kwargs: learning rate scheduler kwargs + lr_scheduler_interval: learning rate scheduler interval + lr_scheduler_monitor: learning rate scheduler monitor + generate_default_data: whether to generate default datasets, filling up the data directory + shuffle_train_dataloader: whether to shuffle training dataloader. 
Default is False since we recreate dataset every epoch + dataloader_num_workers: number of workers for dataloader + data_dir: data directory + metrics: metrics + litmodule_kwargs: kwargs for `LightningModule` + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module, + batch_size: int = 512, + val_batch_size: Union[List[int], int] = None, + test_batch_size: Union[List[int], int] = None, + train_data_size: int = 100_000, + val_data_size: int = 10_000, + test_data_size: int = 10_000, + optimizer: Union[str, torch.optim.Optimizer, partial] = "Adam", + optimizer_kwargs: dict = {"lr": 1e-4}, + lr_scheduler: Union[str, torch.optim.lr_scheduler.LRScheduler, partial] = None, + lr_scheduler_kwargs: dict = { + "milestones": [80, 95], + "gamma": 0.1, + }, + lr_scheduler_interval: str = "epoch", + lr_scheduler_monitor: str = "val/reward", + generate_default_data: bool = False, + shuffle_train_dataloader: bool = False, + dataloader_num_workers: int = 0, + data_dir: str = "data/", + log_on_step: bool = True, + metrics: dict = {}, + **litmodule_kwargs, + ): + super().__init__(**litmodule_kwargs) + + # This line ensures params passed to LightningModule will be saved to ckpt + # it also allows to access params with 'self.hparams' attribute + # Note: we will send to logger with `self.logger.save_hyperparams` in `setup` + self.save_hyperparameters(logger=False) + + self.env = env + self.policy = policy + + self.instantiate_metrics(metrics) + self.log_on_step = log_on_step + + self.data_cfg = { + "batch_size": batch_size, + "val_batch_size": val_batch_size, + "test_batch_size": test_batch_size, + "generate_default_data": generate_default_data, + "data_dir": data_dir, + "train_data_size": train_data_size, + "val_data_size": val_data_size, + "test_data_size": test_data_size, + } + + self._optimizer_name_or_cls: Union[str, torch.optim.Optimizer] = optimizer + self.optimizer_kwargs: dict = optimizer_kwargs + self._lr_scheduler_name_or_cls: Union[ + str, 
torch.optim.lr_scheduler.LRScheduler + ] = lr_scheduler + self.lr_scheduler_kwargs: dict = lr_scheduler_kwargs + self.lr_scheduler_interval: str = lr_scheduler_interval + self.lr_scheduler_monitor: str = lr_scheduler_monitor + + self.shuffle_train_dataloader = shuffle_train_dataloader + self.dataloader_num_workers = dataloader_num_workers + + def instantiate_metrics(self, metrics: dict): + """Dictionary of metrics to be logged at each phase""" + + if not metrics: + log.info("No metrics specified, using default") + self.train_metrics = metrics.get("train", ["loss", "reward"]) + self.val_metrics = metrics.get("val", ["reward"]) + self.test_metrics = metrics.get("test", ["reward"]) + self.log_on_step = metrics.get("log_on_step", True) + + def setup(self, stage="fit"): + """Base LightningModule setup method. This will setup the datasets and dataloaders + + Note: + We also send to the loggers all hyperparams that are not `nn.Module` (i.e. the policy). + Apparently PyTorch Lightning does not do this by default. + """ + + log.info("Setting up batch sizes for train/val/test") + train_bs, val_bs, test_bs = ( + self.data_cfg["batch_size"], + self.data_cfg["val_batch_size"], + self.data_cfg["test_batch_size"], + ) + self.train_batch_size = train_bs + self.val_batch_size = train_bs if val_bs is None else val_bs + self.test_batch_size = self.val_batch_size if test_bs is None else test_bs + + if self.data_cfg["generate_default_data"]: + log.info( + "Generating default datasets. 
If found, they will not be overwritten" + ) + generate_default_datasets(data_dir=self.data_cfg["data_dir"]) + + log.info("Setting up datasets") + self.train_dataset = self.wrap_dataset( + self.env.dataset(self.data_cfg["train_data_size"], phase="train") + ) + self.val_dataset = self.env.dataset(self.data_cfg["val_data_size"], phase="val") + self.test_dataset = self.env.dataset( + self.data_cfg["test_data_size"], phase="test" + ) + self.dataloader_names = None + self.setup_loggers() + self.post_setup_hook() + + def setup_loggers(self): + """Log all hyperparameters except those in `nn.Module`""" + if self.loggers is not None: + hparams_save = { + k: v for k, v in self.hparams.items() if not isinstance(v, nn.Module) + } + for logger in self.loggers: + logger.log_hyperparams(hparams_save) + logger.log_graph(self) + logger.save() + + def post_setup_hook(self): + """Hook to be called after setup. Can be used to set up subclasses without overriding `setup`""" + pass + + def configure_optimizers(self, parameters=None): + """ + Args: + parameters: parameters to be optimized. If None, will use `self.parameters()`, i.e. 
all parameters + """ + + if parameters is None: + parameters = self.parameters() + + log.info(f"Instantiating optimizer <{self._optimizer_name_or_cls}>") + if isinstance(self._optimizer_name_or_cls, str): + optimizer = create_optimizer( + parameters, self._optimizer_name_or_cls, **self.optimizer_kwargs + ) + elif isinstance(self._optimizer_name_or_cls, partial): + optimizer = self._optimizer_name_or_cls(parameters, **self.optimizer_kwargs) + else: # User-defined optimizer + opt_cls = self._optimizer_name_or_cls + optimizer = opt_cls(parameters, **self.optimizer_kwargs) + assert isinstance(optimizer, torch.optim.Optimizer) + + # instantiate lr scheduler + if self._lr_scheduler_name_or_cls is None: + return optimizer + else: + log.info(f"Instantiating LR scheduler <{self._lr_scheduler_name_or_cls}>") + if isinstance(self._lr_scheduler_name_or_cls, str): + scheduler = create_scheduler( + optimizer, self._lr_scheduler_name_or_cls, **self.lr_scheduler_kwargs + ) + elif isinstance(self._lr_scheduler_name_or_cls, partial): + scheduler = self._lr_scheduler_name_or_cls( + optimizer, **self.lr_scheduler_kwargs + ) + else: # User-defined scheduler + scheduler_cls = self._lr_scheduler_name_or_cls + scheduler = scheduler_cls(optimizer, **self.lr_scheduler_kwargs) + assert isinstance(scheduler, torch.optim.lr_scheduler.LRScheduler) + return [optimizer], { + "scheduler": scheduler, + "interval": self.lr_scheduler_interval, + "monitor": self.lr_scheduler_monitor, + } + + def log_metrics( + self, metric_dict: dict, phase: str, dataloader_idx: Union[int, None] = None + ): + """Log metrics to logger and progress bar""" + metrics = getattr(self, f"{phase}_metrics") + dataloader_name = "" + if dataloader_idx is not None and self.dataloader_names is not None: + dataloader_name = "/" + self.dataloader_names[dataloader_idx] + metrics = { + f"{phase}/{k}{dataloader_name}": v.mean() + if isinstance(v, torch.Tensor) + else v + for k, v in metric_dict.items() + if k in metrics + } + 
def forward(self, td, **kwargs):
    """Forward pass for the model. Simple wrapper around `policy`.

    Args:
        td: input passed unchanged as the first positional argument of `policy`.
        **kwargs: forwarded to `policy`. An optional `env` entry selects the
            environment; when it is missing or None, `self.env` is used.

    Returns:
        Whatever `self.policy(td, env, **kwargs)` returns.
    """
    # Always remove `env` from kwargs: leaving an explicit `env=None` in place
    # would pass `env` both positionally and by keyword and raise a TypeError.
    env = kwargs.pop("env", None)
    if env is None:
        env = self.env
    else:
        log.info("Using env from kwargs")
    return self.policy(td, env, **kwargs)
+ """ + # Only update if not in the first epoch + # If last epoch, we don't need to update since we will not use the dataset anymore + if self.current_epoch < self.trainer.max_epochs - 1: + log.info("Generating training dataset for next epoch...") + train_dataset = self.env.dataset(self.data_cfg["train_data_size"], "train") + self.train_dataset = self.wrap_dataset(train_dataset) + + def wrap_dataset(self, dataset): + """Wrap dataset with policy-specific wrapper. This is useful i.e. in REINFORCE where we need to + collect the greedy rollout baseline outputs. + """ + return dataset + + def _dataloader(self, dataset, batch_size, shuffle=False): + """Handle both single datasets and list / dict of datasets""" + if isinstance(dataset, Iterable): + # load dataloader names if available as dict, else use indices + if isinstance(dataset, dict): + self.dataloader_names = list(dataset.keys()) + else: + self.dataloader_names = [f"{i}" for i in range(len(dataset))] + # if batch size is int, make it into list + if isinstance(batch_size, int): + batch_size = [batch_size] * len(self.dataloader_names) + assert len(batch_size) == len( + self.dataloader_names + ), f"Batch size must match number of datasets. \ + Found: {len(batch_size)} and {len(self.dataloader_names)}" + return [ + self._dataloader_single(dset, bsize, shuffle) + for dset, bsize in zip(dataset.values(), batch_size) + ] + else: + assert isinstance( + batch_size, int + ), f"Batch size must be an integer for a single dataset, found {batch_size}" + return self._dataloader_single(dataset, batch_size, shuffle) + + def _dataloader_single(self, dataset, batch_size, shuffle=False): + """The dataloader used by the trainer. This is a wrapper around the dataset with a custom collate_fn + to efficiently handle TensorDicts. 
+ """ + return DataLoader( + dataset, + batch_size=batch_size, + shuffle=shuffle, + num_workers=self.dataloader_num_workers, + collate_fn=dataset.collate_fn, + ) diff --git a/rl4co/models/rl/common/critic.py b/rl4co/models/rl/common/critic.py new file mode 100644 index 00000000..2a37e273 --- /dev/null +++ b/rl4co/models/rl/common/critic.py @@ -0,0 +1,77 @@ +import copy + +from typing import Optional, Union + +from tensordict import TensorDict +from torch import Tensor, nn + +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class CriticNetwork(nn.Module): + """Create a critic network given an encoder (e.g. as the one in the policy network) + with a value head to transform the embeddings to a scalar value. + + Args: + encoder: Encoder module to encode the input + value_head: Value head to transform the embeddings to a scalar value + embed_dim: Dimension of the embeddings of the value head + hidden_dim: Dimension of the hidden layer of the value head + """ + + def __init__( + self, + encoder: nn.Module, + value_head: Optional[nn.Module] = None, + embed_dim: int = 128, + hidden_dim: int = 512, + customized: bool = False, + ): + super(CriticNetwork, self).__init__() + + self.encoder = encoder + if value_head is None: + # check if embed dim of encoder is different, if so, use it + if getattr(encoder, "embed_dim", embed_dim) != embed_dim: + log.warning( + f"Found encoder with different embed_dim {encoder.embed_dim} than the value head {embed_dim}. Using encoder embed_dim for value head." + ) + embed_dim = getattr(encoder, "embed_dim", embed_dim) + value_head = nn.Sequential( + nn.Linear(embed_dim, hidden_dim), nn.ReLU(), nn.Linear(hidden_dim, 1) + ) + self.value_head = value_head + self.customized = customized + + def forward(self, x: Union[Tensor, TensorDict], hidden=None) -> Tensor: + """Forward pass of the critic network: encode the imput in embedding space and return the value + + Args: + x: Input containing the environment state. 
class RewardScaler:
    """This class calculates the running mean and variance of a stepwise observed
    quantity, like the RL reward / advantage using the Welford online algorithm.
    The mean and variance are either used to standardize the input (scale='norm') or
    to scale it (scale='scale').

    Args:
        scale: None | number | 'norm' | 'scale': specifies how to transform the input.
            None returns the input untouched, a number divides the input by that
            constant, 'norm' subtracts the running mean and divides by the running
            standard deviation, 'scale' only divides by the running standard
            deviation. Defaults to None
    """

    def __init__(self, scale: str = None):
        self.scale = scale
        self.count = 0  # number of scalar samples seen so far
        self.mean = 0  # running mean (becomes a 0-dim tensor after the first update)
        self.M2 = 0  # running sum of squared deviations from the mean

    def __call__(self, scores: torch.Tensor):
        """Update the running statistics with `scores` and return the transformed scores.

        The input tensor is never modified in place.

        Raises:
            ValueError: if `scale` is a string other than 'norm' or 'scale'. The
                running statistics are left untouched in that case.
        """
        if self.scale is None:
            return scores
        elif isinstance(self.scale, (int, float)):
            return scores / self.scale
        # Validate before touching the statistics so a bad mode has no side effects
        if self.scale not in ("norm", "scale"):
            raise ValueError("unknown scaling operation requested: %s" % self.scale)

        # Score scaling
        self.update(scores)
        if self.count < 2:
            # The sample variance divides by (count - 1); with fewer than two
            # samples it is undefined and would turn every score into NaN.
            return scores

        tensor_to_kwargs = dict(dtype=scores.dtype, device=scores.device)
        std = (self.M2 / (self.count - 1)).float().sqrt()
        # eps keeps the division finite when all observed values are identical
        score_scaling_factor = std.to(**tensor_to_kwargs) + torch.finfo(scores.dtype).eps
        if self.scale == "norm":
            return (scores - self.mean.to(**tensor_to_kwargs)) / score_scaling_factor
        return scores / score_scaling_factor

    @torch.no_grad()
    def update(self, batch: torch.Tensor):
        """Fold every element of `batch` into the running count, mean and M2."""
        batch = batch.reshape(-1)
        self.count += len(batch)

        # newvalues - oldMean
        delta = batch - self.mean
        self.mean += (delta / self.count).sum()
        # newvalues - newMean
        delta2 = batch - self.mean
        self.M2 += (delta * delta2).sum()
+ del self.logprobs[:] + del self.rewards[:] + + +class n_step_PPO(RL4COLitModule): + """ + An implementation of the n-step dactProximal Policy Optimization (PPO) algorithm (https://arxiv.org/abs/2110.02544) + is presented for training improvement models. + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module, + critic: CriticNetwork = None, + critic_kwargs: dict = {}, + clip_range: float = 0.1, # epsilon of PPO + ppo_epochs: int = 3, # inner epoch, K + vf_lambda: float = 1.0, # lambda of Value function fitting + normalize_adv: bool = False, # whether to normalize advantage + max_grad_norm: float = 0.05, # max gradient norm + gamma: float = 0.999, # gamma for improvement MDP task + n_step: float = 5, # n-step for n-step PPO + T_train: int = 250, # the maximum inference T used for training + T_test: int = 1000, # the maximum inference T used for test + lr_policy: float = 8e-5, # the learning rate for actor + lr_critic: float = 2e-5, # the learning rate for critic + CL_scalar: float = 2.0, # hyperparameter of CL scalar of PPO-CL algorithm + CL_best: bool = False, # whether use the best solution from the CL rollout + metrics: dict = { + "train": ["loss", "surrogate_loss", "value_loss", "cost_bsf", "cost_init"], + "val": ["cost_bsf", "cost_init"], + "test": ["cost_bsf", "cost_init"], + }, + lr_scheduler=torch.optim.lr_scheduler.ExponentialLR, + lr_scheduler_kwargs: dict = { + "gamma": 0.985, # the learning decay per epoch, + }, + lr_scheduler_interval: str = "epoch", + lr_scheduler_monitor=None, + **kwargs, + ): + super().__init__( + env, + policy, + metrics=metrics, + lr_scheduler=lr_scheduler, + lr_scheduler_kwargs=lr_scheduler_kwargs, + lr_scheduler_interval=lr_scheduler_interval, + lr_scheduler_monitor=lr_scheduler_monitor, + **kwargs, + ) + + self.CL_scalar = CL_scalar + self.CL_num = 0.0 + self.CL_best = CL_best + self.automatic_optimization = False # n_step_PPO uses custom optimization routine + + self.critic = critic + + self.ppo_cfg = { + 
"clip_range": clip_range, + "ppo_epochs": ppo_epochs, + "vf_lambda": vf_lambda, + "normalize_adv": normalize_adv, + "max_grad_norm": max_grad_norm, + "gamma": gamma, + "n_step": n_step, + "T_train": T_train, + "T_test": T_test, + "lr_policy": lr_policy, + "lr_critic": lr_critic, + } + + def configure_optimizers(self): + parameters = [ + {"params": self.policy.parameters(), "lr": self.ppo_cfg["lr_policy"]} + ] + [{"params": self.critic.parameters(), "lr": self.ppo_cfg["lr_critic"]}] + + return super().configure_optimizers(parameters) + + def on_train_epoch_end(self): + """ + Learning rate scheduler and CL scheduler + """ + # Learning rate scheduler + sch = self.lr_schedulers() + sch.step() + + # CL scheduler + self.CL_num += 1 / self.CL_scalar + + def shared_step( + self, batch: Any, batch_idx: int, phase: str, dataloader_idx: int = None + ): + if phase != "train": + with torch.no_grad(): + td = self.env.reset(batch) + cost_init = td["cost_current"] + for i in range(self.ppo_cfg["T_test"]): + out = self.policy(td, self.env, phase=phase) + self.env.step(td) + out["cost_bsf"] = td["cost_bsf"] + + else: + # init the training + memory = Memory() + td = self.env.reset(batch) + + # perform CL strategy + with torch.no_grad(): + for i in range(int(self.CL_num)): + out = self.policy(td, self.env, phase=phase) + self.env.step(td) + if self.CL_best: + td = self.env.step_to_solution(td, td["rec_best"]) + cost_init = td["cost_current"] + + # perform gradiant updates every n_step untill reaching T_max + assert ( + self.ppo_cfg["T_train"] % self.ppo_cfg["n_step"] == 0 + ), "T_max should be divided by n_step with no remainder" + t = 0 + while t < self.ppo_cfg["T_train"]: + memory.clear_memory() + bl = [] + ll = [] + # Rollout for n_step, perform actor and critic and env step, store the information in memory + for i in range(self.ppo_cfg["n_step"]): + memory.tds.append(td.clone()) + + out = self.policy(td, self.env, phase=phase, return_embeds=True) + value_pred = self.critic( + 
out["embeds"].detach(), td["cost_bsf"].unsqueeze(-1) + ) + + memory.actions.append(out["actions"].clone()) + memory.logprobs.append(out["log_likelihood"].clone()) + bl.append(value_pred) + + self.env.step(td) + memory.rewards.append(td["reward"].clone().view(-1, 1)) + + t += self.ppo_cfg["n_step"] + + # PPO inner epoch, K + old_value = None + for k in range(self.ppo_cfg["ppo_epochs"]): + if k == 0: + ll = memory.logprobs + + else: + ll = [] + bl = [] + for i in range(self.ppo_cfg["n_step"]): + out = self.policy( + memory.tds[i].clone(), + actions=memory.actions[i], + env=self.env, + phase=phase, + return_actions=False, + return_embeds=True, + ) + bl_value = self.critic( + out["embeds"].detach(), + memory.tds[i]["cost_bsf"].unsqueeze(-1), + ) + + ll.append(out["log_likelihood"]) + bl.append(bl_value) + + # prepare loglikelihood (ll) and baseline value (bl) + ll = torch.stack(ll).view(-1, 1) + bl = torch.stack(bl).view(-1, 1) + old_ll = torch.stack(memory.logprobs).view(-1, 1) + + # Compute the Reward wrt n_step + Reward = [] + reward_reversed = memory.rewards[::-1] + R = self.critic( + self.policy(td, self.env, phase=phase, only_return_embed=True)[ + "embeds" + ].detach(), + td["cost_bsf"].unsqueeze(-1), + ).detach() # Remember to detach() since we only need the predicted value here + for r in range(len(reward_reversed)): + R = R * self.ppo_cfg["gamma"] + reward_reversed[r] + Reward.append(R.clone()) + Reward = torch.stack(Reward[::-1]).view(-1, 1) + + # Compute the ratio of probabilities of new and old actions + ratio = torch.exp(ll - old_ll.detach()) + + # Compute the advantage + adv = Reward - bl.detach() + + # Normalize advantage + if self.ppo_cfg["normalize_adv"]: + adv = (adv - adv.mean()) / (adv.std() + 1e-8) + + # Compute the surrogate loss + surrogate_loss = -torch.min( + ratio * adv, + torch.clamp( + ratio, + 1 - self.ppo_cfg["clip_range"], + 1 + self.ppo_cfg["clip_range"], + ) + * adv, + ).mean() + + # compute value function loss + if old_value is None: + 
value_loss = ((bl - Reward) ** 2).mean() + old_value = bl.detach() + else: + value_clipped = ( + torch.clamp( + bl - old_value, + -self.ppo_cfg["clip_range"], + self.ppo_cfg["clip_range"], + ) + + old_value + ) + + value_loss = torch.max( + (bl - Reward) ** 2, + (value_clipped - Reward) ** 2, + ).mean() + + # compute total loss + loss = surrogate_loss + self.ppo_cfg["vf_lambda"] * value_loss + + # perform manual optimization following the Lightning routine + # https://lightning.ai/docs/pytorch/stable/common/optimization.html + opt = self.optimizers() + opt.zero_grad() + self.manual_backward(loss) + if self.ppo_cfg["max_grad_norm"] is not None: + self.clip_gradients( + opt, + gradient_clip_val=self.ppo_cfg["max_grad_norm"], + gradient_clip_algorithm="norm", + ) + opt.step() + + out.update( + { + "cost_init": cost_init, + "cost_bsf": td["cost_bsf"], + "loss": loss, + "surrogate_loss": surrogate_loss, + "value_loss": value_loss, + } + ) + metrics = self.log_metrics(out, phase, dataloader_idx=dataloader_idx) + return {"loss": out.get("loss", None), **metrics} diff --git a/rl4co/models/rl/ppo/ppo.py b/rl4co/models/rl/ppo/ppo.py new file mode 100644 index 00000000..2acc212e --- /dev/null +++ b/rl4co/models/rl/ppo/ppo.py @@ -0,0 +1,235 @@ +from typing import Any, Union + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from torch.utils.data import DataLoader + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl.common.base import RL4COLitModule +from rl4co.models.rl.common.critic import CriticNetwork, create_critic_from_actor +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class PPO(RL4COLitModule): + """ + An implementation of the Proximal Policy Optimization (PPO) algorithm (https://arxiv.org/abs/1707.06347) + is presented with modifications for autoregressive decoding schemes. 
+ + In contrast to the original PPO algorithm, this implementation does not consider autoregressive decoding steps + as part of the MDP transition. While many Neural Combinatorial Optimization (NCO) studies model decoding steps + as transitions in a solution-construction MDP, we treat autoregressive solution construction as an algorithmic + choice for tractable CO solution generation. This choice aligns with the Attention Model (AM) + (https://openreview.net/forum?id=ByxBFsRqYm), which treats decoding steps as a single-step MDP in Equation 9. + + Modeling autoregressive decoding steps as a single-step MDP introduces significant changes to the PPO implementation, + including: + - Generalized Advantage Estimation (GAE) (https://arxiv.org/abs/1506.02438) is not applicable since we are dealing with a single-step MDP. + - The definition of policy entropy can differ from the commonly implemented manner. + + The commonly implemented definition of policy entropy is the entropy of the policy distribution, given by: + + $$H(\\pi(x_t)) = - \\sum_{a_t \\in A_t} \\pi(a_t|x_t) \\log \\pi(a_t|x_t)$$ + + where $x_t$ represents the given state at step $t$, $A_t$ is the set of all (admisible) actions + at step $t$, and $a_t$ is the action taken at step $t$. + + If we interpret autoregressive decoding steps as transition steps of an MDP, the entropy for the entire decoding + process can be defined as the sum of entropies for each decoding step: + + $$H(\\pi) = \\sum_t H(\\pi(x_t))$$ + + However, if we consider autoregressive decoding steps as an algorithmic choice, the entropy for the entire decoding + process is defined as: + + $$H(\\pi) = - \\sum_{a \\in A} \\pi(a|x) \\log \\pi(a|x)$$ + + where $x$ represents the given CO problem instance, and $A$ is the set of all feasible solutions. 
+ + Due to the intractability of computing the entropy of the policy distribution over all feasible solutions, + we approximate it by computing the entropy over solutions generated by the policy itself. This approximation serves + as a proxy for the second definition of entropy, utilizing Monte Carlo sampling. + + It is worth noting that our modeling of decoding steps and the implementation of the PPO algorithm align with recent + work in the Natural Language Processing (NLP) community, specifically RL with Human Feedback (RLHF) + (e.g., https://github.com/lucidrains/PaLM-rlhf-pytorch). + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module, + critic: CriticNetwork = None, + critic_kwargs: dict = {}, + clip_range: float = 0.2, # epsilon of PPO + ppo_epochs: int = 2, # inner epoch, K + mini_batch_size: Union[int, float] = 0.25, # 0.25, + vf_lambda: float = 0.5, # lambda of Value function fitting + entropy_lambda: float = 0.0, # lambda of entropy bonus + normalize_adv: bool = False, # whether to normalize advantage + max_grad_norm: float = 0.5, # max gradient norm + metrics: dict = { + "train": ["reward", "loss", "surrogate_loss", "value_loss", "entropy"], + }, + **kwargs, + ): + super().__init__(env, policy, metrics=metrics, **kwargs) + self.automatic_optimization = False # PPO uses custom optimization routine + + if critic is None: + log.info("Creating critic network for {}".format(env.name)) + critic = create_critic_from_actor(policy, **critic_kwargs) + self.critic = critic + + if isinstance(mini_batch_size, float) and ( + mini_batch_size <= 0 or mini_batch_size > 1 + ): + default_mini_batch_fraction = 0.25 + log.warning( + f"mini_batch_size must be an integer or a float in the range (0, 1], got {mini_batch_size}. Setting mini_batch_size to {default_mini_batch_fraction}." 
+ ) + mini_batch_size = default_mini_batch_fraction + + if isinstance(mini_batch_size, int) and (mini_batch_size <= 0): + default_mini_batch_size = 128 + log.warning( + f"mini_batch_size must be an integer or a float in the range (0, 1], got {mini_batch_size}. Setting mini_batch_size to {default_mini_batch_size}." + ) + mini_batch_size = default_mini_batch_size + + self.ppo_cfg = { + "clip_range": clip_range, + "ppo_epochs": ppo_epochs, + "mini_batch_size": mini_batch_size, + "vf_lambda": vf_lambda, + "entropy_lambda": entropy_lambda, + "normalize_adv": normalize_adv, + "max_grad_norm": max_grad_norm, + } + + def configure_optimizers(self): + parameters = list(self.policy.parameters()) + list(self.critic.parameters()) + return super().configure_optimizers(parameters) + + def on_train_epoch_end(self): + """ + ToDo: Add support for other schedulers. + """ + + sch = self.lr_schedulers() + + # If the selected scheduler is a MultiStepLR scheduler. + if isinstance(sch, torch.optim.lr_scheduler.MultiStepLR): + sch.step() + + def shared_step( + self, batch: Any, batch_idx: int, phase: str, dataloader_idx: int = None + ): + # Evaluate old actions, log probabilities, and rewards + with torch.no_grad(): + td = self.env.reset(batch) # note: clone needed for dataloader + out = self.policy(td.clone(), self.env, phase=phase) + + if phase == "train": + batch_size = out["actions"].shape[0] + + # infer batch size + if isinstance(self.ppo_cfg["mini_batch_size"], float): + mini_batch_size = int(batch_size * self.ppo_cfg["mini_batch_size"]) + elif isinstance(self.ppo_cfg["mini_batch_size"], int): + mini_batch_size = self.ppo_cfg["mini_batch_size"] + else: + raise ValueError("mini_batch_size must be an integer or a float.") + + if mini_batch_size > batch_size: + mini_batch_size = batch_size + + # Todo: Add support for multi dimensional batches + td.set("logprobs", out["log_likelihood"]) + td.set("reward", out["reward"]) + td.set("action", out["actions"]) + + # Inherit the dataset class 
from the environment for efficiency + dataset = self.env.dataset_cls(td) + dataloader = DataLoader( + dataset, + batch_size=mini_batch_size, + shuffle=True, + collate_fn=dataset.collate_fn, + ) + + for _ in range(self.ppo_cfg["ppo_epochs"]): # PPO inner epoch, K + for sub_td in dataloader: + sub_td = sub_td.to(td.device) + previous_reward = sub_td["reward"].view(-1, 1) + out = self.policy( # note: remember to clone to avoid in-place replacements! + sub_td.clone(), + actions=sub_td["action"], + env=self.env, + return_entropy=True, + return_sum_log_likelihood=False, + ) + ll, entropy = out["log_likelihood"], out["entropy"] + + # Compute the ratio of probabilities of new and old actions + ratio = torch.exp(ll.sum(dim=-1) - sub_td["logprobs"]).view( + -1, 1 + ) # [batch, 1] + + # Compute the advantage + value_pred = self.critic(sub_td) # [batch, 1] + adv = previous_reward - value_pred.detach() + + # Normalize advantage + if self.ppo_cfg["normalize_adv"]: + adv = (adv - adv.mean()) / (adv.std() + 1e-8) + + # Compute the surrogate loss + surrogate_loss = -torch.min( + ratio * adv, + torch.clamp( + ratio, + 1 - self.ppo_cfg["clip_range"], + 1 + self.ppo_cfg["clip_range"], + ) + * adv, + ).mean() + + # compute value function loss + value_loss = F.huber_loss(value_pred, previous_reward) + + # compute total loss + loss = ( + surrogate_loss + + self.ppo_cfg["vf_lambda"] * value_loss + - self.ppo_cfg["entropy_lambda"] * entropy.mean() + ) + + # perform manual optimization following the Lightning routine + # https://lightning.ai/docs/pytorch/stable/common/optimization.html + + opt = self.optimizers() + opt.zero_grad() + self.manual_backward(loss) + if self.ppo_cfg["max_grad_norm"] is not None: + self.clip_gradients( + opt, + gradient_clip_val=self.ppo_cfg["max_grad_norm"], + gradient_clip_algorithm="norm", + ) + opt.step() + + out.update( + { + "loss": loss, + "surrogate_loss": surrogate_loss, + "value_loss": value_loss, + "entropy": entropy.mean(), + } + ) + + metrics = 
self.log_metrics(out, phase, dataloader_idx=dataloader_idx) + return {"loss": out.get("loss", None), **metrics} diff --git a/rl4co/models/rl/ppo/stepwise_ppo.py b/rl4co/models/rl/ppo/stepwise_ppo.py new file mode 100644 index 00000000..49d087d0 --- /dev/null +++ b/rl4co/models/rl/ppo/stepwise_ppo.py @@ -0,0 +1,171 @@ +import copy + +from typing import Any, Union + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from torchrl.data.replay_buffers import ( + LazyMemmapStorage, + ListStorage, + SamplerWithoutReplacement, + TensorDictReplayBuffer, +) + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl.common.base import RL4COLitModule +from rl4co.models.rl.common.utils import RewardScaler +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def make_replay_buffer(buffer_size, batch_size, device="cpu"): + if device == "cpu": + storage = LazyMemmapStorage(buffer_size, device="cpu") + prefetch = 3 + else: + storage = ListStorage(buffer_size) + prefetch = None + return TensorDictReplayBuffer( + storage=storage, + batch_size=batch_size, + sampler=SamplerWithoutReplacement(drop_last=True), + pin_memory=False, + prefetch=prefetch, + ) + + +class StepwisePPO(RL4COLitModule): + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module, + clip_range: float = 0.2, # epsilon of PPO + update_timestep: int = 1, + buffer_size: int = 100_000, + ppo_epochs: int = 2, # inner epoch, K + batch_size: int = 256, + mini_batch_size: int = 256, + vf_lambda: float = 0.5, # lambda of Value function fitting + entropy_lambda: float = 0.01, # lambda of entropy bonus + max_grad_norm: float = 0.5, # max gradient norm + buffer_storage_device: str = "gpu", + metrics: dict = { + "train": ["loss", "surrogate_loss", "value_loss", "entropy"], + }, + reward_scale: Union[str, int] = None, + **kwargs, + ): + super().__init__(env, policy, metrics=metrics, batch_size=batch_size, **kwargs) + + self.policy_old = 
copy.deepcopy(self.policy) + self.automatic_optimization = False # PPO uses custom optimization routine + self.rb = make_replay_buffer(buffer_size, mini_batch_size, buffer_storage_device) + self.scaler = RewardScaler(reward_scale) + + self.ppo_cfg = { + "clip_range": clip_range, + "ppo_epochs": ppo_epochs, + "update_timestep": update_timestep, + "mini_batch_size": mini_batch_size, + "vf_lambda": vf_lambda, + "entropy_lambda": entropy_lambda, + "max_grad_norm": max_grad_norm, + } + + def update(self, device): + outs = [] + # PPO inner epoch + for _ in range(self.ppo_cfg["ppo_epochs"]): + for sub_td in self.rb: + sub_td = sub_td.to(device) + previous_reward = sub_td["reward"].view(-1, 1) + previous_logp = sub_td["logprobs"] + + logprobs, value_pred, entropy = self.policy.evaluate(sub_td) + + ratios = torch.exp(logprobs - previous_logp) + + advantages = torch.squeeze(previous_reward - value_pred.detach(), 1) + surr1 = ratios * advantages + surr2 = ( + torch.clamp( + ratios, + 1 - self.ppo_cfg["clip_range"], + 1 + self.ppo_cfg["clip_range"], + ) + * advantages + ) + surrogate_loss = -torch.min(surr1, surr2).mean() + + # compute value function loss + value_loss = F.mse_loss(value_pred, previous_reward) + + # compute total loss + loss = ( + surrogate_loss + + self.ppo_cfg["vf_lambda"] * value_loss + - self.ppo_cfg["entropy_lambda"] * entropy.mean() + ) + + # perform manual optimization following the Lightning routine + # https://lightning.ai/docs/pytorch/stable/common/optimization.html + + opt = self.optimizers() + opt.zero_grad() + self.manual_backward(loss) + if self.ppo_cfg["max_grad_norm"] is not None: + self.clip_gradients( + opt, + gradient_clip_val=self.ppo_cfg["max_grad_norm"], + gradient_clip_algorithm="norm", + ) + opt.step() + + out = { + "reward": previous_reward.mean(), + "loss": loss, + "surrogate_loss": surrogate_loss, + "value_loss": value_loss, + "entropy": entropy.mean(), + } + + outs.append(out) + # Copy new weights into old policy: + 
self.policy_old.load_state_dict(self.policy.state_dict()) + outs = {k: torch.stack([dic[k] for dic in outs], dim=0) for k in outs[0]} + return outs + + def shared_step( + self, batch: Any, batch_idx: int, phase: str, dataloader_idx: int = None + ): + next_td = self.env.reset(batch) + device = next_td.device + if phase == "train": + while not next_td["done"].all(): + with torch.no_grad(): + td = self.policy_old.act(next_td, self.env, phase="train") + # get next state + next_td = self.env.step(td)["next"] + # get reward of action + reward = self.env.get_reward(next_td, None) + reward = self.scaler(reward) + # add reward to prior state + td.set("reward", reward) + # add tensordict with action, logprobs and reward information to buffer + self.rb.extend(td) + + # if iter mod x = 0 then update the policy (x = 1 in paper) + if batch_idx % self.ppo_cfg["update_timestep"] == 0: + out = self.update(device) + self.rb.empty() + + else: + out = self.policy.generate( + next_td, self.env, phase=phase, select_best=phase != "train" + ) + + metrics = self.log_metrics(out, phase, dataloader_idx=dataloader_idx) + return {"loss": out.get("loss", None), **metrics} diff --git a/rl4co/models/rl/reinforce/__init__.py b/rl4co/models/rl/reinforce/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/models/rl/reinforce/baselines.py b/rl4co/models/rl/reinforce/baselines.py new file mode 100644 index 00000000..e59b1969 --- /dev/null +++ b/rl4co/models/rl/reinforce/baselines.py @@ -0,0 +1,311 @@ +import abc +import copy + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from scipy.stats import ttest_rel +from tensordict import TensorDict +from torch.utils.data import DataLoader, Dataset + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl.common.critic import CriticNetwork, create_critic_from_actor +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class REINFORCEBaseline(nn.Module, 
metaclass=abc.ABCMeta): + """Base class for REINFORCE baselines""" + + def __init__(self, *args, **kw): + super().__init__() + pass + + def wrap_dataset(self, dataset: Dataset, *args, **kw): + """Wrap dataset with baseline-specific functionality""" + return dataset + + @abc.abstractmethod + def eval( + self, td: TensorDict, reward: torch.Tensor, env: RL4COEnvBase = None, **kwargs + ): + """Evaluate baseline""" + raise NotImplementedError + + def epoch_callback(self, *args, **kw): + """Callback at the end of each epoch + For example, update baseline parameters and obtain baseline values + """ + pass + + def setup(self, *args, **kw): + """To be called before training during setup phase + This follow PyTorch Lightning's setup() convention + """ + pass + + +class NoBaseline(REINFORCEBaseline): + """No baseline: return 0 for baseline and neg_los""" + + def eval(self, td, reward, env=None): + return 0, 0 # No baseline, no neg_los + + +class SharedBaseline(REINFORCEBaseline): + """Shared baseline: return mean of reward as baseline""" + + def eval(self, td, reward, env=None, on_dim=1): # e.g. [batch, pomo, ...] 
+ return reward.mean(dim=on_dim, keepdims=True), 0 + + +class ExponentialBaseline(REINFORCEBaseline): + """Exponential baseline: return exponential moving average of reward as baseline + + Args: + beta: Beta value for the exponential moving average + """ + + def __init__(self, beta=0.8, **kw): + super(REINFORCEBaseline, self).__init__() + + self.beta = beta + self.v = None + + def eval(self, td, reward, env=None): + if self.v is None: + v = reward.mean() + else: + v = self.beta * self.v + (1.0 - self.beta) * reward.mean() + self.v = v.detach() # Detach since we never want to backprop + return self.v, 0 # No loss + + +class MeanBaseline(REINFORCEBaseline): + """Mean baseline: return mean of reward as baseline""" + + def __new__(cls, **kw): + return ExponentialBaseline(beta=0.0, **kw) + + +class WarmupBaseline(REINFORCEBaseline): + """Warmup baseline: return convex combination of baseline and exponential baseline + + Args: + baseline: Baseline to use after warmup + n_epochs: Number of epochs to warmup + warmup_exp_beta: Beta value for the exponential baseline during warmup + """ + + def __init__(self, baseline, n_epochs=1, warmup_exp_beta=0.8, **kw): + super(REINFORCEBaseline, self).__init__() + + self.baseline = baseline + assert n_epochs > 0, "n_epochs to warmup must be positive" + self.warmup_baseline = ExponentialBaseline(warmup_exp_beta) + self.alpha = 0 + self.n_epochs = n_epochs + + def wrap_dataset(self, dataset, *args, **kw): + if self.alpha > 0: + return self.baseline.wrap_dataset(dataset, *args, **kw) + return self.warmup_baseline.wrap_dataset(dataset, *args, **kw) + + def setup(self, *args, **kw): + self.baseline.setup(*args, **kw) + + def eval(self, td, reward, env=None): + if self.alpha == 1: + return self.baseline.eval(td, reward, env) + if self.alpha == 0: + return self.warmup_baseline.eval(td, reward, env) + v_b, l_b = self.baseline.eval(td, reward, env) + v_wb, l_wb = self.warmup_baseline.eval(td, reward, env) + # Return convex combination of 
baseline and of loss + return ( + self.alpha * v_b + (1 - self.alpha) * v_wb, + self.alpha * l_b + (1 - self.alpha) * l_wb, + ) + + def epoch_callback(self, *args, **kw): + # Need to call epoch callback of inner policy (also after first epoch if we have not used it) + self.baseline.epoch_callback(*args, **kw) + if kw["epoch"] < self.n_epochs: + self.alpha = (kw["epoch"] + 1) / float(self.n_epochs) + log.info("Set warmup alpha = {}".format(self.alpha)) + + +class CriticBaseline(REINFORCEBaseline): + """Critic baseline: use critic network as baseline + + Args: + critic: Critic network to use as baseline. If None, create a new critic network based on the environment + """ + + def __init__(self, critic: CriticNetwork = None, **unused_kw): + super(CriticBaseline, self).__init__() + self.critic = critic + + def setup(self, policy, env, **kwargs): + if self.critic is None: + log.info("Critic not found. Creating critic network for {}".format(env.name)) + self.critic = create_critic_from_actor(policy) + + def eval(self, x, c, env=None): + v = self.critic(x).squeeze(-1) + # detach v since actor should not backprop through baseline, only for loss + return v.detach(), F.mse_loss(v, c.detach()) + + +class RolloutBaseline(REINFORCEBaseline): + """Rollout baseline: use greedy rollout as baseline + + Args: + bl_alpha: Alpha value for the baseline T-test + """ + + def __init__(self, bl_alpha=0.05, **kw): + super(RolloutBaseline, self).__init__() + self.bl_alpha = bl_alpha + + def setup(self, *args, **kw): + self._update_policy(*args, **kw) + + def _update_policy( + self, policy, env, batch_size=64, device="cpu", dataset_size=None, dataset=None + ): + """Update policy (=actor) and rollout baseline values""" + self.policy = copy.deepcopy(policy).to(device) + if dataset is None: + log.info("Creating evaluation dataset for rollout baseline") + self.dataset = env.dataset(batch_size=[dataset_size]) + + log.info("Evaluating baseline policy on evaluation dataset") + self.bl_vals = ( + 
self.rollout(self.policy, env, batch_size, device, self.dataset).cpu().numpy() + ) + self.mean = self.bl_vals.mean() + + def eval(self, td, reward, env): + """Evaluate rollout baseline + + Warning: + This is not differentiable and should only be used for evaluation. + Also, it is recommended to use the `rollout` method directly instead of this method. + """ + with torch.inference_mode(): + reward = self.policy(td, env)["reward"] + return reward, 0 + + def epoch_callback( + self, policy, env, batch_size=64, device="cpu", epoch=None, dataset_size=None + ): + """Challenges the current baseline with the policy and replaces the baseline policy if it is improved""" + log.info("Evaluating candidate policy on evaluation dataset") + candidate_vals = self.rollout(policy, env, batch_size, device).cpu().numpy() + candidate_mean = candidate_vals.mean() + + log.info( + "Candidate mean: {:.3f}, Baseline mean: {:.3f}".format( + candidate_mean, self.mean + ) + ) + if candidate_mean - self.mean > 0: + # Calc p value with inverse logic (costs) + t, p = ttest_rel(-candidate_vals, -self.bl_vals) + + p_val = p / 2 # one-sided + assert t < 0, "T-statistic should be negative" + log.info("p-value: {:.3f}".format(p_val)) + if p_val < self.bl_alpha: + log.info("Updating baseline") + self._update_policy(policy, env, batch_size, device, dataset_size) + + def rollout(self, policy, env, batch_size=64, device="cpu", dataset=None): + """Rollout the policy on the given dataset""" + + # if dataset is None, use the dataset of the baseline + dataset = self.dataset if dataset is None else dataset + + policy.eval() + policy = policy.to(device) + + def eval_policy(batch): + with torch.inference_mode(): + batch = env.reset(batch.to(device)) + return policy(batch, env, decode_type="greedy")["reward"] + + dl = DataLoader(dataset, batch_size=batch_size, collate_fn=dataset.collate_fn) + + rewards = torch.cat([eval_policy(batch) for batch in dl], 0) + return rewards + + def wrap_dataset(self, dataset, env, 
batch_size=64, device="cpu", **kw): + """Wrap the dataset in a baseline dataset + + Note: + This is an alternative to `eval` that does not require the policy to be passed + at every call but just once. Values are added to the dataset. This also allows for + larger batch sizes since we evauate the policy without gradients. + """ + rewards = ( + self.rollout(self.policy, env, batch_size, device, dataset=dataset) + .detach() + .cpu() + ) + return dataset.add_key("extra", rewards) + + def __getstate__(self): + """Do not include datasets in state to avoid pickling issues""" + state = self.__dict__.copy() + try: + del state["dataset"] + except KeyError: + pass + return state + + def __setstate__(self, state): + """Restore datasets after unpickling. Will be restored in setup""" + self.__dict__.update(state) + self.dataset = None + + +REINFORCE_BASELINES_REGISTRY = { + "no": NoBaseline, + "shared": SharedBaseline, + "exponential": ExponentialBaseline, + "critic": CriticBaseline, + "mean": MeanBaseline, + "rollout_only": RolloutBaseline, + "warmup": WarmupBaseline, +} + + +def get_reinforce_baseline(name, **kw): + """Get a REINFORCE baseline by name + The rollout baseline default to warmup baseline with one epoch of + exponential baseline and the greedy rollout + """ + if name == "warmup": + inner_baseline = kw.get("baseline", "rollout") + if not isinstance(inner_baseline, REINFORCEBaseline): + inner_baseline = get_reinforce_baseline(inner_baseline, **kw) + return WarmupBaseline(inner_baseline, **kw) + elif name == "rollout": + warmup_epochs = kw.get("n_epochs", 1) + warmup_exp_beta = kw.get("exp_beta", 0.8) + bl_alpha = kw.get("bl_alpha", 0.05) + return WarmupBaseline( + RolloutBaseline(bl_alpha=bl_alpha), warmup_epochs, warmup_exp_beta + ) + + if name is None: + name = "no" # default to no baseline + baseline_cls = REINFORCE_BASELINES_REGISTRY.get(name, None) + if baseline_cls is None: + raise ValueError( + f"Unknown baseline {baseline_cls}. 
Available baselines: {REINFORCE_BASELINES_REGISTRY.keys()}" + ) + return baseline_cls(**kw) diff --git a/rl4co/models/rl/reinforce/reinforce.py b/rl4co/models/rl/reinforce/reinforce.py new file mode 100644 index 00000000..269aaaff --- /dev/null +++ b/rl4co/models/rl/reinforce/reinforce.py @@ -0,0 +1,210 @@ +from typing import IO, Any, Optional, Union, cast + +import torch +import torch.nn as nn + +from lightning.fabric.utilities.types import _MAP_LOCATION_TYPE, _PATH +from lightning.pytorch.core.saving import _load_from_checkpoint +from tensordict import TensorDict +from typing_extensions import Self + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl.common.base import RL4COLitModule +from rl4co.models.rl.common.utils import RewardScaler +from rl4co.models.rl.reinforce.baselines import REINFORCEBaseline, get_reinforce_baseline +from rl4co.utils.lightning import get_lightning_device +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class REINFORCE(RL4COLitModule): + """REINFORCE algorithm, also known as policy gradients. + See superclass `RL4COLitModule` for more details. + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + baseline: REINFORCE baseline + baseline_kwargs: Keyword arguments for baseline. Ignored if baseline is not a string + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module, + baseline: Union[REINFORCEBaseline, str] = "rollout", + baseline_kwargs: dict = {}, + reward_scale: str = None, + **kwargs, + ): + super().__init__(env, policy, **kwargs) + + self.save_hyperparameters(logger=False) + + if baseline == "critic": + log.warning( + "Using critic as baseline. If you want more granular support, use the A2C module instead." 
+ ) + + if isinstance(baseline, str): + baseline = get_reinforce_baseline(baseline, **baseline_kwargs) + else: + if baseline_kwargs != {}: + log.warning("baseline_kwargs is ignored when baseline is not a string") + self.baseline = baseline + self.advantage_scaler = RewardScaler(reward_scale) + + def shared_step( + self, batch: Any, batch_idx: int, phase: str, dataloader_idx: int = None + ): + td = self.env.reset(batch) + # Perform forward pass (i.e., constructing solution and computing log-likelihoods) + out = self.policy(td, self.env, phase=phase, select_best=phase != "train") + + # Compute loss + if phase == "train": + out = self.calculate_loss(td, batch, out) + + metrics = self.log_metrics(out, phase, dataloader_idx=dataloader_idx) + return {"loss": out.get("loss", None), **metrics} + + def calculate_loss( + self, + td: TensorDict, + batch: TensorDict, + policy_out: dict, + reward: Optional[torch.Tensor] = None, + log_likelihood: Optional[torch.Tensor] = None, + ): + """Calculate loss for REINFORCE algorithm. + + Args: + td: TensorDict containing the current state of the environment + batch: Batch of data. This is used to get the extra loss terms, e.g., REINFORCE baseline + policy_out: Output of the policy network + reward: Reward tensor. If None, it is taken from `policy_out` + log_likelihood: Log-likelihood tensor. 
If None, it is taken from `policy_out` + """ + # Extra: this is used for additional loss terms, e.g., REINFORCE baseline + extra = batch.get("extra", None) + reward = reward if reward is not None else policy_out["reward"] + log_likelihood = ( + log_likelihood if log_likelihood is not None else policy_out["log_likelihood"] + ) + + # REINFORCE baseline + bl_val, bl_loss = ( + self.baseline.eval(td, reward, self.env) if extra is None else (extra, 0) + ) + + # Main loss function + advantage = reward - bl_val # advantage = reward - baseline + advantage = self.advantage_scaler(advantage) + reinforce_loss = -(advantage * log_likelihood).mean() + loss = reinforce_loss + bl_loss + policy_out.update( + { + "loss": loss, + "reinforce_loss": reinforce_loss, + "bl_loss": bl_loss, + "bl_val": bl_val, + } + ) + return policy_out + + def post_setup_hook(self, stage="fit"): + # Make baseline taking model itself and train_dataloader from model as input + self.baseline.setup( + self.policy, + self.env, + batch_size=self.val_batch_size, + device=get_lightning_device(self), + dataset_size=self.data_cfg["val_data_size"], + ) + + def on_train_epoch_end(self): + """Callback for end of training epoch: we evaluate the baseline""" + self.baseline.epoch_callback( + self.policy, + env=self.env, + batch_size=self.val_batch_size, + device=get_lightning_device(self), + epoch=self.current_epoch, + dataset_size=self.data_cfg["val_data_size"], + ) + # Need to call super() for the dataset to be reset + super().on_train_epoch_end() + + def wrap_dataset(self, dataset): + """Wrap dataset from baseline evaluation. Used in greedy rollout baseline""" + return self.baseline.wrap_dataset( + dataset, + self.env, + batch_size=self.val_batch_size, + device=get_lightning_device(self), + ) + + def set_decode_type_multistart(self, phase: str): + """Set decode type to `multistart` for train, val and test in policy. + For example, if the decode type is `greedy`, it will be set to `multistart_greedy`. 
+ + Args: + phase: Phase to set decode type for. Must be one of `train`, `val` or `test`. + """ + attribute = f"{phase}_decode_type" + attr_get = getattr(self.policy, attribute) + # If does not exist, log error + if attr_get is None: + log.error(f"Decode type for {phase} is None. Cannot prepend `multistart_`.") + return + elif "multistart" in attr_get: + return + else: + setattr(self.policy, attribute, f"multistart_{attr_get}") + + @classmethod + def load_from_checkpoint( + cls, + checkpoint_path: Union[_PATH, IO], + map_location: _MAP_LOCATION_TYPE = None, + hparams_file: Optional[_PATH] = None, + strict: bool = False, + load_baseline: bool = True, + **kwargs: Any, + ) -> Self: + """Load model from checkpoint/ + + Note: + This is a modified version of `load_from_checkpoint` from `pytorch_lightning.core.saving`. + It deals with matching keys for the baseline by first running setup + """ + + if strict: + log.warning("Setting strict=False for loading model from checkpoint.") + strict = False + + # Do not use strict + loaded = _load_from_checkpoint( + cls, + checkpoint_path, + map_location, + hparams_file, + strict, + **kwargs, + ) + + # Load baseline state dict + if load_baseline: + # setup baseline first + loaded.setup() + loaded.post_setup_hook() + # load baseline state dict + state_dict = torch.load(checkpoint_path, map_location=map_location)["state_dict"] + # get only baseline parameters + state_dict = {k: v for k, v in state_dict.items() if "baseline" in k} + state_dict = {k.replace("baseline.", "", 1): v for k, v in state_dict.items()} + loaded.baseline.load_state_dict(state_dict) + + return cast(Self, loaded) diff --git a/rl4co/models/zoo/__init__.py b/rl4co/models/zoo/__init__.py new file mode 100644 index 00000000..7fbb41eb --- /dev/null +++ b/rl4co/models/zoo/__init__.py @@ -0,0 +1,30 @@ +from rl4co.models.common.constructive.autoregressive import AutoregressivePolicy +from rl4co.models.common.constructive.nonautoregressive import NonAutoregressivePolicy 
+from rl4co.models.common.transductive import TransductiveModel +from rl4co.models.zoo.active_search import ActiveSearch +from rl4co.models.zoo.am import AttentionModel, AttentionModelPolicy +from rl4co.models.zoo.amppo import AMPPO +from rl4co.models.zoo.dact import DACT, DACTPolicy +from rl4co.models.zoo.deepaco import DeepACO, DeepACOPolicy +from rl4co.models.zoo.eas import EAS, EASEmb, EASLay +from rl4co.models.zoo.ham import ( + HeterogeneousAttentionModel, + HeterogeneousAttentionModelPolicy, +) +from rl4co.models.zoo.l2d import ( + L2DAttnPolicy, + L2DModel, + L2DPolicy, + L2DPolicy4PPO, + L2DPPOModel, +) +from rl4co.models.zoo.matnet import MatNet, MatNetPolicy +from rl4co.models.zoo.mdam import MDAM, MDAMPolicy +from rl4co.models.zoo.mvmoe import MVMoE_AM, MVMoE_POMO +from rl4co.models.zoo.n2s import N2S, N2SPolicy +from rl4co.models.zoo.nargnn import NARGNNPolicy +from rl4co.models.zoo.neuopt import NeuOpt, NeuOptPolicy +from rl4co.models.zoo.polynet import PolyNet +from rl4co.models.zoo.pomo import POMO +from rl4co.models.zoo.ptrnet import PointerNetwork, PointerNetworkPolicy +from rl4co.models.zoo.symnco import SymNCO, SymNCOPolicy diff --git a/rl4co/models/zoo/active_search/__init__.py b/rl4co/models/zoo/active_search/__init__.py new file mode 100644 index 00000000..9e25b87d --- /dev/null +++ b/rl4co/models/zoo/active_search/__init__.py @@ -0,0 +1 @@ +from .search import ActiveSearch diff --git a/rl4co/models/zoo/active_search/search.py b/rl4co/models/zoo/active_search/search.py new file mode 100644 index 00000000..3b588b8d --- /dev/null +++ b/rl4co/models/zoo/active_search/search.py @@ -0,0 +1,202 @@ +import time + +from functools import partial +from typing import Any, Union + +import torch + +from lightning.pytorch.utilities.types import STEP_OUTPUT +from torch.utils.data import Dataset + +from rl4co.data.transforms import StateAugmentation +from rl4co.models.common.transductive import TransductiveModel +from rl4co.utils.ops import batchify, 
unbatchify
+from rl4co.utils.pylogger import get_pylogger
+
+log = get_pylogger(__name__)
+
+
+class ActiveSearch(TransductiveModel):
+    """Active Search for Neural Combinatorial Optimization from Bello et al. (2016).
+    Fine-tunes the whole policy network (encoder + decoder) on a batch of instances.
+    Reference: https://arxiv.org/abs/1611.09940
+
+    Args:
+        env: RL4CO environment to be solved
+        policy: policy network
+        dataset: dataset to be used for training
+        batch_size: batch size for training
+        max_iters: maximum number of iterations
+        augment_size: number of augmentations per state
+        augment_dihedral: whether to augment with dihedral rotations
+        num_parallel_runs: number of parallel runs
+        max_runtime: maximum runtime in seconds
+        save_path: path to save solution checkpoints
+        optimizer: optimizer to use for training
+        optimizer_kwargs: keyword arguments for optimizer
+        **kwargs: additional keyword arguments
+    """
+
+    def __init__(
+        self,
+        env,
+        policy,
+        dataset: Union[Dataset, str],
+        batch_size: int = 1,
+        max_iters: int = 200,
+        augment_size: int = 8,
+        augment_dihedral: bool = True,
+        num_parallel_runs: int = 1,
+        max_runtime: int = 86_400,
+        save_path: str = None,
+        optimizer: Union[str, torch.optim.Optimizer, partial] = "Adam",
+        optimizer_kwargs: dict = {"lr": 2.6e-4, "weight_decay": 1e-6},
+        **kwargs,
+    ):
+        self.save_hyperparameters(logger=False)
+
+        assert batch_size == 1, "Batch size must be 1 for active search"
+
+        super(ActiveSearch, self).__init__(
+            env,
+            policy=policy,
+            dataset=dataset,
+            batch_size=batch_size,
+            max_iters=max_iters,
+            max_runtime=max_runtime,
+            save_path=save_path,
+            optimizer=optimizer,
+            optimizer_kwargs=optimizer_kwargs,
+            **kwargs,
+        )
+
+    def setup(self, stage="fit"):
+        """Setup base class and instantiate:
+        - augmentation
+        - instance solutions and rewards
+        - original policy state dict
+        """
+        log.info("Setting up active search...")
+        super(ActiveSearch, self).setup(stage)
+
+        # Instantiate augmentation
+        self.augmentation = StateAugmentation(
+            num_augment=self.hparams.augment_size,
+            augment_fn="dihedral8" if self.hparams.augment_dihedral else "symmetric",
+        )
+
+        # Clone the original weights: `state_dict()` aliases the live parameters
+        state = self.policy.state_dict()
+        self.original_policy_state = {k: v.clone() for k, v in state.items()}
+
+        # Get dataset size and problem size
+        dataset_size = len(self.dataset)
+        _batch = next(iter(self.train_dataloader()))
+        self.problem_size = self.env.reset(_batch)["action_mask"].shape[-1]
+        self.instance_solutions = torch.zeros(
+            dataset_size, self.problem_size * 2, dtype=int
+        )
+        self.instance_rewards = torch.zeros(dataset_size)
+
+    def on_train_batch_start(self, batch: Any, batch_idx: int):
+        """Called before training (i.e. search) for a new batch begins.
+        We re-load the original policy state dict and configure the optimizer.
+        """
+        self.policy.load_state_dict(self.original_policy_state)
+        self.configure_optimizers(self.policy.parameters())
+
+    def training_step(self, batch, batch_idx):
+        """Main search loop. We use the training step to effectively adapt to a `batch` of instances."""
+        # Augment state
+        batch_size = batch.shape[0]
+        td_init = self.env.reset(batch)
+        n_aug, n_start, n_runs = (
+            self.augmentation.num_augment,
+            self.env.get_num_starts(td_init),
+            self.hparams.num_parallel_runs,
+        )
+        td_init = self.augmentation(td_init)
+        td_init = batchify(td_init, n_runs)
+
+        # Solution and reward buffer
+        max_reward = torch.full((batch_size,), -float("inf"), device=batch.device)
+        best_solutions = torch.zeros(
+            batch_size, self.problem_size * 2, device=batch.device, dtype=int
+        )
+
+        # Init search
+        t_start = time.time()
+        for i in range(self.hparams.max_iters):
+            # Evaluate policy with sampling multistarts (as in POMO)
+            out = self.policy(
+                td_init.clone(),
+                env=self.env,
+                decode_type="multistart_sampling",
+                num_starts=n_start,
+            )
+
+            if i == 0:
+                log.info(f"Initial reward: {out['reward'].max():.2f}")
+
+            # Update best solution and reward found
+            max_reward_iter = out["reward"].max()
+            if max_reward_iter > max_reward:
+                max_reward_idx = out["reward"].argmax()
+                best_solution_iter = out["actions"][max_reward_idx]
+                max_reward = max_reward_iter
+                best_solutions[0, : best_solution_iter.shape[0]] = best_solution_iter
+
+            # Compute REINFORCE loss with shared baseline
+            reward = unbatchify(out["reward"], (n_runs, n_aug, n_start))
+            ll = unbatchify(out["log_likelihood"], (n_runs, n_aug, n_start))
+            advantage = reward - reward.mean(dim=-1, keepdim=True)
+            loss = -(advantage * ll).mean()
+
+            # Backpropagate and update the policy via Lightning manual optimization:
+            # https://lightning.ai/docs/pytorch/stable/common/optimization.html
+            opt = self.optimizers()
+            opt.zero_grad()
+            self.manual_backward(loss)
+            opt.step()
+            self.log_dict(
+                {
+                    "loss": loss,
+                    "max_reward": max_reward,
+                    "step": i,
+                    "time": time.time() - t_start,
+                },
+                on_step=self.log_on_step,
+            )
+
+            # Stop if max runtime is exceeded
+            if time.time() - t_start > self.hparams.max_runtime:
+                break
+
+        return {"max_reward": max_reward, "best_solutions": best_solutions}
+
+    def on_train_batch_end(
+        self, outputs: STEP_OUTPUT, batch: Any, batch_idx: int
+    ) -> None:
+        """We store the best solution and reward found."""
+        max_rewards, best_solutions = outputs["max_reward"], outputs["best_solutions"]
+        self.instance_rewards[batch_idx] = max_rewards
+        # only one instance per batch, so drop the leading batch dimension
+        self.instance_solutions[batch_idx, :] = best_solutions.squeeze(0)
+        log.info(f"Best reward: {max_rewards.mean():.2f}")
+
+    def on_train_epoch_end(self) -> None:
+        """Called when the training ends.
+        If the epoch ends, it means we have finished searching over the
+        instances, thus the trainer should stop.
+        """
+        save_path = self.hparams.save_path
+        if save_path is not None:
+            log.info(f"Saving solutions and rewards to {save_path}...")
+            torch.save(
+                {"solutions": self.instance_solutions, "rewards": self.instance_rewards},
+                save_path,
+            )
+
+        # https://github.com/Lightning-AI/lightning/issues/1406
+        self.trainer.should_stop = True
diff --git a/rl4co/models/zoo/am/__init__.py b/rl4co/models/zoo/am/__init__.py
new file mode 100644
index 00000000..dda6581c
--- /dev/null
+++ b/rl4co/models/zoo/am/__init__.py
@@ -0,0 +1,2 @@
+from .model import AttentionModel
+from .policy import AttentionModelPolicy
diff --git a/rl4co/models/zoo/am/decoder.py b/rl4co/models/zoo/am/decoder.py
new file mode 100644
index 00000000..61600050
--- /dev/null
+++ b/rl4co/models/zoo/am/decoder.py
@@ -0,0 +1,235 @@
+from dataclasses import dataclass, fields
+from typing import Tuple, Union
+
+import torch
+import torch.nn as nn
+
+from einops import rearrange
+from tensordict import TensorDict
+from torch import Tensor
+
+from rl4co.envs import RL4COEnvBase
+from rl4co.models.common.constructive.autoregressive.decoder import AutoregressiveDecoder
+from rl4co.models.nn.attention import PointerAttention, PointerAttnMoE
+from rl4co.models.nn.env_embeddings import env_context_embedding, env_dynamic_embedding
+from rl4co.models.nn.env_embeddings.dynamic import StaticEmbedding
+from rl4co.utils.ops import batchify, unbatchify
+from rl4co.utils.pylogger import get_pylogger
+
+log = get_pylogger(__name__)
+
+
+@dataclass
+class PrecomputedCache:
+    node_embeddings: Tensor
+    graph_context: Union[Tensor, float]
+    glimpse_key: Tensor
+    glimpse_val: Tensor
+    logit_key: Tensor
+
+    @property
+    def fields(self):
+        return tuple(getattr(self, x.name) for x in fields(self))
+
+    def batchify(self, num_starts):
+        new_embs = []
+        for emb in self.fields:
+            if isinstance(emb, (Tensor, TensorDict)):
+                new_embs.append(batchify(emb, num_starts))
+            else:
+                new_embs.append(emb)
+        return PrecomputedCache(*new_embs)
+
+
+class AttentionModelDecoder(AutoregressiveDecoder):
+    """
+    Auto-regressive decoder based on Kool et al. (2019): https://arxiv.org/abs/1803.08475.
+    Given the environment state and the embeddings, compute the logits and sample actions autoregressively until
+    all the environments in the batch have reached a terminal state.
+    In this case we additionally have a `pre_decoder_hook` method that allows to precompute the embeddings before
+    the decoder is called, which saves a lot of computation.
+
+
+    Args:
+        embed_dim: Embedding dimension
+        num_heads: Number of attention heads
+        env_name: Name of the environment used to initialize embeddings
+        context_embedding: Context embedding module
+        dynamic_embedding: Dynamic embedding module
+        mask_inner: Whether to mask the inner loop
+        out_bias_pointer_attn: Whether to use a bias in the pointer attention
+        linear_bias: Whether to use a bias in the linear layer
+        use_graph_context: Whether to use the graph context
+        check_nan: Whether to check for nan values during decoding
+        sdpa_fn: scaled_dot_product_attention function
+        pointer: Module implementing the pointer logic (defaults to PointerAttention)
+        moe_kwargs: Keyword arguments for MoE
+    """
+
+    def __init__(
+        self,
+        embed_dim: int = 128,
+        num_heads: int = 8,
+        env_name: str = "tsp",
+        context_embedding: nn.Module = None,
+        dynamic_embedding: nn.Module = None,
+        mask_inner: bool = True,
+        out_bias_pointer_attn: bool = False,
+        linear_bias: bool = False,
+        use_graph_context: bool = True,
+        check_nan: bool = True,
+        sdpa_fn: callable = None,
+        pointer: nn.Module = None,
+        moe_kwargs: dict = None,
+    ):
+        super().__init__()
+
+        if isinstance(env_name, RL4COEnvBase):
+            env_name = env_name.name
+        self.env_name = env_name
+        self.embed_dim = embed_dim
+        self.num_heads = num_heads
+
+        assert embed_dim % num_heads == 0
+
+        self.context_embedding = (
+            env_context_embedding(self.env_name, {"embed_dim": embed_dim})
+            if context_embedding is None
+            else context_embedding
+        )
+        self.dynamic_embedding = (
+            env_dynamic_embedding(self.env_name, {"embed_dim": embed_dim})
+            if dynamic_embedding is None
+            else dynamic_embedding
+        )
+        self.is_dynamic_embedding = not isinstance(
+            self.dynamic_embedding, StaticEmbedding
+        )
+
+        if pointer is None:
+            # MHA with Pointer mechanism (https://arxiv.org/abs/1506.03134)
+            pointer_attn_class = (
+                PointerAttention if moe_kwargs is None else PointerAttnMoE
+            )
+            pointer = pointer_attn_class(
+                embed_dim,
+                num_heads,
+                mask_inner=mask_inner,
+                out_bias=out_bias_pointer_attn,
+                check_nan=check_nan,
+                sdpa_fn=sdpa_fn,
+                moe_kwargs=moe_kwargs,
+            )
+
+        self.pointer = pointer
+
+        # For each node we compute (glimpse key, glimpse value, logit key) so 3 * embed_dim
+        self.project_node_embeddings = nn.Linear(
+            embed_dim, 3 * embed_dim, bias=linear_bias
+        )
+        self.project_fixed_context = nn.Linear(embed_dim, embed_dim, bias=linear_bias)
+        self.use_graph_context = use_graph_context
+
+    def _compute_q(self, cached: PrecomputedCache, td: TensorDict):
+        node_embeds_cache = cached.node_embeddings
+        graph_context_cache = cached.graph_context
+
+        if td.dim() == 2 and isinstance(graph_context_cache, Tensor):
+            graph_context_cache = graph_context_cache.unsqueeze(1)
+
+        step_context = self.context_embedding(node_embeds_cache, td)
+        glimpse_q = step_context + graph_context_cache
+        # add seq_len dim if not present
+        glimpse_q = glimpse_q.unsqueeze(1) if glimpse_q.ndim == 2 else glimpse_q
+
+        return glimpse_q
+
+    def _compute_kvl(self, cached: PrecomputedCache, td: TensorDict):
+        glimpse_k_stat, glimpse_v_stat, logit_k_stat = (
+            cached.glimpse_key,
+            cached.glimpse_val,
+            cached.logit_key,
+        )
+        # Compute dynamic embeddings and add to static embeddings
+        glimpse_k_dyn, glimpse_v_dyn, logit_k_dyn = self.dynamic_embedding(td)
+        glimpse_k = glimpse_k_stat + glimpse_k_dyn
+        glimpse_v = glimpse_v_stat + glimpse_v_dyn
+        logit_k = logit_k_stat + logit_k_dyn
+
+        return glimpse_k, glimpse_v, logit_k
+
+    def forward(
+        self,
+        td: TensorDict,
+        cached: PrecomputedCache,
+        num_starts: int = 0,
+    ) -> Tuple[Tensor, Tensor]:
+        """Compute the logits of the next actions given the current state
+
+        Args:
+            cached: Precomputed embeddings
+            td: TensorDict with the current environment state
+            num_starts: Number of starts for the multi-start decoding
+        """
+
+        has_dyn_emb_multi_start = self.is_dynamic_embedding and num_starts > 1
+
+        # Handle efficient multi-start decoding
+        if has_dyn_emb_multi_start:
+            # if num_starts > 0 and we have some dynamic embeddings, we need to reshape them to [B*S, ...]
+            # since keys and values are not shared across starts (i.e. the episodes modify these embeddings at each step)
+            cached = cached.batchify(num_starts=num_starts)
+
+        elif num_starts > 1:
+            td = unbatchify(td, num_starts)
+
+        glimpse_q = self._compute_q(cached, td)
+        glimpse_k, glimpse_v, logit_k = self._compute_kvl(cached, td)
+
+        # Compute logits
+        mask = td["action_mask"]
+        logits = self.pointer(glimpse_q, glimpse_k, glimpse_v, logit_k, mask)
+
+        # Now we need to reshape the logits and mask to [B*S,N,...] if num_starts > 1 without dynamic embeddings
+        # note that rearranging order is important here
+        if num_starts > 1 and not has_dyn_emb_multi_start:
+            logits = rearrange(logits, "b s l -> (s b) l", s=num_starts)
+            mask = rearrange(mask, "b s l -> (s b) l", s=num_starts)
+        return logits, mask
+
+    def pre_decoder_hook(
+        self, td, env, embeddings, num_starts: int = 0
+    ) -> Tuple[TensorDict, RL4COEnvBase, PrecomputedCache]:
+        """Precompute the embeddings cache before the decoder is called"""
+        return td, env, self._precompute_cache(embeddings, num_starts=num_starts)
+
+    def _precompute_cache(
+        self, embeddings: torch.Tensor, num_starts: int = 0
+    ) -> PrecomputedCache:
+        """Compute the cached embeddings for the pointer attention.
+
+        Args:
+            embeddings: Precomputed embeddings for the nodes
+            num_starts: Number of starts for the multi-start decoding
+        """
+        # The projection of the node embeddings for the attention is calculated once up front
+        (
+            glimpse_key_fixed,
+            glimpse_val_fixed,
+            logit_key_fixed,
+        ) = self.project_node_embeddings(embeddings).chunk(3, dim=-1)
+
+        # Optionally disable the graph context from the initial embedding as done in POMO
+        if self.use_graph_context:
+            graph_context = self.project_fixed_context(embeddings.mean(1))
+        else:
+            graph_context = 0
+
+        # Organize in a dataclass for easy access
+        return PrecomputedCache(
+            node_embeddings=embeddings,
+            graph_context=graph_context,
+            glimpse_key=glimpse_key_fixed,
+            glimpse_val=glimpse_val_fixed,
+            logit_key=logit_key_fixed,
+        )
diff --git a/rl4co/models/zoo/am/encoder.py b/rl4co/models/zoo/am/encoder.py
new file mode 100644
index 00000000..b3a01a2f
--- /dev/null
+++ b/rl4co/models/zoo/am/encoder.py
@@ -0,0 +1,91 @@
+from typing import Tuple, Union
+
+import torch.nn as nn
+
+from tensordict import TensorDict
+from torch import Tensor
+
+from rl4co.envs import RL4COEnvBase
+from rl4co.models.common.constructive import AutoregressiveEncoder
+from rl4co.models.nn.env_embeddings import env_init_embedding
+from rl4co.models.nn.graph.attnnet import GraphAttentionNetwork
+
+
+class AttentionModelEncoder(AutoregressiveEncoder):
+    """Graph Attention Encoder as in Kool et al. (2019).
+    First embed the input and then process it with a Graph Attention Network.
+
+    Args:
+        embed_dim: Dimension of the embedding space
+        init_embedding: Module to use for the initialization of the embeddings
+        env_name: Name of the environment used to initialize embeddings
+        num_heads: Number of heads in the attention layers
+        num_layers: Number of layers in the attention network
+        normalization: Normalization type in the attention layers
+        feedforward_hidden: Hidden dimension in the feedforward layers
+        net: Graph Attention Network to use
+        sdpa_fn: Function to use for the scaled dot product attention
+        moe_kwargs: Keyword arguments for MoE
+    """
+
+    def __init__(
+        self,
+        embed_dim: int = 128,
+        init_embedding: nn.Module = None,
+        env_name: str = "tsp",
+        num_heads: int = 8,
+        num_layers: int = 3,
+        normalization: str = "batch",
+        feedforward_hidden: int = 512,
+        net: nn.Module = None,
+        sdpa_fn=None,
+        moe_kwargs: dict = None,
+    ):
+        super(AttentionModelEncoder, self).__init__()
+
+        if isinstance(env_name, RL4COEnvBase):
+            env_name = env_name.name
+        self.env_name = env_name
+
+        self.init_embedding = (
+            env_init_embedding(self.env_name, {"embed_dim": embed_dim})
+            if init_embedding is None
+            else init_embedding
+        )
+
+        self.net = (
+            GraphAttentionNetwork(
+                num_heads,
+                embed_dim,
+                num_layers,
+                normalization,
+                feedforward_hidden,
+                sdpa_fn=sdpa_fn,
+                moe_kwargs=moe_kwargs,
+            )
+            if net is None
+            else net
+        )
+
+    def forward(
+        self, td: TensorDict, mask: Union[Tensor, None] = None
+    ) -> Tuple[Tensor, Tensor]:
+        """Forward pass of the encoder.
+        Transform the input TensorDict into a latent representation.
+
+        Args:
+            td: Input TensorDict containing the environment state
+            mask: Mask to apply to the attention
+
+        Returns:
+            h: Latent representation of the input
+            init_h: Initial embedding of the input
+        """
+        # Transfer to embedding space
+        init_h = self.init_embedding(td)
+
+        # Process embedding
+        h = self.net(init_h, mask)
+
+        # Return latent representation and initial embedding
+        return h, init_h
diff --git a/rl4co/models/zoo/am/model.py b/rl4co/models/zoo/am/model.py
new file mode 100644
index 00000000..bb6b8e41
--- /dev/null
+++ b/rl4co/models/zoo/am/model.py
@@ -0,0 +1,34 @@
+from typing import Union
+
+from rl4co.envs.common.base import RL4COEnvBase
+from rl4co.models.rl import REINFORCE
+from rl4co.models.rl.reinforce.baselines import REINFORCEBaseline
+from rl4co.models.zoo.am.policy import AttentionModelPolicy
+
+
+class AttentionModel(REINFORCE):
+    """Attention Model based on REINFORCE: https://arxiv.org/abs/1803.08475.
+    Check :class:`REINFORCE` and :class:`rl4co.models.RL4COLitModule` for more details such as additional parameters including batch size.
+
+    Args:
+        env: Environment to use for the algorithm
+        policy: Policy to use for the algorithm
+        baseline: REINFORCE baseline. Defaults to rollout (1 epoch of exponential, then greedy rollout baseline)
+        policy_kwargs: Keyword arguments for policy
+        baseline_kwargs: Keyword arguments for baseline
+        **kwargs: Keyword arguments passed to the superclass
+    """
+
+    def __init__(
+        self,
+        env: RL4COEnvBase,
+        policy: AttentionModelPolicy = None,
+        baseline: Union[REINFORCEBaseline, str] = "rollout",
+        policy_kwargs={},
+        baseline_kwargs={},
+        **kwargs,
+    ):
+        if policy is None:
+            policy = AttentionModelPolicy(env_name=env.name, **policy_kwargs)
+
+        super().__init__(env, policy, baseline, baseline_kwargs, **kwargs)
diff --git a/rl4co/models/zoo/am/policy.py b/rl4co/models/zoo/am/policy.py
new file mode 100644
index 00000000..d650b72a
--- /dev/null
+++ b/rl4co/models/zoo/am/policy.py
@@ -0,0 +1,122 @@
+from typing import Callable
+
+import torch.nn as nn
+
+from rl4co.models.common.constructive.autoregressive.policy import AutoregressivePolicy
+from rl4co.models.zoo.am.decoder import AttentionModelDecoder
+from rl4co.models.zoo.am.encoder import AttentionModelEncoder
+
+
+class AttentionModelPolicy(AutoregressivePolicy):
+    """
+    Attention Model Policy based on Kool et al. (2019): https://arxiv.org/abs/1803.08475.
+    This model first encodes the input graph using a Graph Attention Network (GAT) (:class:`AttentionModelEncoder`)
+    and then decodes the solution using a pointer network (:class:`AttentionModelDecoder`). Cache is used to store the
+    embeddings of the nodes to be used by the decoder to save computation.
+    See :class:`rl4co.models.common.constructive.autoregressive.policy.AutoregressivePolicy` for more details on the inference process.
+
+    Args:
+        encoder: Encoder module, defaults to :class:`AttentionModelEncoder`
+        decoder: Decoder module, defaults to :class:`AttentionModelDecoder`
+        embed_dim: Dimension of the node embeddings
+        num_encoder_layers: Number of layers in the encoder
+        num_heads: Number of heads in the attention layers
+        normalization: Normalization type in the attention layers
+        feedforward_hidden: Dimension of the hidden layer in the feedforward network
+        env_name: Name of the environment used to initialize embeddings
+        encoder_network: Network to use for the encoder
+        init_embedding: Module to use for the initialization of the embeddings
+        context_embedding: Module to use for the context embedding
+        dynamic_embedding: Module to use for the dynamic embedding
+        use_graph_context: Whether to use the graph context
+        linear_bias_decoder: Whether to use a bias in the linear layer of the decoder
+        sdpa_fn_encoder: Function to use for the scaled dot product attention in the encoder
+        sdpa_fn_decoder: Function to use for the scaled dot product attention in the decoder
+        sdpa_fn: (deprecated) Function to use for the scaled dot product attention
+        mask_inner: Whether to mask the inner product
+        out_bias_pointer_attn: Whether to use a bias in the pointer attention
+        check_nan: Whether to check for nan values during decoding
+        temperature: Temperature for the softmax
+        tanh_clipping: Tanh clipping value (see Bello et al., 2016)
+        mask_logits: Whether to mask the logits during decoding
+        train_decode_type: Type of decoding to use during training
+        val_decode_type: Type of decoding to use during validation
+        test_decode_type: Type of decoding to use during testing
+        moe_kwargs: Keyword arguments for MoE,
+            e.g., {"encoder": {"hidden_act": "ReLU", "num_experts": 4, "k": 2, "noisy_gating": True},
+                   "decoder": {"light_version": True, ...}}
+    """
+
+    def __init__(
+        self,
+        encoder: nn.Module = None,
+        decoder: nn.Module = None,
+        embed_dim: int = 128,
+        num_encoder_layers: int = 3,
+        num_heads: int = 8,
+        normalization: str = "batch",
+        feedforward_hidden: int = 512,
+        env_name: str = "tsp",
+        encoder_network: nn.Module = None,
+        init_embedding: nn.Module = None,
+        context_embedding: nn.Module = None,
+        dynamic_embedding: nn.Module = None,
+        use_graph_context: bool = True,
+        linear_bias_decoder: bool = False,
+        sdpa_fn: Callable = None,
+        sdpa_fn_encoder: Callable = None,
+        sdpa_fn_decoder: Callable = None,
+        mask_inner: bool = True,
+        out_bias_pointer_attn: bool = False,
+        check_nan: bool = True,
+        temperature: float = 1.0,
+        tanh_clipping: float = 10.0,
+        mask_logits: bool = True,
+        train_decode_type: str = "sampling",
+        val_decode_type: str = "greedy",
+        test_decode_type: str = "greedy",
+        moe_kwargs: dict = {"encoder": None, "decoder": None},
+        **unused_kwargs,
+    ):
+        if encoder is None:
+            encoder = AttentionModelEncoder(
+                embed_dim=embed_dim,
+                num_heads=num_heads,
+                num_layers=num_encoder_layers,
+                env_name=env_name,
+                normalization=normalization,
+                feedforward_hidden=feedforward_hidden,
+                net=encoder_network,
+                init_embedding=init_embedding,
+                sdpa_fn=sdpa_fn if sdpa_fn_encoder is None else sdpa_fn_encoder,
+                moe_kwargs=moe_kwargs["encoder"],
+            )
+
+        if decoder is None:
+            decoder = AttentionModelDecoder(
+                embed_dim=embed_dim,
+                num_heads=num_heads,
+                env_name=env_name,
+                context_embedding=context_embedding,
+                dynamic_embedding=dynamic_embedding,
+                sdpa_fn=sdpa_fn if sdpa_fn_decoder is None else sdpa_fn_decoder,
+                mask_inner=mask_inner,
+                out_bias_pointer_attn=out_bias_pointer_attn,
+                linear_bias=linear_bias_decoder,
+                use_graph_context=use_graph_context,
+                check_nan=check_nan,
+                moe_kwargs=moe_kwargs["decoder"],
+            )
+
+        super(AttentionModelPolicy, self).__init__(
+            encoder=encoder,
+            decoder=decoder,
+            env_name=env_name,
+            temperature=temperature,
+            tanh_clipping=tanh_clipping,
+            mask_logits=mask_logits,
+            train_decode_type=train_decode_type,
+            val_decode_type=val_decode_type,
+            test_decode_type=test_decode_type,
+            **unused_kwargs,
+        )
diff --git
a/rl4co/models/zoo/amppo/__init__.py b/rl4co/models/zoo/amppo/__init__.py new file mode 100644 index 00000000..8a94600d --- /dev/null +++ b/rl4co/models/zoo/amppo/__init__.py @@ -0,0 +1 @@ +from .model import AMPPO diff --git a/rl4co/models/zoo/amppo/model.py b/rl4co/models/zoo/amppo/model.py new file mode 100644 index 00000000..17a55257 --- /dev/null +++ b/rl4co/models/zoo/amppo/model.py @@ -0,0 +1,49 @@ +import copy + +import torch.nn as nn + +from rl4co.envs import RL4COEnvBase +from rl4co.models.rl import PPO +from rl4co.models.rl.common.critic import CriticNetwork +from rl4co.models.zoo.am.policy import AttentionModelPolicy +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class AMPPO(PPO): + """PPO Model based on Proximal Policy Optimization (PPO) with an attention model policy. + We default to the attention model policy and the Attention Critic Network. + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + critic: Critic to use for the algorithm + policy_kwargs: Keyword arguments for policy + critic_kwargs: Keyword arguments for critic + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module = None, + critic: CriticNetwork = None, + policy_kwargs: dict = {}, + critic_kwargs: dict = {}, + **kwargs, + ): + if policy is None: + policy = AttentionModelPolicy(env_name=env.name, **policy_kwargs) + + if critic is None: + log.info("Creating critic network for {}".format(env.name)) + # we reuse the parameters of the model + encoder = getattr(policy, "encoder", None) + if encoder is None: + raise ValueError("Critic network requires an encoder") + critic = CriticNetwork( + copy.deepcopy(encoder).to(next(encoder.parameters()).device), + **critic_kwargs, + ) + + super().__init__(env, policy, critic, **kwargs) diff --git a/rl4co/models/zoo/dact/__init__.py b/rl4co/models/zoo/dact/__init__.py new file mode 100644 index 00000000..c0c9c6a1 --- /dev/null +++ 
b/rl4co/models/zoo/dact/__init__.py @@ -0,0 +1,2 @@ +from .model import DACT +from .policy import DACTPolicy diff --git a/rl4co/models/zoo/dact/decoder.py b/rl4co/models/zoo/dact/decoder.py new file mode 100644 index 00000000..81a684ad --- /dev/null +++ b/rl4co/models/zoo/dact/decoder.py @@ -0,0 +1,132 @@ +import math + +import torch +import torch.nn as nn + +from tensordict import TensorDict +from torch import Tensor + +from rl4co.models.common.improvement.base import ImprovementDecoder +from rl4co.models.nn.attention import MultiHeadCompat +from rl4co.models.nn.mlp import MLP +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class DACTDecoder(ImprovementDecoder): + """ + DACT decoder based on Ma et al. (2021) + Given the environment state and the dual sets of embeddings (PFE, NFE embeddings), compute the logits for + selecting two nodes for the 2-opt local search from the current solution + + + Args: + embed_dim: Embedding dimension + num_heads: Number of attention heads + """ + + def __init__( + self, + embed_dim: int = 64, + num_heads: int = 4, + ): + super().__init__() + self.embed_dim = embed_dim + self.n_heads = num_heads + self.hidden_dim = embed_dim + + # for MHC sublayer (NFE aspect) + self.compater_node = MultiHeadCompat( + num_heads, embed_dim, embed_dim, embed_dim, embed_dim + ) + + # for MHC sublayer (PFE aspect) + self.compater_pos = MultiHeadCompat( + num_heads, embed_dim, embed_dim, embed_dim, embed_dim + ) + + self.norm_factor = 1 / math.sqrt(1 * self.hidden_dim) + + # for Max-Pooling sublayer + self.project_graph_pos = nn.Linear(self.embed_dim, self.embed_dim, bias=False) + self.project_graph_node = nn.Linear(self.embed_dim, self.embed_dim, bias=False) + self.project_node_pos = nn.Linear(self.embed_dim, self.embed_dim, bias=False) + self.project_node_node = nn.Linear(self.embed_dim, self.embed_dim, bias=False) + + # for feed-forward aggregation (FFA)sublayer + self.value_head = MLP( + input_dim=2 * self.n_heads, 
+ output_dim=1, + num_neurons=[32, 32], + dropout_probs=[0.05, 0.00], + ) + + def forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> Tensor: + """Compute the logits of the removing a node pair from the current solution + + Args: + td: TensorDict with the current environment state + final_h: final NFE embeddings + final_p: final pfe embeddings + """ + + batch_size, graph_size, dim = final_h.size() + + # Max-Pooling sublayer + h_node_refined = self.project_node_node(final_h) + self.project_graph_node( + final_h.max(1)[0] + )[:, None, :].expand(batch_size, graph_size, dim) + h_pos_refined = self.project_node_pos(final_p) + self.project_graph_pos( + final_p.max(1)[0] + )[:, None, :].expand(batch_size, graph_size, dim) + + # MHC sublayer + compatibility = torch.zeros( + (batch_size, graph_size, graph_size, self.n_heads * 2), + device=h_node_refined.device, + ) + compatibility[:, :, :, : self.n_heads] = self.compater_pos(h_pos_refined).permute( + 1, 2, 3, 0 + ) + compatibility[:, :, :, self.n_heads :] = self.compater_node( + h_node_refined + ).permute(1, 2, 3, 0) + + # FFA sublater + return self.value_head(self.norm_factor * compatibility).squeeze(-1) + + +class CriticDecoder(nn.Module): + def __init__(self, input_dim: int) -> None: + super().__init__() + self.input_dim = input_dim + + self.project_graph = nn.Linear(self.input_dim, self.input_dim, bias=False) + self.project_node = nn.Linear(self.input_dim, self.input_dim, bias=False) + + self.MLP = MLP( + input_dim=input_dim, + output_dim=1, + num_neurons=[input_dim, input_dim // 2], + dropout_probs=[0.05, 0.0], + ) + + def forward(self, x: torch.Tensor, hidden=None) -> torch.Tensor: + # h_wave: (batch_size, graph_size+1, input_size) + mean_pooling = x.mean(1) # mean Pooling (batch_size, input_size) + graph_feature: torch.Tensor = self.project_graph(mean_pooling)[ + :, None, : + ] # (batch_size, 1, input_dim/2) + node_feature: torch.Tensor = self.project_node( + x + ) # (batch_size, graph_size+1, 
input_dim/2) + + # pass through value_head, get estimated value + fusion = node_feature + graph_feature.expand_as( + node_feature + ) # (batch_size, graph_size+1, input_dim/2) + + value = self.MLP(fusion.mean(1)) + + return value diff --git a/rl4co/models/zoo/dact/encoder.py b/rl4co/models/zoo/dact/encoder.py new file mode 100644 index 00000000..0e263de0 --- /dev/null +++ b/rl4co/models/zoo/dact/encoder.py @@ -0,0 +1,274 @@ +import math + +from typing import Tuple + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from torch import Tensor + +from rl4co.models.common import ImprovementEncoder +from rl4co.models.nn.ops import AdaptiveSequential, Normalization +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +# implements the Multi-head DAC-Att module +class DAC_ATT(nn.Module): + def __init__(self, n_heads, input_dim, embed_dim=None, val_dim=None, key_dim=None): + super(DAC_ATT, self).__init__() + + self.n_heads = n_heads + + self.key_dim = self.val_dim = embed_dim // n_heads + self.input_dim = input_dim + self.embed_dim = embed_dim + + self.norm_factor = 1 / math.sqrt(1 * self.key_dim) + + # W_h^Q in the paper + self.W_query_node = nn.Parameter( + torch.Tensor(n_heads, self.input_dim, self.key_dim) + ) + # W_g^Q in the paper + self.W_query_pos = nn.Parameter( + torch.Tensor(n_heads, self.input_dim, self.key_dim) + ) + # W_h^K in the paper + self.W_key_node = nn.Parameter( + torch.Tensor(n_heads, self.input_dim, self.key_dim) + ) + # W_g^K in the paper + self.W_key_pos = nn.Parameter(torch.Tensor(n_heads, self.input_dim, self.key_dim)) + + # W_h^V and W_h^Vref in the paper + self.W_val_node = nn.Parameter( + torch.Tensor(2 * n_heads, self.input_dim, self.val_dim) + ) + # W_g^V and W_g^Vref in the paper + self.W_val_pos = nn.Parameter( + torch.Tensor(2 * n_heads, self.input_dim, self.val_dim) + ) + + # W_h^O and W_g^O in the paper + if embed_dim is not None: + self.W_out_node = nn.Parameter( + 
torch.Tensor(n_heads, 2 * self.key_dim, embed_dim) + ) + self.W_out_pos = nn.Parameter( + torch.Tensor(n_heads, 2 * self.key_dim, embed_dim) + ) + + self.init_parameters() + + def init_parameters(self): + for param in self.parameters(): + stdv = 1.0 / math.sqrt(param.size(-1)) + param.data.uniform_(-stdv, stdv) + + def forward(self, h_node_in, h_pos_in): # input (NFEs, PFEs) + # h,g should be (batch_size, graph_size, input_dim) + batch_size, graph_size, input_dim = h_node_in.size() + + shp = (self.n_heads, batch_size, graph_size, -1) + shp_v = (2, self.n_heads, batch_size, graph_size, -1) + + h_node = h_node_in.contiguous().view(-1, input_dim) + h_pos = h_pos_in.contiguous().view(-1, input_dim) + + Q_node = torch.matmul(h_node, self.W_query_node).view(shp) + Q_pos = torch.matmul(h_pos, self.W_query_pos).view(shp) + + K_node = torch.matmul(h_node, self.W_key_node).view(shp) + K_pos = torch.matmul(h_pos, self.W_key_pos).view(shp) + + V_node = torch.matmul(h_node, self.W_val_node).view(shp_v) + V_pos = torch.matmul(h_pos, self.W_val_pos).view(shp_v) + + # Get attention correlations and norm by softmax + node_correlations = self.norm_factor * torch.matmul( + Q_node, K_node.transpose(2, 3) + ) + pos_correlations = self.norm_factor * torch.matmul(Q_pos, K_pos.transpose(2, 3)) + attn1 = F.softmax(node_correlations, dim=-1) # head, bs, n, n + attn2 = F.softmax(pos_correlations, dim=-1) # head, bs, n, n + + heads_node_1 = torch.matmul(attn1, V_node[0]) # self-attn + heads_node_2 = torch.matmul(attn2, V_node[1]) # cross-aspect ref attn + + heads_pos_1 = torch.matmul(attn1, V_pos[0]) # cross-aspect ref attn + heads_pos_2 = torch.matmul(attn2, V_pos[1]) # self-attn + + heads_node = torch.cat((heads_node_1, heads_node_2), -1) + heads_pos = torch.cat((heads_pos_1, heads_pos_2), -1) + + # get output + out_node = torch.mm( + heads_node.permute(1, 2, 0, 3) + .contiguous() + .view(-1, self.n_heads * 2 * self.val_dim), + self.W_out_node.view(-1, self.embed_dim), + ).view(batch_size, 
graph_size, self.embed_dim) + + out_pos = torch.mm( + heads_pos.permute(1, 2, 0, 3) + .contiguous() + .view(-1, self.n_heads * 2 * self.val_dim), + self.W_out_pos.view(-1, self.embed_dim), + ).view(batch_size, graph_size, self.embed_dim) + + return out_node, out_pos # dual-aspect representation (NFEs, PFEs) + + +# implements the DAC encoder +class DACTEncoderLayer(nn.Module): + def __init__( + self, + n_heads, + embed_dim, + feed_forward_hidden, + normalization="layer", + ): + super(DACTEncoderLayer, self).__init__() + + self.MHA_sublayer = DACsubLayer( + n_heads, + embed_dim, + feed_forward_hidden, + normalization=normalization, + ) + + self.FFandNorm_sublayer = FFNsubLayer( + n_heads, + embed_dim, + feed_forward_hidden, + normalization=normalization, + ) + + def forward(self, input1, input2): + out1, out2 = self.MHA_sublayer(input1, input2) + return self.FFandNorm_sublayer(out1, out2) + + +# implements the DAC encoder (DAC-Att sublayer) +class DACsubLayer(nn.Module): + def __init__( + self, + n_heads, + embed_dim, + feed_forward_hidden, + normalization="layer", + ): + super(DACsubLayer, self).__init__() + + self.MHA = DAC_ATT(n_heads, input_dim=embed_dim, embed_dim=embed_dim) + + self.Norm = Normalization(embed_dim, normalization) + + def forward(self, input1, input2): + # Attention and Residual connection + out1, out2 = self.MHA(input1, input2) + + # Normalization + return self.Norm(out1 + input1), self.Norm(out2 + input2) + + +# implements the DAC encoder (FFN sublayer) +class FFNsubLayer(nn.Module): + def __init__( + self, + n_heads, + embed_dim, + feed_forward_hidden, + normalization="layer", + ): + super(FFNsubLayer, self).__init__() + + self.FF1 = ( + nn.Sequential( + nn.Linear(embed_dim, feed_forward_hidden), + nn.ReLU(inplace=True), + nn.Linear(feed_forward_hidden, embed_dim), + ) + if feed_forward_hidden > 0 + else nn.Linear(embed_dim, embed_dim) + ) + + self.FF2 = ( + nn.Sequential( + nn.Linear(embed_dim, feed_forward_hidden), + nn.ReLU(inplace=True), + 
nn.Linear(feed_forward_hidden, embed_dim), + ) + if feed_forward_hidden > 0 + else nn.Linear(embed_dim, embed_dim) + ) + + self.Norm = Normalization(embed_dim, normalization) + + def forward(self, input1, input2): + # FF and Residual connection + out1 = self.FF1(input1) + out2 = self.FF2(input2) + + # Normalization + return self.Norm(out1 + input1), self.Norm(out2 + input2) + + +class DACTEncoder(ImprovementEncoder): + """Dual-Aspect Collaborative Transformer Encoder as in Ma et al. (2021) + + Args: + embed_dim: Dimension of the embedding space + init_embedding: Module to use for the initialization of the node embeddings + pos_embedding: Module to use for the initialization of the positional embeddings + env_name: Name of the environment used to initialize embeddings + pos_type: Name of the used positional encoding method (CPE or APE) + num_heads: Number of heads in the attention layers + num_layers: Number of layers in the attention network + normalization: Normalization type in the attention layers + feedforward_hidden: Hidden dimension in the feedforward layers + """ + + def __init__( + self, + embed_dim: int = 64, + init_embedding: nn.Module = None, + pos_embedding: nn.Module = None, + env_name: str = "tsp_kopt", + pos_type: str = "CPE", + num_heads: int = 4, + num_layers: int = 3, + normalization: str = "layer", + feedforward_hidden: int = 64, + ): + super(DACTEncoder, self).__init__( + embed_dim=embed_dim, + env_name=env_name, + pos_type=pos_type, + num_heads=num_heads, + num_layers=num_layers, + normalization=normalization, + feedforward_hidden=feedforward_hidden, + ) + + assert self.env_name in ["tsp_kopt"], NotImplementedError() + + self.net = AdaptiveSequential( + *( + DACTEncoderLayer( + num_heads, + embed_dim, + feedforward_hidden, + normalization, + ) + for _ in range(num_layers) + ) + ) + + def _encoder_forward(self, init_h: Tensor, init_p: Tensor) -> Tuple[Tensor, Tensor]: + NFE, PFE = self.net(init_h, init_p) + + return NFE, PFE diff --git 
a/rl4co/models/zoo/dact/model.py b/rl4co/models/zoo/dact/model.py new file mode 100644 index 00000000..34bf9c5e --- /dev/null +++ b/rl4co/models/zoo/dact/model.py @@ -0,0 +1,62 @@ +import torch.nn as nn + +from rl4co.envs import RL4COEnvBase +from rl4co.models.nn.graph.attnnet import MultiHeadAttentionLayer +from rl4co.models.rl import n_step_PPO +from rl4co.models.rl.common.critic import CriticNetwork +from rl4co.models.zoo.dact.decoder import CriticDecoder +from rl4co.models.zoo.dact.policy import DACTPolicy +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class DACT(n_step_PPO): + """DACT Model based on n_step Proximal Policy Optimization (PPO) with an DACT model policy. + We default to the DACT model policy and the improvement Critic Network. + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + critic: Critic to use for the algorithm + policy_kwargs: Keyword arguments for policy + critic_kwargs: Keyword arguments for critic + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module = None, + critic: CriticNetwork = None, + policy_kwargs: dict = {}, + critic_kwargs: dict = {}, + **kwargs, + ): + if policy is None: + policy = DACTPolicy(env_name=env.name, **policy_kwargs) + + if critic is None: + embed_dim = ( + policy_kwargs["embed_dim"] * 2 if "embed_dim" in policy_kwargs else 128 + ) # the critic's embed_dim must be as policy's + + encoder = MultiHeadAttentionLayer( + embed_dim, + critic_kwargs["num_heads"] if "num_heads" in critic_kwargs else 4, + critic_kwargs["feedforward_hidden"] * 2 + if "feedforward_hidden" in critic_kwargs + else 128, + critic_kwargs["normalization"] + if "normalization" in critic_kwargs + else "layer", + bias=False, + ) + value_head = CriticDecoder(embed_dim) + + critic = CriticNetwork( + encoder=encoder, + value_head=value_head, + customized=True, + ) + + super().__init__(env, policy, critic, **kwargs) diff --git 
a/rl4co/models/zoo/dact/policy.py b/rl4co/models/zoo/dact/policy.py new file mode 100644 index 00000000..ecb6688c --- /dev/null +++ b/rl4co/models/zoo/dact/policy.py @@ -0,0 +1,188 @@ +from typing import Union + +import torch +import torch.nn as nn + +from tensordict import TensorDict + +from rl4co.envs import RL4COEnvBase, get_env +from rl4co.models.common.improvement.base import ImprovementPolicy +from rl4co.models.zoo.dact.decoder import DACTDecoder +from rl4co.models.zoo.dact.encoder import DACTEncoder +from rl4co.utils.decoding import DecodingStrategy, get_decoding_strategy +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class DACTPolicy(ImprovementPolicy): + """ + DACT Policy based on Ma et al. (2021) + This model first encodes the input graph and current solution using a DACT encoder (:class:`DACTEncoder`) + and then decodes the 2-opt action (:class:`DACTDecoder`) + + Args: + embed_dim: Dimension of the node embeddings + num_encoder_layers: Number of layers in the encoder + num_heads: Number of heads in the attention layers + normalization: Normalization type in the attention layers + feedforward_hidden: Dimension of the hidden layer in the feedforward network + env_name: Name of the environment used to initialize embeddings + pos_type: Name of the used positional encoding method (CPE or APE) + init_embedding: Module to use for the initialization of the embeddings + pos_embedding: Module to use for the initialization of the positional embeddings + temperature: Temperature for the softmax + tanh_clipping: Tanh clipping value (see Bello et al., 2016) + train_decode_type: Type of decoding to use during training + val_decode_type: Type of decoding to use during validation + test_decode_type: Type of decoding to use during testing + """ + + def __init__( + self, + embed_dim: int = 64, + num_encoder_layers: int = 3, + num_heads: int = 4, + normalization: str = "layer", + feedforward_hidden: int = 64, + env_name: str = 
"tsp_kopt", + pos_type: str = "CPE", + init_embedding: nn.Module = None, + pos_embedding: nn.Module = None, + temperature: float = 1.0, + tanh_clipping: float = 6.0, + train_decode_type: str = "sampling", + val_decode_type: str = "sampling", + test_decode_type: str = "sampling", + ): + super(DACTPolicy, self).__init__() + + self.env_name = env_name + + # Encoder and decoder + self.encoder = DACTEncoder( + embed_dim=embed_dim, + init_embedding=init_embedding, + pos_embedding=pos_embedding, + env_name=env_name, + pos_type=pos_type, + num_heads=num_heads, + num_layers=num_encoder_layers, + normalization=normalization, + feedforward_hidden=feedforward_hidden, + ) + + self.decoder = DACTDecoder(embed_dim=embed_dim, num_heads=num_heads) + + # Decoding strategies + self.temperature = temperature + self.tanh_clipping = tanh_clipping + self.train_decode_type = train_decode_type + self.val_decode_type = val_decode_type + self.test_decode_type = test_decode_type + + def forward( + self, + td: TensorDict, + env: Union[str, RL4COEnvBase] = None, + phase: str = "train", + return_actions: bool = True, + return_embeds: bool = False, + only_return_embed: bool = False, + actions=None, + **decoding_kwargs, + ) -> dict: + """Forward pass of the policy. + + Args: + td: TensorDict containing the environment state + env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that + it is more efficient to pass an already instantiated environment each time for fine-grained control + phase: Phase of the algorithm (train, val, test) + return_actions: Whether to return the actions + actions: Actions to use for evaluating the policy. + If passed, use these actions instead of sampling from the policy to calculate log likelihood + decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information. 
+ + Returns: + out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy + """ + + # Encoder: get encoder output and initial embeddings from initial state + NFE, PFE = self.encoder(td) + h_featrues = torch.cat((NFE, PFE), -1) + + if only_return_embed: + return {"embeds": h_featrues.detach()} + + # Instantiate environment if needed + if isinstance(env, str) or env is None: + env_name = self.env_name if env is None else env + log.info(f"Instantiated environment not provided; instantiating {env_name}") + env = get_env(env_name) + assert env.two_opt_mode, "DACT only support 2-opt" + + # Get decode type depending on phase and whether actions are passed for evaluation + decode_type = decoding_kwargs.pop("decode_type", None) + if actions is not None: + decode_type = "evaluate" + elif decode_type is None: + decode_type = getattr(self, f"{phase}_decode_type") + + # Setup decoding strategy + # we pop arguments that are not part of the decoding strategy + decode_strategy: DecodingStrategy = get_decoding_strategy( + decode_type, + temperature=decoding_kwargs.pop("temperature", self.temperature), + tanh_clipping=decoding_kwargs.pop("tanh_clipping", self.tanh_clipping), + mask_logits=True, + improvement_method_mode=True, + **decoding_kwargs, + ) + + # Perform the decoding + batch_size, seq_length = td["rec_current"].size() + logits = self.decoder(td, NFE, PFE).view(batch_size, -1) + + # Get mask + mask = env.get_mask(td) + if "action" in td.keys(): + mask[torch.arange(batch_size), td["action"][:, 0], td["action"][:, 1]] = False + mask[torch.arange(batch_size), td["action"][:, 1], td["action"][:, 0]] = False + mask = mask.view(batch_size, -1) + + # Get action and log-likelihood + logprob, action_sampled = decode_strategy.step( + logits, + mask, + action=( + actions[:, 0] * seq_length + actions[:, 1] + if actions is not None + else None + ), + ) + action_sampled = action_sampled.unsqueeze(-1) + if phase == "train": + log_likelihood = 
logprob.gather(1, action_sampled) + else: + log_likelihood = torch.zeros(batch_size, device=td.device) + + ## return + DACT_action = torch.cat( + ( + action_sampled // seq_length, + action_sampled % seq_length, + ), + -1, + ) + + outdict = {"log_likelihood": log_likelihood, "cost_bsf": td["cost_bsf"]} + td.set("action", DACT_action) + + if return_embeds: + outdict["embeds"] = h_featrues.detach() + + if return_actions: + outdict["actions"] = DACT_action + + return outdict diff --git a/rl4co/models/zoo/deepaco/__init__.py b/rl4co/models/zoo/deepaco/__init__.py new file mode 100644 index 00000000..adb4d8f5 --- /dev/null +++ b/rl4co/models/zoo/deepaco/__init__.py @@ -0,0 +1,2 @@ +from rl4co.models.zoo.deepaco.model import DeepACO +from rl4co.models.zoo.deepaco.policy import DeepACOPolicy diff --git a/rl4co/models/zoo/deepaco/antsystem.py b/rl4co/models/zoo/deepaco/antsystem.py new file mode 100644 index 00000000..1965cd3d --- /dev/null +++ b/rl4co/models/zoo/deepaco/antsystem.py @@ -0,0 +1,347 @@ +from functools import lru_cache, cached_property, partial +from typing import Optional, Tuple + +import numpy as np +import torch + +from tensordict import TensorDict +from torch import Tensor + +from rl4co.envs import RL4COEnvBase +from rl4co.models.common.constructive.nonautoregressive.decoder import ( + NonAutoregressiveDecoder, +) +from rl4co.utils.decoding import Sampling +from rl4co.utils.ops import get_distance_matrix, unbatchify + + +class AntSystem: + """Implements the Ant System algorithm: https://doi.org/10.1109/3477.484436. + + Args: + log_heuristic: Logarithm of the heuristic matrix. + n_ants: Number of ants to be used in the algorithm. Defaults to 20. + alpha: Importance of pheromone in the decision-making process. Defaults to 1.0. + beta: Importance of heuristic information in the decision-making process. Defaults to 1.0. + decay: Rate at which pheromone evaporates. Should be between 0 and 1. Defaults to 0.95. + Q: Rate at which pheromone deposits. 
Defaults to `1 / n_ants`. + temperature: Temperature for the softmax during decoding. Defaults to 0.1. + pheromone: Initial pheromone matrix. Defaults to `torch.ones_like(log_heuristic)`. + require_logprobs: Whether to require the log probability of actions. Defaults to False. + use_local_search: Whether to use local_search provided by the env. Default to False. + use_nls: Whether to use neural-guided local search provided by the env. Default to False. + n_perturbations: Number of perturbations to be used for nls. Defaults to 5. + local_search_params: Arguments to be passed to the local_search. + perturbation_params: Arguments to be passed to the perturbation used for nls. + """ + + def __init__( + self, + log_heuristic: Tensor, + n_ants: int = 20, + alpha: float = 1.0, + beta: float = 1.0, + decay: float = 0.95, + Q: Optional[float] = None, + temperature: float = 0.1, + pheromone: Optional[Tensor] = None, + require_logprobs: bool = False, + use_local_search: bool = False, + use_nls: bool = False, + n_perturbations: int = 5, + local_search_params: dict = {}, + perturbation_params: dict = {}, + start_node: Optional[int] = None, + ): + self.batch_size = log_heuristic.shape[0] + self.n_ants = n_ants + self.alpha = alpha + self.beta = beta + self.decay = decay + self.Q = 1 / self.n_ants if Q is None else Q + self.temperature = temperature + + self.log_heuristic = log_heuristic / self.temperature + + if pheromone is None: + self.pheromone = torch.ones_like(log_heuristic) + self.pheromone.fill_(0.0005) + else: + self.pheromone = pheromone + + self.final_actions = self.final_reward = None + self.require_logprobs = require_logprobs + self.all_records = [] + + self.use_local_search = use_local_search + assert not (use_nls and not use_local_search), "use_nls requires use_local_search" + self.use_nls = use_nls + self.n_perturbations = n_perturbations + self.local_search_params = local_search_params + self.perturbation_params = perturbation_params + self.start_node = 
start_node + + self._batchindex = torch.arange(self.batch_size, device=log_heuristic.device) + + @cached_property + def heuristic_dist(self) -> torch.Tensor: + heuristic = self.log_heuristic.exp().detach().cpu() + 1e-10 + heuristic_dist = 1 / (heuristic / heuristic.max(-1, keepdim=True)[0] + 1e-5) + heuristic_dist[:, torch.arange(heuristic_dist.shape[1]), torch.arange(heuristic_dist.shape[2])] = 0 + return heuristic_dist + + @staticmethod + def select_start_node_fn( + td: TensorDict, env: RL4COEnvBase, num_starts: int, start_node: Optional[int]=None + ): + if env.name == "tsp" and start_node is not None: + # For now, only TSP supports explicitly setting the start node + return start_node * torch.ones( + td.shape[0] * num_starts, dtype=torch.long, device=td.device + ) + + # if start_node is not set, we use random start nodes + return torch.multinomial(td["action_mask"].float(), num_starts, replacement=True).view(-1) + + def run( + self, + td_initial: TensorDict, + env: RL4COEnvBase, + n_iterations: int, + ) -> Tuple[TensorDict, Tensor, Tensor]: + """Run the Ant System algorithm for a specified number of iterations. + + Args: + td_initial: Initial state of the problem. + env: Environment representing the problem. + n_iterations: Number of iterations to run the algorithm. + + Returns: + td: The final state of the problem. + actions: The final actions chosen by the algorithm. + reward: The final reward achieved by the algorithm. + """ + for _ in range(n_iterations): + # reset environment + td = td_initial.clone() + self._one_step(td, env) + + action_matrix = self._convert_final_action_to_matrix() + assert action_matrix is not None and self.final_reward is not None + td, env = self._recreate_final_routes(td_initial, env, action_matrix) + + return td, action_matrix, self.final_reward + + def _one_step(self, td: TensorDict, env: RL4COEnvBase): + """Run one step of the Ant System algorithm. + + Args: + td: Current state of the problem. 
+ env: Environment representing the problem. + + Returns: + actions: The actions chosen by the algorithm. + reward: The reward achieved by the algorithm. + """ + # sampling + td, env, actions, reward = self._sampling(td, env) + # local search, reserved for extensions + if self.use_local_search: + actions, reward = self.local_search(td, env, actions) + + # reshape from (batch_size * n_ants, ...) to (batch_size, n_ants, ...) + reward = unbatchify(reward, self.n_ants) + actions = unbatchify(actions, self.n_ants) + + # update final actions and rewards + self._update_results(actions, reward) + # update pheromone matrix + self._update_pheromone(actions, reward) + + return actions, reward + + def _sampling( + self, + td: TensorDict, + env: RL4COEnvBase, + ): + # Sample from heatmaps + # p = phe**alpha * heu**beta <==> log(p) = alpha*log(phe) + beta*log(heu) + heatmaps_logits = ( + self.alpha * torch.log(self.pheromone) + self.beta * self.log_heuristic + ) + decode_strategy = Sampling( + multistart=True, + num_starts=self.n_ants, + select_start_nodes_fn=partial(self.select_start_node_fn, start_node=self.start_node), + ) + + td, env, num_starts = decode_strategy.pre_decoder_hook(td, env) + while not td["done"].all(): + logits, mask = NonAutoregressiveDecoder.heatmap_to_logits( + td, heatmaps_logits, num_starts + ) + td = decode_strategy.step(logits, mask, td) + td = env.step(td)["next"] + + logprobs, actions, td, env = decode_strategy.post_decoder_hook(td, env) + reward = env.get_reward(td, actions) + + if self.require_logprobs: + self.all_records.append((logprobs, actions, reward, td.get("mask", None))) + + return td, env, actions, reward + + def local_search( + self, td: TensorDict, env: RL4COEnvBase, actions: Tensor + ) -> Tuple[Tensor, Tensor]: + """Perform local search on the actions and reward obtained. + + Args: + td: Current state of the problem. + env: Environment representing the problem. + actions: Actions chosen by the algorithm. 
+ + Returns: + actions: The modified actions + reward: The modified reward + """ + td_cpu = td.detach().cpu() # Convert to CPU in advance to minimize the overhead from device transfer + td_cpu["distances"] = get_distance_matrix(td_cpu["locs"]) + # TODO: avoid or generalize this, e.g., pre-compute for local search in each env + actions = actions.detach().cpu() + best_actions = env.local_search(td=td_cpu, actions=actions, **self.local_search_params) + best_rewards = env.get_reward(td_cpu, best_actions) + + if self.use_nls: + td_cpu_perturb = td_cpu.clone() + td_cpu_perturb["distances"] = torch.tile(self.heuristic_dist, (self.n_ants, 1, 1)) + new_actions = best_actions.clone() + + for _ in range(self.n_perturbations): + perturbed_actions = env.local_search( + td=td_cpu_perturb, actions=new_actions, **self.perturbation_params + ) + new_actions = env.local_search(td=td_cpu, actions=perturbed_actions, **self.local_search_params) + new_rewards = env.get_reward(td_cpu, new_actions) + + improved_indices = new_rewards > best_rewards + best_actions = env.replace_selected_actions(best_actions, new_actions, improved_indices) + best_rewards[improved_indices] = new_rewards[improved_indices] + + best_actions = best_actions.to(td.device) + best_rewards = best_rewards.to(td.device) + + return best_actions, best_rewards + + def _update_results(self, actions, reward): + # update the best-trails recorded in self.final_actions + best_index = reward.argmax(-1) + best_reward = reward[self._batchindex, best_index] + best_actions = actions[self._batchindex, best_index] + + if self.final_actions is None or self.final_reward is None: + self.final_actions = list(iter(best_actions.clone())) + self.final_reward = best_reward.clone() + else: + require_update = self._batchindex[self.final_reward <= best_reward] + for index in require_update: + self.final_actions[index] = best_actions[index] + self.final_reward[require_update] = best_reward[require_update] + + return best_index + + def 
_update_pheromone(self, actions, reward): + # calculate Δphe + delta_pheromone = torch.zeros_like(self.pheromone) + from_node = actions + to_node = torch.roll(from_node, -1, -1) + mapped_reward = self._reward_map(reward).detach() + batch_action_indices = self._batch_action_indices( + self.batch_size, actions.shape[-1], reward.device + ) + + for ant_index in range(self.n_ants): + delta_pheromone[ + batch_action_indices, + from_node[:, ant_index].flatten(), + to_node[:, ant_index].flatten(), + ] += mapped_reward[batch_action_indices, ant_index] + + # decay & update + self.pheromone *= self.decay + self.pheromone += delta_pheromone + + def _reward_map(self, x: Tensor): + """Map reward $f: \\mathbb{R} \\rightarrow \\mathbb{R}^+$""" + M, _ = x.max(-1, keepdim=True) + m, _ = x.min(-1, keepdim=True) + v = ((x - m) / (M - m)) ** 2 * self.Q + return v + + def _recreate_final_routes(self, td, env, action_matrix): + for action_index in range(action_matrix.shape[-1]): + actions = action_matrix[:, action_index] + td.set("action", actions) + td = env.step(td)["next"] + + assert td["done"].all() + return td, env + + def get_logp(self): + """Get the log probability (logprobs) values recorded during the execution of the algorithm. + + Returns: + results: Tuple containing the log probability values, + actions chosen, rewards obtained, and mask values (if available). + + Raises: + AssertionError: If `require_logp` is not enabled. 
+ """ + + assert ( + self.require_logprobs + ), "Please enable `require_logp` to record logprobs values" + + logprobs_list, actions_list, reward_list, mask_list = [], [], [], [] + + for logprobs, actions, reward, mask in self.all_records: + logprobs_list.append(logprobs) + actions_list.append(actions) + reward_list.append(reward) + mask_list.append(mask) + + if mask_list[0] is None: + mask_list = None + else: + mask_list = torch.stack(mask_list, 0) + + # reset records + self.all_records = [] + + return ( + torch.stack(logprobs_list, 0), + torch.stack(actions_list, 0), + torch.stack(reward_list, 0), + mask_list, + ) + + @staticmethod + @lru_cache(5) + def _batch_action_indices(batch_size: int, n_actions: int, device: torch.device): + batchindex = torch.arange(batch_size, device=device) + return batchindex.unsqueeze(1).repeat(1, n_actions).view(-1) + + def _convert_final_action_to_matrix(self) -> Optional[Tensor]: + if self.final_actions is None: + return None + action_count = max(len(actions) for actions in self.final_actions) + mat_actions = torch.zeros( + (self.batch_size, action_count), + device=self.final_actions[0].device, + dtype=self.final_actions[0].dtype, + ) + for index, action in enumerate(self.final_actions): + mat_actions[index, : len(action)] = action + + return mat_actions diff --git a/rl4co/models/zoo/deepaco/model.py b/rl4co/models/zoo/deepaco/model.py new file mode 100644 index 00000000..3155d20a --- /dev/null +++ b/rl4co/models/zoo/deepaco/model.py @@ -0,0 +1,51 @@ +from typing import Any, Optional, Union + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl import REINFORCE +from rl4co.models.rl.reinforce.baselines import REINFORCEBaseline +from rl4co.models.zoo.deepaco.policy import DeepACOPolicy + + +class DeepACO(REINFORCE): + """Implements DeepACO: https://arxiv.org/abs/2309.14032. + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + baseline: REINFORCE baseline. 
Defaults to exponential + policy_kwargs: Keyword arguments for policy + baseline_kwargs: Keyword arguments for baseline + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: Optional[DeepACOPolicy] = None, + baseline: Union[REINFORCEBaseline, str] = "no", + policy_kwargs: dict = {}, + baseline_kwargs: dict = {}, + **kwargs, + ): + if policy is None: + policy = DeepACOPolicy(env_name=env.name, **policy_kwargs) + + super().__init__(env, policy, baseline, baseline_kwargs, **kwargs) + + def shared_step( + self, + batch: Any, + batch_idx: int, + phase: str, + dataloader_idx: Union[int, None] = None, + ): + td = self.env.reset(batch) + # Perform forward pass (i.e., constructing solution and computing log-likelihoods) + out = self.policy(td, self.env, phase=phase) + + # Compute loss + if phase == "train": + out["loss"] = -(out["advantage"] * out["log_likelihood"]).mean() + + metrics = self.log_metrics(out, phase, dataloader_idx=dataloader_idx) + return {"loss": out.get("loss", None), **metrics} diff --git a/rl4co/models/zoo/deepaco/policy.py b/rl4co/models/zoo/deepaco/policy.py new file mode 100644 index 00000000..4f7d3d72 --- /dev/null +++ b/rl4co/models/zoo/deepaco/policy.py @@ -0,0 +1,147 @@ +from functools import partial +from typing import Optional, Type, Union + +from tensordict import TensorDict + +from rl4co.envs import RL4COEnvBase, get_env +from rl4co.models.common.constructive.nonautoregressive import ( + NonAutoregressiveEncoder, + NonAutoregressivePolicy, +) +from rl4co.models.zoo.deepaco.antsystem import AntSystem +from rl4co.models.zoo.nargnn.encoder import NARGNNEncoder +from rl4co.utils.utils import merge_with_defaults +from rl4co.utils.ops import batchify, unbatchify + + +class DeepACOPolicy(NonAutoregressivePolicy): + """Implememts DeepACO policy based on :class:`NonAutoregressivePolicy`. Introduced by Ye et al. (2023): https://arxiv.org/abs/2309.14032. 
+ This policy uses a Non-Autoregressive Graph Neural Network to generate heatmaps, + which are then used to run Ant Colony Optimization (ACO) to construct solutions. + + Args: + encoder: Encoder module. Can be passed by sub-classes + env_name: Name of the environment used to initialize embeddings + temperature: Temperature for the softmax during decoding. Defaults to 0.1. + aco_class: Class representing the ACO algorithm to be used. Defaults to :class:`AntSystem`. + aco_kwargs: Additional arguments to be passed to the ACO algorithm. + n_ants: Number of ants to be used in the ACO algorithm. Can be an integer or dictionary. Defaults to 20. + n_iterations: Number of iterations to run the ACO algorithm. Can be an integer or dictionary. Defaults to `dict(train=1, val=20, test=100)`. + ls_reward_aug_W: Coefficient to be used for the reward augmentation with the local search. Defaults to 0.95. + encoder_kwargs: Additional arguments to be passed to the encoder. + """ + + def __init__( + self, + encoder: Optional[NonAutoregressiveEncoder] = None, + env_name: str = "tsp", + temperature: float = 1.0, + aco_class: Optional[Type[AntSystem]] = None, + aco_kwargs: dict = {}, + train_with_local_search: bool = True, + n_ants: Optional[Union[int, dict]] = None, + n_iterations: Optional[Union[int, dict]] = None, + ls_reward_aug_W: float = 0.95, + **encoder_kwargs, + ): + if encoder is None: + encoder = NARGNNEncoder(**encoder_kwargs) + + super(DeepACOPolicy, self).__init__( + encoder=encoder, + env_name=env_name, + temperature=temperature, + train_decode_type="multistart_sampling", + val_decode_type="multistart_sampling", + test_decode_type="multistart_sampling", + ) + + self.aco_class = AntSystem if aco_class is None else aco_class + self.aco_kwargs = aco_kwargs + self.train_with_local_search = train_with_local_search + self.n_ants = merge_with_defaults(n_ants, train=30, val=48, test=48) + self.n_iterations = merge_with_defaults(n_iterations, train=1, val=5, test=10) + 
self.ls_reward_aug_W = ls_reward_aug_W + + def forward( + self, + td_initial: TensorDict, + env: Optional[Union[str, RL4COEnvBase]] = None, + calc_reward: bool = True, + phase: str = "train", + actions=None, + return_actions: bool = True, + return_hidden: bool = True, + **kwargs, + ): + """ + Forward method. During validation and testing, the policy runs the ACO algorithm to construct solutions. + See :class:`NonAutoregressivePolicy` for more details during the training phase. + """ + n_ants = self.n_ants[phase] + # Instantiate environment if needed + if (phase != "train" or self.ls_reward_aug_W > 0) and (env is None or isinstance(env, str)): + env_name = self.env_name if env is None else env + env = get_env(env_name) + + if phase == "train": + select_start_nodes_fn = partial( + self.aco_class.select_start_node_fn, start_node=self.aco_kwargs.get("start_node", None) + ) + kwargs.update({"select_start_nodes_fn": select_start_nodes_fn}) + # we just use the constructive policy + outdict = super().forward( + td_initial, + env, + phase=phase, + decode_type="multistart_sampling", + calc_reward=calc_reward, + num_starts=n_ants, + actions=actions, + return_actions=return_actions, + return_hidden=return_hidden, + **kwargs, + ) + + # manually compute the advantage + reward = unbatchify(outdict["reward"], n_ants) + advantage = reward - reward.mean(dim=1, keepdim=True) + + if self.ls_reward_aug_W > 0 and self.train_with_local_search: + heatmap_logits = outdict["hidden"] + aco = self.aco_class( + heatmap_logits, + n_ants=n_ants, + temperature=self.aco_kwargs.get("temperature", self.temperature), + **self.aco_kwargs, + ) + + actions = outdict["actions"] + _, ls_reward = aco.local_search(batchify(td_initial, n_ants), env, actions) + + ls_reward = unbatchify(ls_reward, n_ants) + ls_advantage = ls_reward - ls_reward.mean(dim=1, keepdim=True) + advantage = advantage * (1 - self.ls_reward_aug_W) + ls_advantage * self.ls_reward_aug_W + + outdict["advantage"] = advantage + 
outdict["log_likelihood"] = unbatchify(outdict["log_likelihood"], n_ants) + + return outdict + + heatmap_logits, _ = self.encoder(td_initial) + + aco = self.aco_class( + heatmap_logits, + n_ants=self.n_ants[phase], + temperature=self.aco_kwargs.get("temperature", self.temperature), + **self.aco_kwargs, + ) + td, actions, reward = aco.run(td_initial, env, self.n_iterations[phase]) + + out = {} + if calc_reward: + out["reward"] = reward + if return_actions: + out["actions"] = actions + + return out diff --git a/rl4co/models/zoo/eas/__init__.py b/rl4co/models/zoo/eas/__init__.py new file mode 100644 index 00000000..641f2a3b --- /dev/null +++ b/rl4co/models/zoo/eas/__init__.py @@ -0,0 +1 @@ +from .search import EAS, EASEmb, EASLay diff --git a/rl4co/models/zoo/eas/decoder.py b/rl4co/models/zoo/eas/decoder.py new file mode 100644 index 00000000..71d13df8 --- /dev/null +++ b/rl4co/models/zoo/eas/decoder.py @@ -0,0 +1,128 @@ +import math + +from typing import Union + +import torch + +from tensordict import TensorDict + +from rl4co.envs import RL4COEnvBase +from rl4co.utils.decoding import decode_logprobs, process_logits +from rl4co.utils.ops import batchify, unbatchify + + +def forward_pointer_attn_eas_lay(self, query, key, value, logit_key, mask): + """Add layer to the forward pass of logit attention, i.e. + Single-head attention. + """ + # Compute inner multi-head attention with no projections. 
+ heads = self._inner_mha(query, key, value, mask) + + # Add residual for EAS layer if is set + if getattr(self, "eas_layer", None) is not None: + heads = heads + self.eas_layer(heads) + + glimpse = self.project_out(heads) + + # Batch matrix multiplication to compute logits (batch_size, num_steps, graph_size) + # bmm is slightly faster than einsum and matmul + logits = ( + torch.bmm(glimpse, logit_key.squeeze(1).transpose(-2, -1)) + / math.sqrt(glimpse.size(-1)) + ).squeeze(1) + + return logits + + +def forward_eas( + self, + td: TensorDict, + cached_embeds, + best_solutions, + iter_count: int = 0, + env: Union[str, RL4COEnvBase] = None, + decode_type: str = "multistart_sampling", + num_starts: int = None, + mask_logits: bool = True, + temperature: float = 1.0, + tanh_clipping: float = 0, + **decode_kwargs, +): + """Forward pass of the decoder + Given the environment state and the pre-computed embeddings, compute the logits and sample actions + + Args: + td: Input TensorDict containing the environment state + embeddings: Precomputed embeddings for the nodes. Can be already precomputed cached in form of q, k, v and + env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that + it is more efficient to pass an already instantiated environment each time for fine-grained control + decode_type: Type of decoding to use. Can be one of: + - "sampling": sample from the logits + - "greedy": take the argmax of the logits + - "multistart_sampling": sample as sampling, but with multi-start decoding + - "multistart_greedy": sample as greedy, but with multi-start decoding + num_starts: Number of multi-starts to use. 
If None, will be calculated from the action mask + calc_reward: Whether to calculate the reward for the decoded sequence + """ + # TODO: this could be refactored by decoding strategies + + # Collect logprobs + logprobs = [] + actions = [] + + decode_step = 0 + # Multi-start decoding: first action is chosen by ad-hoc node selection + if num_starts > 1 or "multistart" in decode_type: + action = env.select_start_nodes(td, num_starts + 1) % num_starts + # Append incumbent solutions + if iter_count > 0: + action = unbatchify(action, num_starts + 1) + action[:, -1] = best_solutions[:, decode_step] + action = action.permute(1, 0).reshape(-1) + + # Expand td to batch_size * (num_starts + 1) + td = batchify(td, num_starts + 1) + + td.set("action", action) + td = env.step(td)["next"] + logp = torch.zeros_like( + td["action_mask"], device=td.device + ) # first logprobs is 0, so p = logprobs.exp() = 1 + + logprobs.append(logp) + actions.append(action) + + # Main decoding: loop until all sequences are done + while not td["done"].all(): + decode_step += 1 + logits, mask = self.forward(td, cached_embeds, num_starts + 1) + + logp = process_logits( + logits, + mask, + temperature=self.temperature if self.temperature is not None else temperature, + tanh_clipping=self.tanh_clipping + if self.tanh_clipping is not None + else tanh_clipping, + mask_logits=self.mask_logits if self.mask_logits is not None else mask_logits, + ) + + # Select the indices of the next nodes in the sequences, result (batch_size) long + action = decode_logprobs(logp, mask, decode_type=decode_type) + + if iter_count > 0: # append incumbent solutions + init_shp = action.shape + action = unbatchify(action, num_starts + 1) + action[:, -1] = best_solutions[:, decode_step] + action = action.permute(1, 0).reshape(init_shp) + + td.set("action", action) + td = env.step(td)["next"] + + # Collect output of step + logprobs.append(logp) + actions.append(action) + + logprobs, actions = torch.stack(logprobs, 1), 
torch.stack(actions, 1) + rewards = env.get_reward(td, actions) + return logprobs, actions, td, rewards diff --git a/rl4co/models/zoo/eas/nn.py b/rl4co/models/zoo/eas/nn.py new file mode 100644 index 00000000..68a23f20 --- /dev/null +++ b/rl4co/models/zoo/eas/nn.py @@ -0,0 +1,30 @@ +import torch +import torch.nn as nn + + +class EASLayerNet(nn.Module): + """Instantiate weights and biases for the added layer. + The layer is defined as: h = relu(emb * W1 + b1); out = h * W2 + b2. + Wrapping in `nn.Parameter` makes the parameters trainable and sets gradient to True. + + Args: + num_instances: Number of instances in the dataset + emb_dim: Dimension of the embedding + """ + + def __init__(self, num_instances: int, emb_dim: int): + super().__init__() + # W2 and b2 are initialized to zero so in the first iteration the layer is identity + self.W1 = nn.Parameter(torch.randn(num_instances, emb_dim, emb_dim)) + self.b1 = nn.Parameter(torch.randn(num_instances, 1, emb_dim)) + self.W2 = nn.Parameter(torch.zeros(num_instances, emb_dim, emb_dim)) + self.b2 = nn.Parameter(torch.zeros(num_instances, 1, emb_dim)) + torch.nn.init.xavier_uniform_(self.W1) + torch.nn.init.xavier_uniform_(self.b1) + + def forward(self, *args): + """emb: [num_instances, group_num, emb_dim]""" + # get tensor arg (from partial instantiation) + emb = [arg for arg in args if isinstance(arg, torch.Tensor)][0] + h = torch.relu(torch.matmul(emb, self.W1) + self.b1.expand_as(emb)) + return torch.matmul(h, self.W2) + self.b2.expand_as(h) diff --git a/rl4co/models/zoo/eas/search.py b/rl4co/models/zoo/eas/search.py new file mode 100644 index 00000000..ef352d93 --- /dev/null +++ b/rl4co/models/zoo/eas/search.py @@ -0,0 +1,346 @@ +import time + +from functools import partial +from typing import Any, List, Union + +import torch + +from lightning.pytorch.utilities.types import STEP_OUTPUT +from torch.nn.utils.rnn import pad_sequence +from torch.utils.data import Dataset + +from rl4co.data.transforms import 
StateAugmentation +from rl4co.models.common.transductive import TransductiveModel +from rl4co.models.zoo.eas.decoder import forward_eas, forward_pointer_attn_eas_lay +from rl4co.models.zoo.eas.nn import EASLayerNet +from rl4co.utils.decoding import get_log_likelihood +from rl4co.utils.ops import batchify, gather_by_index, unbatchify +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class EAS(TransductiveModel): + """Efficient Active Search for Neural Combination Optimization from Hottung et al. (2022). + Fine-tunes a subset of parameters (such as node embeddings or newly added layers) thus avoiding + expensive re-encoding of the problem. + Reference: https://openreview.net/pdf?id=nO5caZwFwYu + + Args: + env: RL4CO environment to be solved + policy: policy network + dataset: dataset to be used for training + use_eas_embedding: whether to use EAS embedding (EASEmb) + use_eas_layer: whether to use EAS layer (EASLay) + eas_emb_cache_keys: keys to cache in the embedding + eas_lambda: lambda parameter for IL loss + batch_size: batch size for training + max_iters: maximum number of iterations + augment_size: number of augmentations per state + augment_dihedral: whether to augment with dihedral rotations + parallel_runs: number of parallel runs + baseline: REINFORCE baseline type (multistart, symmetric, full) + max_runtime: maximum runtime in seconds + save_path: path to save solution checkpoints + optimizer: optimizer to use for training + optimizer_kwargs: keyword arguments for optimizer + verbose: whether to print progress for each iteration + """ + + def __init__( + self, + env, + policy, + dataset: Union[Dataset, str], + use_eas_embedding: bool = True, + use_eas_layer: bool = False, + eas_emb_cache_keys: List[str] = ["logit_key"], + eas_lambda: float = 0.013, + batch_size: int = 2, + max_iters: int = 200, + augment_size: int = 8, + augment_dihedral: bool = True, + num_parallel_runs: int = 1, + baseline: str = "multistart", + 
max_runtime: int = 86_400, + save_path: str = None, + optimizer: Union[str, torch.optim.Optimizer, partial] = "Adam", + optimizer_kwargs: dict = {"lr": 0.0041, "weight_decay": 1e-6}, + verbose: bool = True, + **kwargs, + ): + self.save_hyperparameters(logger=False) + + assert ( + self.hparams.use_eas_embedding or self.hparams.use_eas_layer + ), "At least one of `use_eas_embedding` or `use_eas_layer` must be True." + + super(EAS, self).__init__( + env, + policy=policy, + dataset=dataset, + batch_size=batch_size, + max_iters=max_iters, + max_runtime=max_runtime, + save_path=save_path, + optimizer=optimizer, + optimizer_kwargs=optimizer_kwargs, + **kwargs, + ) + + assert self.hparams.baseline in [ + "multistart", + "symmetric", + "full", + ], f"Baseline {self.hparams.baseline} not supported." + + def setup(self, stage="fit"): + """Setup base class and instantiate: + - augmentation + - instance solutions and rewards + - original policy state dict + """ + log.info( + f"Setting up Efficient Active Search (EAS) with: \n" + f"- EAS Embedding: {self.hparams.use_eas_embedding} \n" + f"- EAS Layer: {self.hparams.use_eas_layer} \n" + ) + super(EAS, self).setup(stage) + + # Instantiate augmentation + self.augmentation = StateAugmentation( + num_augment=self.hparams.augment_size, + augment_fn="dihedral8" if self.hparams.augment_dihedral else "symmetric", + ) + + # Store original policy state dict + self.original_policy_state = self.policy.state_dict() + + # Get dataset size and problem size + len(self.dataset) + _batch = next(iter(self.train_dataloader())) + self.problem_size = self.env.reset(_batch)["action_mask"].shape[-1] + self.instance_solutions = [] + self.instance_rewards = [] + + def on_train_batch_start(self, batch: Any, batch_idx: int): + """Called before training (i.e. search) for a new batch begins. + We re-load the original policy state dict and configure all parameters not to require gradients. + We do the rest in the training step. 
+ """ + self.policy.load_state_dict(self.original_policy_state) + + # Set all policy parameters to not require gradients + for param in self.policy.parameters(): + param.requires_grad = False + + def training_step(self, batch, batch_idx): + """Main search loop. We use the training step to effectively adapt to a `batch` of instances.""" + # Augment state + batch_size = batch.shape[0] + td_init = self.env.reset(batch) + n_aug, n_start, n_runs = ( + self.augmentation.num_augment, + self.env.get_num_starts(td_init), + self.hparams.num_parallel_runs, + ) + td_init = self.augmentation(td_init) + td_init = batchify(td_init, n_runs) + num_instances = batch_size * n_aug * n_runs # NOTE: no num_starts! + # batch_r = n_runs * batch_size # effective batch size + group_s = ( + n_start + 1 + ) # number of different rollouts per instance (+1 for incumbent solution construction) + + # Get encoder and decoder for simplicity + encoder = self.policy.encoder + decoder = self.policy.decoder + + # Precompute the cache of the embeddings (i.e. q,k,v and logit_key) + embeddings, _ = encoder(td_init) + cached_embeds = decoder._precompute_cache(embeddings) + + # Collect optimizer parameters + opt_params = [] + if self.hparams.use_eas_layer: + # EASLay: replace forward of logit attention computation. 
EASLayer + eas_layer = EASLayerNet(num_instances, decoder.embed_dim).to(batch.device) + decoder.pointer.eas_layer = partial(eas_layer, decoder.pointer) + decoder.pointer.forward = partial( + forward_pointer_attn_eas_lay, decoder.pointer + ) + for param in eas_layer.parameters(): + opt_params.append(param) + if self.hparams.use_eas_embedding: + # EASEmb: set gradient of emb_key to True + # for all the keys, wrap the embedding in a nn.Parameter + for key in self.hparams.eas_emb_cache_keys: + setattr( + cached_embeds, key, torch.nn.Parameter(getattr(cached_embeds, key)) + ) + opt_params.append(getattr(cached_embeds, key)) + decoder.forward_eas = partial(forward_eas, decoder) + + # We pass attributes saved in policy too + def set_attr_if_exists(attr): + if hasattr(self.policy, attr): + setattr(decoder, attr, getattr(self.policy, attr)) + + for attr in ["temperature", "tanh_clipping", "mask_logits"]: + set_attr_if_exists(attr) + + self.configure_optimizers(opt_params) + + # Solution and reward buffer + max_reward = torch.full((batch_size,), -float("inf"), device=batch.device) + best_solutions = torch.zeros( + batch_size, self.problem_size * 2, device=batch.device, dtype=int + ) # i.e. 
incumbent solutions + + # Init search + t_start = time.time() + for iter_count in range(self.hparams.max_iters): + # Evaluate policy with sampling multistarts passing the cached embeddings + best_solutions_expanded = best_solutions.repeat(n_aug, 1).repeat(n_runs, 1) + logprobs, actions, td_out, reward = decoder.forward_eas( + td_init.clone(), + cached_embeds=cached_embeds, + best_solutions=best_solutions_expanded, + iter_count=iter_count, + env=self.env, + decode_type="multistart_sampling", + num_starts=n_start, + ) + + # Unbatchify to get correct dimensions + ll = get_log_likelihood(logprobs, actions, td_out.get("mask", None)) + ll = unbatchify(ll, (n_runs * batch_size, n_aug, group_s)).squeeze() + reward = unbatchify(reward, (n_runs * batch_size, n_aug, group_s)).squeeze() + actions = unbatchify(actions, (n_runs * batch_size, n_aug, group_s)).squeeze() + + # Compute REINFORCE loss with shared baselines + # compared to original EAS, we also support symmetric and full baselines + group_reward = reward[..., :-1] # exclude incumbent solution + if self.hparams.baseline == "multistart": + bl_val = group_reward.mean(dim=-1, keepdim=True) + elif self.hparams.baseline == "symmetric": + bl_val = group_reward.mean(dim=-2, keepdim=True) + elif self.hparams.baseline == "full": + bl_val = group_reward.mean(dim=-1, keepdim=True).mean( + dim=-2, keepdim=True + ) + else: + raise ValueError(f"Baseline {self.hparams.baseline} not supported.") + + # REINFORCE loss + advantage = group_reward - bl_val + loss_rl = -(advantage * ll[..., :-1]).mean() + # IL loss + loss_il = -ll[..., -1].mean() + # Total loss + loss = loss_rl + self.hparams.eas_lambda * loss_il + + # Manual backpropagation + opt = self.optimizers() + opt.zero_grad() + self.manual_backward(loss) + + # Save best solutions and rewards + # Get max reward for each group and instance + max_reward = reward.max(dim=2)[0].max(dim=1)[0] + + # Reshape and rank rewards + reward_group = reward.reshape(n_runs * batch_size, -1) + _, 
top_indices = torch.topk(reward_group, k=1, dim=1) + + # Obtain best solutions found so far + solutions = actions.reshape(n_runs * batch_size, n_aug * group_s, -1) + best_solutions_iter = gather_by_index(solutions, top_indices, dim=1) + best_solutions[:, : best_solutions_iter.shape[1]] = best_solutions_iter + + self.log_dict( + { + "loss": loss, + "max_reward": max_reward.mean(), + "step": iter_count, + "time": time.time() - t_start, + }, + on_step=self.log_on_step, + ) + + log.info( + f"{iter_count}/{self.hparams.max_iters} | " + f" Reward: {max_reward.mean().item():.2f} " + ) + + # Stop if max runtime is exceeded + if time.time() - t_start > self.hparams.max_runtime: + log.info(f"Max runtime of {self.hparams.max_runtime} seconds exceeded.") + break + + return {"max_reward": max_reward, "best_solutions": best_solutions} + + def on_train_batch_end( + self, outputs: STEP_OUTPUT, batch: Any, batch_idx: int + ) -> None: + """We store the best solution and reward found.""" + max_rewards, best_solutions = outputs["max_reward"], outputs["best_solutions"] + self.instance_solutions.append(best_solutions) + self.instance_rewards.append(max_rewards) + log.info(f"Best reward: {max_rewards.mean():.2f}") + + def on_train_epoch_end(self) -> None: + """Called when the train ends.""" + save_path = self.hparams.save_path + # concatenate solutions and rewards + self.instance_solutions = pad_sequence( + self.instance_solutions, batch_first=True, padding_value=0 + ).squeeze() + self.instance_rewards = torch.cat(self.instance_rewards, dim=0).squeeze() + if save_path is not None: + log.info(f"Saving solutions and rewards to {save_path}...") + torch.save( + {"solutions": self.instance_solutions, "rewards": self.instance_rewards}, + save_path, + ) + + # https://github.com/Lightning-AI/lightning/issues/1406 + self.trainer.should_stop = True + + +class EASEmb(EAS): + """EAS with embedding adaptation""" + + def __init__( + self, + *args, + **kwargs, + ): + if not 
kwargs.get("use_eas_embedding", False) or kwargs.get( + "use_eas_layer", True + ): + log.warning( + "Setting `use_eas_embedding` to True and `use_eas_layer` to False. Use EAS base class to override." + ) + kwargs["use_eas_embedding"] = True + kwargs["use_eas_layer"] = False + super(EASEmb, self).__init__(*args, **kwargs) + + +class EASLay(EAS): + """EAS with layer adaptation""" + + def __init__( + self, + *args, + **kwargs, + ): + if kwargs.get("use_eas_embedding", False) or not kwargs.get( + "use_eas_layer", True + ): + log.warning( + "Setting `use_eas_embedding` to True and `use_eas_layer` to False. Use EAS base class to override." + ) + kwargs["use_eas_embedding"] = False + kwargs["use_eas_layer"] = True + super(EASLay, self).__init__(*args, **kwargs) diff --git a/rl4co/models/zoo/ham/__init__.py b/rl4co/models/zoo/ham/__init__.py new file mode 100644 index 00000000..1e283fc4 --- /dev/null +++ b/rl4co/models/zoo/ham/__init__.py @@ -0,0 +1,2 @@ +from .model import HeterogeneousAttentionModel +from .policy import HeterogeneousAttentionModelPolicy diff --git a/rl4co/models/zoo/ham/attention.py b/rl4co/models/zoo/ham/attention.py new file mode 100644 index 00000000..0c4d593e --- /dev/null +++ b/rl4co/models/zoo/ham/attention.py @@ -0,0 +1,488 @@ +import math + +import torch +import torch.nn as nn + + +class HeterogenousMHA(nn.Module): + def __init__(self, num_heads, input_dim, embed_dim=None, val_dim=None, key_dim=None): + """ + Heterogenous Multi-Head Attention for Pickup and Delivery problems + https://arxiv.org/abs/2110.02634 + """ + super(HeterogenousMHA, self).__init__() + + if val_dim is None: + assert embed_dim is not None, "Provide either embed_dim or val_dim" + val_dim = embed_dim // num_heads + if key_dim is None: + key_dim = val_dim + + self.num_heads = num_heads + self.input_dim = input_dim + self.embed_dim = embed_dim + self.val_dim = val_dim + self.key_dim = key_dim + + self.norm_factor = 1 / math.sqrt(key_dim) # See Attention is all you need + + 
self.W_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + self.W_key = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + self.W_val = nn.Parameter(torch.Tensor(num_heads, input_dim, val_dim)) + + # Pickup weights + self.W1_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + self.W2_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + self.W3_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + + # Delivery weights + self.W4_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + self.W5_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + self.W6_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim)) + + if embed_dim is not None: + self.W_out = nn.Parameter(torch.Tensor(num_heads, key_dim, embed_dim)) + + self.init_parameters() + + def init_parameters(self): + for param in self.parameters(): + stdv = 1.0 / math.sqrt(param.size(-1)) + param.data.uniform_(-stdv, stdv) + + def forward(self, q, h=None, mask=None): + """ + Args: + q: queries (batch_size, n_query, input_dim) + h: data (batch_size, graph_size, input_dim) + mask: mask (batch_size, n_query, graph_size) or viewable as that (i.e. can be 2 dim if n_query == 1) + + Mask should contain 1 if attention is not possible (i.e. 
mask is negative adjacency) + """ + if h is None: + h = q # compute self-attention + + # h should be (batch_size, graph_size, input_dim) + batch_size, graph_size, input_dim = h.size() + + # Check if graph size is odd number + assert ( + graph_size % 2 == 1 + ), "Graph size should have odd number of nodes due to pickup-delivery problem \ + (n/2 pickup, n/2 delivery, 1 depot)" + + n_query = q.size(1) + assert q.size(0) == batch_size + assert q.size(2) == input_dim + assert input_dim == self.input_dim, "Wrong embedding dimension of input" + + hflat = h.contiguous().view(-1, input_dim) # [batch_size * graph_size, embed_dim] + qflat = q.contiguous().view(-1, input_dim) # [batch_size * n_query, embed_dim] + + # last dimension can be different for keys and values + shp = (self.num_heads, batch_size, graph_size, -1) + shp_q = (self.num_heads, batch_size, n_query, -1) + + # pickup -> its delivery attention + n_pick = (graph_size - 1) // 2 + shp_delivery = (self.num_heads, batch_size, n_pick, -1) + shp_q_pick = (self.num_heads, batch_size, n_pick, -1) + + # pickup -> all pickups attention + shp_allpick = (self.num_heads, batch_size, n_pick, -1) + shp_q_allpick = (self.num_heads, batch_size, n_pick, -1) + + # pickup -> all pickups attention + shp_alldelivery = (self.num_heads, batch_size, n_pick, -1) + shp_q_alldelivery = (self.num_heads, batch_size, n_pick, -1) + + # Calculate queries, (num_heads, n_query, graph_size, key/val_size) + Q = torch.matmul(qflat, self.W_query).view(shp_q) + # Calculate keys and values (num_heads, batch_size, graph_size, key/val_size) + K = torch.matmul(hflat, self.W_key).view(shp) + V = torch.matmul(hflat, self.W_val).view(shp) + + # pickup -> its delivery + pick_flat = ( + h[:, 1 : n_pick + 1, :].contiguous().view(-1, input_dim) + ) # [batch_size * n_pick, embed_dim] + delivery_flat = ( + h[:, n_pick + 1 :, :].contiguous().view(-1, input_dim) + ) # [batch_size * n_pick, embed_dim] + + # pickup -> its delivery attention + Q_pick = 
torch.matmul(pick_flat, self.W1_query).view( + shp_q_pick + ) # (self.num_heads, batch_size, n_pick, key_size) + K_delivery = torch.matmul(delivery_flat, self.W_key).view( + shp_delivery + ) # (self.num_heads, batch_size, n_pick, -1) + V_delivery = torch.matmul(delivery_flat, self.W_val).view( + shp_delivery + ) # (num_heads, batch_size, n_pick, key/val_size) + + # pickup -> all pickups attention + Q_pick_allpick = torch.matmul(pick_flat, self.W2_query).view( + shp_q_allpick + ) # (self.num_heads, batch_size, n_pick, -1) + K_allpick = torch.matmul(pick_flat, self.W_key).view( + shp_allpick + ) # [self.num_heads, batch_size, n_pick, key_size] + V_allpick = torch.matmul(pick_flat, self.W_val).view( + shp_allpick + ) # [self.num_heads, batch_size, n_pick, key_size] + + # pickup -> all delivery + Q_pick_alldelivery = torch.matmul(pick_flat, self.W3_query).view( + shp_q_alldelivery + ) # (self.num_heads, batch_size, n_pick, key_size) + K_alldelivery = torch.matmul(delivery_flat, self.W_key).view( + shp_alldelivery + ) # (self.num_heads, batch_size, n_pick, -1) + V_alldelivery = torch.matmul(delivery_flat, self.W_val).view( + shp_alldelivery + ) # (num_heads, batch_size, n_pick, key/val_size) + + # pickup -> its delivery + V_additional_delivery = torch.cat( + [ # [num_heads, batch_size, graph_size, key_size] + torch.zeros( + self.num_heads, + batch_size, + 1, + self.input_dim // self.num_heads, + dtype=V.dtype, + device=V.device, + ), + V_delivery, # [num_heads, batch_size, n_pick, key/val_size] + torch.zeros( + self.num_heads, + batch_size, + n_pick, + self.input_dim // self.num_heads, + dtype=V.dtype, + device=V.device, + ), + ], + 2, + ) + + # delivery -> its pickup attention + Q_delivery = torch.matmul(delivery_flat, self.W4_query).view( + shp_delivery + ) # (self.num_heads, batch_size, n_pick, key_size) + K_pick = torch.matmul(pick_flat, self.W_key).view( + shp_q_pick + ) # (self.num_heads, batch_size, n_pick, -1) + V_pick = torch.matmul(pick_flat, self.W_val).view( 
+ shp_q_pick + ) # (num_heads, batch_size, n_pick, key/val_size) + + # delivery -> all delivery attention + Q_delivery_alldelivery = torch.matmul(delivery_flat, self.W5_query).view( + shp_alldelivery + ) # (self.num_heads, batch_size, n_pick, -1) + K_alldelivery2 = torch.matmul(delivery_flat, self.W_key).view( + shp_alldelivery + ) # [self.num_heads, batch_size, n_pick, key_size] + V_alldelivery2 = torch.matmul(delivery_flat, self.W_val).view( + shp_alldelivery + ) # [self.num_heads, batch_size, n_pick, key_size] + + # delivery -> all pickup + Q_delivery_allpickup = torch.matmul(delivery_flat, self.W6_query).view( + shp_alldelivery + ) # (self.num_heads, batch_size, n_pick, key_size) + K_allpickup2 = torch.matmul(pick_flat, self.W_key).view( + shp_q_alldelivery + ) # (self.num_heads, batch_size, n_pick, -1) + V_allpickup2 = torch.matmul(pick_flat, self.W_val).view( + shp_q_alldelivery + ) # (num_heads, batch_size, n_pick, key/val_size) + + # delivery -> its pick up + V_additional_pick = torch.cat( + [ # [num_heads, batch_size, graph_size, key_size] + torch.zeros( + self.num_heads, + batch_size, + 1, + self.input_dim // self.num_heads, + dtype=V.dtype, + device=V.device, + ), + torch.zeros( + self.num_heads, + batch_size, + n_pick, + self.input_dim // self.num_heads, + dtype=V.dtype, + device=V.device, + ), + V_pick, # [num_heads, batch_size, n_pick, key/val_size] + ], + 2, + ) + + # Calculate compatibility (num_heads, batch_size, n_query, graph_size) + compatibility = self.norm_factor * torch.matmul(Q, K.transpose(2, 3)) + + ##Pick up pair attention + compatibility_pick_delivery = self.norm_factor * torch.sum( + Q_pick * K_delivery, -1 + ) # element_wise, [num_heads, batch_size, n_pick] + # [num_heads, batch_size, n_pick, n_pick] + compatibility_pick_allpick = self.norm_factor * torch.matmul( + Q_pick_allpick, K_allpick.transpose(2, 3) + ) # [num_heads, batch_size, n_pick, n_pick] + compatibility_pick_alldelivery = self.norm_factor * torch.matmul( + 
Q_pick_alldelivery, K_alldelivery.transpose(2, 3) + ) # [num_heads, batch_size, n_pick, n_pick] + + ##Delivery + compatibility_delivery_pick = self.norm_factor * torch.sum( + Q_delivery * K_pick, -1 + ) # element_wise, [num_heads, batch_size, n_pick] + compatibility_delivery_alldelivery = self.norm_factor * torch.matmul( + Q_delivery_alldelivery, K_alldelivery2.transpose(2, 3) + ) # [num_heads, batch_size, n_pick, n_pick] + compatibility_delivery_allpick = self.norm_factor * torch.matmul( + Q_delivery_allpickup, K_allpickup2.transpose(2, 3) + ) # [num_heads, batch_size, n_pick, n_pick] + + ##Pick up-> + # compatibility_additional?pickup????delivery????attention(size 1),1:n_pick+1??attention,depot?delivery?? + compatibility_additional_delivery = torch.cat( + [ # [num_heads, batch_size, graph_size, 1] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + 1, + dtype=compatibility.dtype, + device=compatibility.device, + ), + compatibility_pick_delivery, # [num_heads, batch_size, n_pick] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + ], + -1, + ).view(self.num_heads, batch_size, graph_size, 1) + + compatibility_additional_allpick = torch.cat( + [ # [num_heads, batch_size, graph_size, n_pick] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + 1, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + compatibility_pick_allpick, # [num_heads, batch_size, n_pick, n_pick] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + n_pick, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + ], + 2, + ).view(self.num_heads, batch_size, graph_size, n_pick) + + compatibility_additional_alldelivery = torch.cat( + [ # [num_heads, batch_size, graph_size, n_pick] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + 1, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + 
compatibility_pick_alldelivery, # [num_heads, batch_size, n_pick, n_pick] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + n_pick, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + ], + 2, + ).view(self.num_heads, batch_size, graph_size, n_pick) + # [num_heads, batch_size, n_query, graph_size+1+n_pick+n_pick] + + # Delivery + compatibility_additional_pick = torch.cat( + [ # [num_heads, batch_size, graph_size, 1] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + 1, + dtype=compatibility.dtype, + device=compatibility.device, + ), + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + compatibility_delivery_pick, # [num_heads, batch_size, n_pick] + ], + -1, + ).view(self.num_heads, batch_size, graph_size, 1) + + compatibility_additional_alldelivery2 = torch.cat( + [ # [num_heads, batch_size, graph_size, n_pick] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + 1, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + n_pick, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + compatibility_delivery_alldelivery, # [num_heads, batch_size, n_pick, n_pick] + ], + 2, + ).view(self.num_heads, batch_size, graph_size, n_pick) + + compatibility_additional_allpick2 = torch.cat( + [ # [num_heads, batch_size, graph_size, n_pick] + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + 1, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + float("-inf") + * torch.ones( + self.num_heads, + batch_size, + n_pick, + n_pick, + dtype=compatibility.dtype, + device=compatibility.device, + ), + compatibility_delivery_allpick, # [num_heads, batch_size, n_pick, n_pick] + ], + 2, + ).view(self.num_heads, batch_size, graph_size, n_pick) + + compatibility = torch.cat( + [ + compatibility, + 
compatibility_additional_delivery, + compatibility_additional_allpick, + compatibility_additional_alldelivery, + compatibility_additional_pick, + compatibility_additional_alldelivery2, + compatibility_additional_allpick2, + ], + dim=-1, + ) + + # Optionally apply mask to prevent attention + if mask is not None: + mask = mask.view(1, batch_size, n_query, graph_size).expand_as(compatibility) + compatibility[mask] = float("-inf") + + attn = torch.softmax( + compatibility, dim=-1 + ) # [num_heads, batch_size, n_query, graph_size+1+n_pick*2] (graph_size include depot) + + # If there are nodes with no neighbours then softmax returns nan so we fix them to 0 + if mask is not None: + attnc = attn.clone() + attnc[mask] = 0 + attn = attnc + + # heads: [num_heads, batrch_size, n_query, val_size] pick -> its delivery + heads = torch.matmul( + attn[:, :, :, :graph_size], V + ) # V: (self.num_heads, batch_size, graph_size, val_size) + heads = ( + heads + + attn[:, :, :, graph_size].view(self.num_heads, batch_size, graph_size, 1) + * V_additional_delivery + ) # V_addi:[num_heads, batch_size, graph_size, key_size] + + # Heads pick -> otherpick, V_allpick: # [num_heads, batch_size, n_pick, key_size] + heads = heads + torch.matmul( + attn[:, :, :, graph_size + 1 : graph_size + 1 + n_pick].view( + self.num_heads, batch_size, graph_size, n_pick + ), + V_allpick, + ) + + # V_alldelivery: # (num_heads, batch_size, n_pick, key/val_size) + heads = heads + torch.matmul( + attn[:, :, :, graph_size + 1 + n_pick : graph_size + 1 + 2 * n_pick].view( + self.num_heads, batch_size, graph_size, n_pick + ), + V_alldelivery, + ) + + # Delivery + heads = ( + heads + + attn[:, :, :, graph_size + 1 + 2 * n_pick].view( + self.num_heads, batch_size, graph_size, 1 + ) + * V_additional_pick + ) + heads = heads + torch.matmul( + attn[ + :, + :, + :, + graph_size + 1 + 2 * n_pick + 1 : graph_size + 1 + 3 * n_pick + 1, + ].view(self.num_heads, batch_size, graph_size, n_pick), + V_alldelivery2, + ) + heads = 
heads + torch.matmul( + attn[:, :, :, graph_size + 1 + 3 * n_pick + 1 :].view( + self.num_heads, batch_size, graph_size, n_pick + ), + V_allpickup2, + ) + + out = torch.mm( + heads.permute(1, 2, 0, 3) + .contiguous() + .view(-1, self.num_heads * self.val_dim), + self.W_out.view(-1, self.embed_dim), + ).view(batch_size, n_query, self.embed_dim) + + return out diff --git a/rl4co/models/zoo/ham/encoder.py b/rl4co/models/zoo/ham/encoder.py new file mode 100644 index 00000000..8a116336 --- /dev/null +++ b/rl4co/models/zoo/ham/encoder.py @@ -0,0 +1,73 @@ +import torch.nn as nn + +from rl4co.models.nn.env_embeddings import env_init_embedding +from rl4co.models.nn.graph.attnnet import Normalization, SkipConnection +from rl4co.models.zoo.ham.attention import HeterogenousMHA + + +class HeterogeneuousMHALayer(nn.Sequential): + def __init__( + self, + num_heads, + embed_dim, + feedforward_hidden=512, + normalization="batch", + ): + super(HeterogeneuousMHALayer, self).__init__( + SkipConnection(HeterogenousMHA(num_heads, embed_dim, embed_dim)), + Normalization(embed_dim, normalization), + SkipConnection( + nn.Sequential( + nn.Linear(embed_dim, feedforward_hidden), + nn.ReLU(), + nn.Linear(feedforward_hidden, embed_dim), + ) + if feedforward_hidden > 0 + else nn.Linear(embed_dim, embed_dim) + ), + Normalization(embed_dim, normalization), + ) + + +class GraphHeterogeneousAttentionEncoder(nn.Module): + def __init__( + self, + init_embedding=None, + num_heads=8, + embed_dim=128, + num_encoder_layers=3, + env_name=None, + normalization="batch", + feedforward_hidden=512, + sdpa_fn=None, + ): + super(GraphHeterogeneousAttentionEncoder, self).__init__() + + # substitute env_name with pdp if none + if env_name is None: + env_name = "pdp" + # Map input to embedding space + if init_embedding is None: + self.init_embedding = env_init_embedding(env_name, {"embed_dim": embed_dim}) + else: + self.init_embedding = init_embedding + + self.layers = nn.Sequential( + *( + HeterogeneuousMHALayer( + 
num_heads, + embed_dim, + feedforward_hidden, + normalization, + ) + for _ in range(num_encoder_layers) + ) + ) + + def forward(self, x, mask=None): + assert mask is None, "Mask not yet supported!" + # initial Embedding from features + init_embeds = self.init_embedding(x) # (batch_size, graph_size, embed_dim) + # layers (batch_size, graph_size, embed_dim) + embeds = self.layers(init_embeds) + return embeds, init_embeds diff --git a/rl4co/models/zoo/ham/model.py b/rl4co/models/zoo/ham/model.py new file mode 100644 index 00000000..416f7771 --- /dev/null +++ b/rl4co/models/zoo/ham/model.py @@ -0,0 +1,37 @@ +from typing import Union + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl import REINFORCE +from rl4co.models.rl.reinforce.baselines import REINFORCEBaseline +from rl4co.models.zoo.ham.policy import HeterogeneousAttentionModelPolicy + + +class HeterogeneousAttentionModel(REINFORCE): + """Heterogenous Attention Model for solving the Pickup and Delivery Problem based on + REINFORCE: https://arxiv.org/abs/2110.02634. + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + baseline: REINFORCE baseline. 
Defaults to rollout (1 epoch of exponential, then greedy rollout baseline) + policy_kwargs: Keyword arguments for policy + baseline_kwargs: Keyword arguments for baseline + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: HeterogeneousAttentionModelPolicy = None, + baseline: Union[REINFORCEBaseline, str] = "rollout", + policy_kwargs={}, + baseline_kwargs={}, + **kwargs, + ): + assert ( + env.name == "pdp" + ), "HeterogeneousAttentionModel only works for PDP (Pickup and Delivery Problem)" + if policy is None: + policy = HeterogeneousAttentionModelPolicy(env_name=env.name, **policy_kwargs) + + super().__init__(env, policy, baseline, baseline_kwargs, **kwargs) diff --git a/rl4co/models/zoo/ham/policy.py b/rl4co/models/zoo/ham/policy.py new file mode 100644 index 00000000..3dc8ddbc --- /dev/null +++ b/rl4co/models/zoo/ham/policy.py @@ -0,0 +1,62 @@ +from typing import Callable, Optional + +import torch.nn as nn + +from rl4co.models.zoo.am import AttentionModelPolicy +from rl4co.models.zoo.ham.encoder import GraphHeterogeneousAttentionEncoder + + +class HeterogeneousAttentionModelPolicy(AttentionModelPolicy): + """Heterogeneous Attention Model Policy based on https://ieeexplore.ieee.org/document/9352489. + We re-declare the most important arguments here for convenience as in the paper. + See :class:`rl4co.models.zoo.am.AttentionModelPolicy` for more details. + + Args: + encoder: Encoder module. Can be passed by sub-classes + env_name: Name of the environment used to initialize embeddings + init_embedding: Model to use for the initial embedding. 
If None, use the default embedding for the environment + embed_dim: Dimension of the embeddings + num_encoder_layers: Number of layers in the encoder + num_heads: Number of heads for the attention in encoder + normalization: Normalization to use for the attention layers + feedforward_hidden: Dimension of the hidden layer in the feedforward network + sdpa_fn: Function to use for the scaled dot product attention + **kwargs: keyword arguments passed to the :class:`rl4co.models.zoo.am.AttentionModelPolicy` + """ + + def __init__( + self, + encoder: nn.Module = None, + env_name: str = "pdp", + init_embedding: nn.Module = None, + embed_dim: int = 128, + num_encoder_layers: int = 3, + num_heads: int = 8, + normalization: str = "batch", + feedforward_hidden: int = 512, + sdpa_fn: Optional[Callable] = None, + **kwargs, + ): + if encoder is None: + encoder = GraphHeterogeneousAttentionEncoder( + init_embedding=init_embedding, + num_heads=num_heads, + embed_dim=embed_dim, + num_encoder_layers=num_encoder_layers, + env_name=env_name, + normalization=normalization, + feedforward_hidden=feedforward_hidden, + sdpa_fn=sdpa_fn, + ) + else: + encoder = encoder + + super(HeterogeneousAttentionModelPolicy, self).__init__( + env_name=env_name, + encoder=encoder, + embed_dim=embed_dim, + num_encoder_layers=num_encoder_layers, + num_heads=num_heads, + normalization=normalization, + **kwargs, + ) diff --git a/rl4co/models/zoo/l2d/__init__.py b/rl4co/models/zoo/l2d/__init__.py new file mode 100644 index 00000000..398dea98 --- /dev/null +++ b/rl4co/models/zoo/l2d/__init__.py @@ -0,0 +1,2 @@ +from .model import L2DModel, L2DPPOModel +from .policy import L2DAttnPolicy, L2DPolicy, L2DPolicy4PPO diff --git a/rl4co/models/zoo/l2d/decoder.py b/rl4co/models/zoo/l2d/decoder.py new file mode 100644 index 00000000..833e9c6e --- /dev/null +++ b/rl4co/models/zoo/l2d/decoder.py @@ -0,0 +1,389 @@ +import abc + +from typing import Any, Tuple + +import torch +import torch.nn as nn + +from einops import 
einsum, rearrange +from tensordict import TensorDict +from torch import Tensor + +from rl4co.models.common.constructive.autoregressive import AutoregressiveDecoder +from rl4co.models.nn.attention import PointerAttention +from rl4co.models.nn.env_embeddings.context import SchedulingContext +from rl4co.models.nn.env_embeddings.dynamic import JSSPDynamicEmbedding +from rl4co.models.nn.graph.hgnn import HetGNNEncoder +from rl4co.models.nn.mlp import MLP +from rl4co.models.zoo.am.decoder import AttentionModelDecoder, PrecomputedCache +from rl4co.utils.ops import batchify, gather_by_index + +from .encoder import GCN4JSSP + + +class L2DActor(nn.Module, metaclass=abc.ABCMeta): + """Base decoder model for actor in L2D. The actor is responsible for generating the logits for the action + similar to the decoder in autoregressive models. Since the decoder in L2D can have the additional purpose + of extracting features (i.e. encoding the environment in ever iteration), we need an additional actor class. + This function serves as template for such actor classes in L2D + """ + + @abc.abstractmethod + def forward( + self, td: TensorDict, hidden: Any = None, num_starts: int = 0 + ) -> Tuple[Tensor, Tensor]: + """Obtain logits for current action to the next ones + + Args: + td: TensorDict containing the input data + hidden: Hidden state from the encoder. Can be any type + num_starts: Number of starts for multistart decoding + + Returns: + Tuple containing the logits and the action mask + """ + raise NotImplementedError("Implement me in subclass!") + + def pre_decoder_hook( + self, td: TensorDict, env=None, hidden: Any = None, num_starts: int = 0 + ) -> Tuple[TensorDict, Any]: + """By default, we only require the input for the actor to be a tuple + (in JSSP we only have operation embeddings but in FJSP we have operation + and machine embeddings. By expecting a tuple we can generalize things.) 
+ + Args: + td: TensorDict containing the input data + hidden: Hidden state from the encoder + num_starts: Number of starts for multistart decoding + + Returns: + Tuple containing the updated hidden state(s) and the input TensorDict + """ + + hidden = (hidden,) if not isinstance(hidden, tuple) else hidden + + if num_starts > 1: + # NOTE: when using pomo, we need this + hidden = tuple(map(lambda x: batchify(x, num_starts), hidden)) + + return td, env, hidden + + +class JSSPActor(L2DActor): + def __init__( + self, + embed_dim: int, + hidden_dim: int, + hidden_layers: int = 2, + het_emb: bool = False, + check_nan: bool = True, + ) -> None: + super().__init__() + + input_dim = (1 + int(het_emb)) * embed_dim + self.mlp = MLP( + input_dim=input_dim, + output_dim=1, + num_neurons=[hidden_dim] * hidden_layers, + hidden_act="ReLU", + out_act="Identity", + input_norm="None", + output_norm="None", + ) + self.het_emb = het_emb + self.dummy = nn.Parameter(torch.rand(input_dim)) + self.check_nan = check_nan + + def forward(self, td, op_emb, ma_emb=None): + bs = td.size(0) + # (bs, n_j) + next_op = td["next_op"] + # (bs, n_j, emb) + job_emb = gather_by_index(op_emb, next_op, dim=1) + if ma_emb is not None: + ma_emb_per_op = einsum(td["ops_ma_adj"], ma_emb, "b m o, b m e -> b o e") + # (bs, n_j, emb) + ma_emb_per_job = gather_by_index(ma_emb_per_op, next_op, dim=1) + # (bs, n_j, 2 * emb) + job_emb = torch.cat((job_emb, ma_emb_per_job), dim=2) + # (bs, n_j, 2 * emb) + no_ops = self.dummy[None, None].expand(bs, 1, -1) + # (bs, 1 + n_j, 2 * emb) + all_actions = torch.cat((no_ops, job_emb), 1) + # (bs, 1 + n_j) + logits = self.mlp(all_actions).squeeze(2) + + if self.check_nan: + assert not torch.isnan(logits).any(), "Logits contain NaNs" + + # (b, 1 + j) + mask = td["action_mask"] + + return logits, mask + + +class FJSPActor(L2DActor): + def __init__( + self, + embed_dim: int, + hidden_dim: int, + hidden_layers: int = 2, + check_nan: bool = True, + ) -> None: + super().__init__() + 
self.mlp = MLP( + input_dim=2 * embed_dim, + output_dim=1, + num_neurons=[hidden_dim] * hidden_layers, + hidden_act="ReLU", + out_act="Identity", + input_norm="None", + output_norm="None", + ) + self.dummy = nn.Parameter(torch.rand(2 * embed_dim)) + self.check_nan = check_nan + + def forward(self, td, ops_emb, ma_emb): + bs, n_ma = ma_emb.shape[:2] + # (bs, n_jobs, emb) + job_emb = gather_by_index(ops_emb, td["next_op"], squeeze=False) + # (bs, n_jobs, n_ma, emb) + job_emb_expanded = job_emb.unsqueeze(2).expand(-1, -1, n_ma, -1) + ma_emb_expanded = ma_emb.unsqueeze(1).expand_as(job_emb_expanded) + # (bs, num_jobs * n_ma, 2*emb) + h_actions = torch.cat((job_emb_expanded, ma_emb_expanded), dim=-1).flatten(1, 2) + # (bs, 1, 2*emb_dim) + no_ops = self.dummy[None, None].expand(bs, 1, -1) + # (bs, num_jobs * n_ma + 1, 2*emb_dim) + h_actions_w_noop = torch.cat((no_ops, h_actions), 1) + # (b, j*m) + logits = self.mlp(h_actions_w_noop).squeeze(-1) + + if self.check_nan: + assert not torch.isnan(logits).any(), "Logits contain NaNs" + # (b, 1 + j) + mask = td["action_mask"] + return logits, mask + + +class L2DDecoder(AutoregressiveDecoder): + # feature extractor + actor + def __init__( + self, + env_name: str = "jssp", + feature_extractor: nn.Module = None, + actor: nn.Module = None, + init_embedding: nn.Module = None, + embed_dim: int = 128, + actor_hidden_dim: int = 128, + actor_hidden_layers: int = 2, + num_encoder_layers: int = 3, + normalization: str = "batch", + het_emb: bool = False, + stepwise: bool = False, + scaling_factor: int = 1000, + ): + super(L2DDecoder, self).__init__() + + if feature_extractor is None and stepwise: + if env_name == "fjsp" or (het_emb and env_name == "jssp"): + feature_extractor = HetGNNEncoder( + env_name=env_name, + embed_dim=embed_dim, + num_layers=num_encoder_layers, + normalization=normalization, + init_embedding=init_embedding, + scaling_factor=scaling_factor, + ) + else: + feature_extractor = GCN4JSSP( + embed_dim, + 
num_encoder_layers, + init_embedding=init_embedding, + scaling_factor=scaling_factor, + ) + + self.feature_extractor = feature_extractor + + if actor is None: + if env_name == "fjsp": + actor = FJSPActor( + embed_dim=embed_dim, + hidden_dim=actor_hidden_dim, + hidden_layers=actor_hidden_layers, + ) + else: + actor = JSSPActor( + embed_dim=embed_dim, + hidden_dim=actor_hidden_dim, + hidden_layers=actor_hidden_layers, + het_emb=het_emb, + ) + + self.actor = actor + + def forward(self, td, hidden, num_starts): + if hidden is None: + # NOTE in case we have multiple starts, td is batchified + # (through decoding strategy pre decoding hook). Thus the + # embeddings from feature_extractor have the correct shape + num_starts = 0 + # (bs, n_j * n_ops, e), (bs, n_m, e) + hidden, _ = self.feature_extractor(td) + + td, _, hidden = self.actor.pre_decoder_hook(td, None, hidden, num_starts) + + # (bs, n_j, e) + logits, mask = self.actor(td, *hidden) + + return logits, mask + + +class L2DAttnPointer(PointerAttention): + def __init__( + self, + env_name: str, + embed_dim: int, + num_heads: int, + out_bias: bool = False, + check_nan: bool = True, + ): + super().__init__( + embed_dim=embed_dim, + num_heads=num_heads, + mask_inner=False, + out_bias=out_bias, + check_nan=check_nan, + ) + self.env_name = env_name + + def forward(self, query, key, value, logit_key, attn_mask=None): + # bs = query.size(0) + # (b m j) + logits = super().forward(query, key, value, logit_key, attn_mask=attn_mask) + if self.env_name == "jssp": + # (b j) + logits = logits.sum(1) + elif self.env_name == "fjsp": + no_op_logits = logits[..., 0].sum(1, keepdims=True) + logits = rearrange(logits[..., 1:], "b m j -> b (j m)") + logits = torch.cat((no_op_logits, logits), dim=1) + + return logits + + +class AttnActor(AttentionModelDecoder): + def __init__( + self, + embed_dim: int = 128, + num_heads: int = 8, + env_name: str = "tsp", + context_embedding: nn.Module = None, + dynamic_embedding: nn.Module = None, + 
mask_inner: bool = True, + out_bias_pointer_attn: bool = False, + linear_bias: bool = False, + use_graph_context: bool = True, + check_nan: bool = True, + sdpa_fn: callable = None, + pointer: nn.Module = None, + moe_kwargs: dict = None, + ): + super().__init__( + embed_dim, + num_heads, + env_name, + context_embedding, + dynamic_embedding, + mask_inner, + out_bias_pointer_attn, + linear_bias, + use_graph_context, + check_nan, + sdpa_fn, + pointer, + moe_kwargs, + ) + + def pre_decoder_hook( + self, td: TensorDict, env=None, hidden: Any = None, num_starts: int = 0 + ) -> Tuple[TensorDict, Any]: + cache = self._precompute_cache(hidden, num_starts=num_starts) + return td, env, (cache,) + + +class L2DAttnActor(AttnActor): + def __init__( + self, + embed_dim: int = 128, + num_heads: int = 8, + env_name: str = "jssp", + scaling_factor: int = 1000, + stepwise: bool = False, + ): + context_embedding = SchedulingContext(embed_dim, scaling_factor=scaling_factor) + if stepwise: + # in a stepwise encoding setting, the embeddings contain all current information + dynamic_embedding = None + else: + # otherwise we might want to update the static embeddings using dynamic updates + dynamic_embedding = JSSPDynamicEmbedding( + embed_dim, scaling_factor=scaling_factor + ) + pointer = L2DAttnPointer(env_name, embed_dim, num_heads, check_nan=False) + + super().__init__( + embed_dim=embed_dim, + num_heads=num_heads, + env_name=env_name, + context_embedding=context_embedding, + dynamic_embedding=dynamic_embedding, + pointer=pointer, + ) + self.dummy = nn.Parameter(torch.rand(1, embed_dim)) + + def _compute_q(self, cached: PrecomputedCache, td: TensorDict): + embeddings = cached.node_embeddings + ma_embs = embeddings["machine_embeddings"] + return self.context_embedding(ma_embs, td) + + def _compute_kvl(self, cached: PrecomputedCache, td: TensorDict): + glimpse_k_stat, glimpse_v_stat, logit_k_stat = ( + gather_by_index(cached.glimpse_key, td["next_op"], dim=1), + 
gather_by_index(cached.glimpse_val, td["next_op"], dim=1), + gather_by_index(cached.logit_key, td["next_op"], dim=1), + ) + # Compute dynamic embeddings and add to static embeddings + glimpse_k_dyn, glimpse_v_dyn, logit_k_dyn = self.dynamic_embedding(td, cached) + glimpse_k = glimpse_k_stat + glimpse_k_dyn + glimpse_v = glimpse_v_stat + glimpse_v_dyn + logit_k = logit_k_stat + logit_k_dyn + + no_ops = self.dummy.unsqueeze(1).expand(td.size(0), 1, -1).to(logit_k) + logit_k = torch.cat((no_ops, logit_k), dim=1) + + return glimpse_k, glimpse_v, logit_k + + def _precompute_cache(self, embeddings: Tuple[torch.Tensor, torch.Tensor], **kwargs): + ops_emb, ma_emb = embeddings + + ( + glimpse_key_fixed, + glimpse_val_fixed, + logit_key, + ) = self.project_node_embeddings( + ops_emb + ).chunk(3, dim=-1) + + embeddings = TensorDict( + {"op_embeddings": ops_emb, "machine_embeddings": ma_emb}, + batch_size=ops_emb.size(0), + ) + # Organize in a dataclass for easy access + return PrecomputedCache( + node_embeddings=embeddings, + graph_context=0, + glimpse_key=glimpse_key_fixed, + glimpse_val=glimpse_val_fixed, + logit_key=logit_key, + ) diff --git a/rl4co/models/zoo/l2d/encoder.py b/rl4co/models/zoo/l2d/encoder.py new file mode 100644 index 00000000..0bc43fa9 --- /dev/null +++ b/rl4co/models/zoo/l2d/encoder.py @@ -0,0 +1,26 @@ +from rl4co.models.nn.env_embeddings.init import JSSPInitEmbedding +from rl4co.models.nn.graph.gcn import GCNEncoder +from rl4co.utils.ops import adj_to_pyg_edge_index + + +class GCN4JSSP(GCNEncoder): + def __init__( + self, + embed_dim: int, + num_layers: int, + init_embedding=None, + **init_embedding_kwargs, + ): + def edge_idx_fn(td, _): + return adj_to_pyg_edge_index(td["adjacency"]) + + if init_embedding is None: + init_embedding = JSSPInitEmbedding(embed_dim, **init_embedding_kwargs) + + super().__init__( + env_name="jssp", + embed_dim=embed_dim, + num_layers=num_layers, + edge_idx_fn=edge_idx_fn, + init_embedding=init_embedding, + ) diff --git 
a/rl4co/models/zoo/l2d/model.py b/rl4co/models/zoo/l2d/model.py new file mode 100644 index 00000000..b70784b1 --- /dev/null +++ b/rl4co/models/zoo/l2d/model.py @@ -0,0 +1,69 @@ +from typing import Union + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl import REINFORCE, StepwisePPO +from rl4co.models.rl.reinforce.baselines import REINFORCEBaseline + +from .policy import L2DPolicy, L2DPolicy4PPO + + +class L2DPPOModel(StepwisePPO): + """Learning2Dispatch model by Zhang et al. (2020): + 'Learning to Dispatch for Job Shop Scheduling via Deep Reinforcement Learning' + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + baseline: REINFORCE baseline. Defaults to rollout (1 epoch of exponential, then greedy rollout baseline) + policy_kwargs: Keyword arguments for policy + baseline_kwargs: Keyword arguments for baseline + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: L2DPolicy = None, + policy_kwargs={}, + **kwargs, + ): + assert env.name in [ + "fjsp", + "jssp", + ], "L2DModel currently only works for Job-Shop Scheduling Problems" + if policy is None: + policy = L2DPolicy4PPO(env_name=env.name, **policy_kwargs) + + super().__init__(env, policy, **kwargs) + + +class L2DModel(REINFORCE): + """Learning2Dispatch model by Zhang et al. (2020): + 'Learning to Dispatch for Job Shop Scheduling via Deep Reinforcement Learning' + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + baseline: REINFORCE baseline. 
class L2DPolicy(AutoregressivePolicy):
    """Autoregressive Learning2Dispatch (L2D) policy.

    When no encoder / decoder is supplied, defaults are built from the arguments:

    - encoder: `NoEncoder` if `stepwise_encoding` is set; `HetGNNEncoder` for "fjsp"
      (or for "jssp" with `het_emb=True`); `GCN4JSSP` otherwise.
    - decoder: an `L2DDecoder`.

    Args:
        encoder: Encoder to use. Built as described above when None
        decoder: Decoder to use. An `L2DDecoder` is built when None
        embed_dim: Embedding dimension; also used as `actor_hidden_dim` of the default decoder
        num_encoder_layers: Number of layers of the default encoder
        env_name: Name of the environment
        het_emb: Selects `HetGNNEncoder` over `GCN4JSSP` for "jssp"; forwarded to the default decoder
        scaling_factor: Forwarded to the default encoder and decoder
        normalization: Normalization type forwarded to the default `HetGNNEncoder` and `L2DDecoder`
        init_embedding: Optional init-embedding module forwarded to the default encoder and decoder
        stepwise_encoding: If True, use `NoEncoder` and build the default decoder with `stepwise=True`
        tanh_clipping: Forwarded to `AutoregressivePolicy`
        train_decode_type: Forwarded to `AutoregressivePolicy`
        val_decode_type: Forwarded to `AutoregressivePolicy`
        test_decode_type: Forwarded to `AutoregressivePolicy`
        **constructive_policy_kw: Extra keyword arguments; a warning is logged when
            any are given, and they are forwarded to `AutoregressivePolicy`
    """

    def __init__(
        self,
        encoder: Optional[AutoregressiveEncoder] = None,
        decoder: Optional[AutoregressiveDecoder] = None,
        embed_dim: int = 64,
        num_encoder_layers: int = 2,
        env_name: str = "fjsp",
        het_emb: bool = True,
        scaling_factor: int = 1000,
        normalization: str = "batch",
        init_embedding: Optional[nn.Module] = None,
        stepwise_encoding: bool = False,
        tanh_clipping: float = 10,
        train_decode_type: str = "sampling",
        val_decode_type: str = "greedy",
        test_decode_type: str = "multistart_sampling",
        **constructive_policy_kw,
    ):
        if len(constructive_policy_kw) > 0:
            # `Logger.warn` is a deprecated alias; `warning` is the supported method
            log.warning(f"Unused kwargs: {constructive_policy_kw}")

        if encoder is None:
            if stepwise_encoding:
                encoder = NoEncoder()
            elif env_name == "fjsp" or (env_name == "jssp" and het_emb):
                encoder = HetGNNEncoder(
                    env_name=env_name,
                    embed_dim=embed_dim,
                    num_layers=num_encoder_layers,
                    # honour the caller's choice (default is still "batch") so that
                    # encoder and decoder are configured consistently
                    normalization=normalization,
                    init_embedding=init_embedding,
                    scaling_factor=scaling_factor,
                )
            else:
                encoder = GCN4JSSP(
                    embed_dim,
                    num_encoder_layers,
                    init_embedding=init_embedding,
                    scaling_factor=scaling_factor,
                )

        # The decoder generates logits given the current td and heatmap
        if decoder is None:
            decoder = L2DDecoder(
                env_name=env_name,
                embed_dim=embed_dim,
                actor_hidden_dim=embed_dim,
                num_encoder_layers=num_encoder_layers,
                init_embedding=init_embedding,
                het_emb=het_emb,
                stepwise=stepwise_encoding,
                scaling_factor=scaling_factor,
                normalization=normalization,
            )

        # Pass to constructive policy
        super().__init__(
            encoder=encoder,
            decoder=decoder,
            env_name=env_name,
            tanh_clipping=tanh_clipping,
            train_decode_type=train_decode_type,
            val_decode_type=val_decode_type,
            test_decode_type=test_decode_type,
            **constructive_policy_kw,
        )
class L2DPolicy4PPO(L2DPolicy):
    """L2D policy variant for stepwise PPO: an `L2DPolicy` built with
    `stepwise_encoding=True` plus a critic (value head).

    Args:
        encoder: Forwarded to `L2DPolicy`; the resulting `self.encoder` must be a `NoEncoder`
        decoder: Forwarded to `L2DPolicy`
        critic: Value head. When None, an `MLP` with a single output is created
        embed_dim: Embedding dimension; also sizes the default critic
        num_encoder_layers: Forwarded to `L2DPolicy`
        env_name: Name of the environment
        het_emb: Forwarded to `L2DPolicy`; together with `env_name` it decides the
            input width of the default critic
        scaling_factor: Forwarded to `L2DPolicy`
        init_embedding: Forwarded to `L2DPolicy`
        tanh_clipping: Forwarded to `L2DPolicy`
        train_decode_type: Forwarded to `L2DPolicy`
        val_decode_type: Forwarded to `L2DPolicy`
        test_decode_type: Forwarded to `L2DPolicy`
        **constructive_policy_kw: Forwarded to `L2DPolicy`
    """

    def __init__(
        self,
        encoder=None,
        decoder=None,
        critic=None,
        embed_dim: int = 64,
        num_encoder_layers: int = 2,
        env_name: str = "fjsp",
        het_emb: bool = True,
        scaling_factor: int = 1000,
        init_embedding=None,
        tanh_clipping: float = 10,
        train_decode_type: str = "sampling",
        val_decode_type: str = "greedy",
        test_decode_type: str = "multistart_sampling",
        **constructive_policy_kw,
    ):
        # TODO PPO specific init emb? (currently `init_embedding` is forwarded as given)
        super().__init__(
            encoder=encoder,
            decoder=decoder,
            embed_dim=embed_dim,
            num_encoder_layers=num_encoder_layers,
            env_name=env_name,
            het_emb=het_emb,
            scaling_factor=scaling_factor,
            init_embedding=init_embedding,
            stepwise_encoding=True,
            tanh_clipping=tanh_clipping,
            train_decode_type=train_decode_type,
            val_decode_type=val_decode_type,
            test_decode_type=test_decode_type,
            **constructive_policy_kw,
        )

        if critic is None:
            # two pooled embeddings are concatenated in the heterogeneous case
            # (see `evaluate`), hence the doubled input width
            critic_in = 2 * embed_dim if (env_name == "fjsp" or het_emb) else embed_dim
            critic = MLP(critic_in, 1, num_neurons=[embed_dim] * 2)

        self.critic = critic
        assert isinstance(
            self.encoder, NoEncoder
        ), "Define a feature extractor for decoder rather than an encoder in stepwise PPO"

    def evaluate(self, td):
        """Score the actions stored in `td["action"]`.

        Returns:
            Tuple of (log-probabilities of the stored actions, critic value
            prediction, entropy of the action distribution).
        """
        # features come from the decoder's feature extractor (no separate encoder here)
        hidden, _ = self.decoder.feature_extractor(td)

        # mean-pool every embedding over dim -2 and concatenate them for the critic
        embeddings = (hidden,) if isinstance(hidden, torch.Tensor) else hidden
        h_pooled = torch.cat([emb.mean(dim=-2) for emb in embeddings], dim=-1)
        value_pred = self.critic(h_pooled)

        # pre decoder / actor hook, then the actor itself
        td, _, hidden = self.decoder.actor.pre_decoder_hook(
            td, None, hidden, num_starts=0
        )
        logits, mask = self.decoder.actor(td, *hidden)

        # log-probs of the taken actions and entropy of the full distribution
        logprobs = process_logits(logits, mask, tanh_clipping=self.tanh_clipping)
        action_logprobs = gather_by_index(logprobs, td["action"], dim=1)
        dist_entropys = Categorical(logprobs.exp()).entropy()

        return action_logprobs, value_pred, dist_entropys

    def act(self, td, env, phase: str = "train"):
        """Select one action for the current state and write it to `td["action"]`.

        In the "train" phase the action is sampled and its log-probability is stored
        in `td["logprobs"]`; in every other phase the action is picked greedily.
        """
        logits, mask = self.decoder(td, hidden=None, num_starts=0)
        logprobs = process_logits(logits, mask, tanh_clipping=self.tanh_clipping)

        if phase == "train":
            # DRL-S, sampling actions following \pi
            chosen = DecodingStrategy.sampling(logprobs)
            td["logprobs"] = gather_by_index(logprobs, chosen, dim=1)
        else:
            # DRL-G, greedily picking actions with the maximum probability
            chosen = DecodingStrategy.greedy(logprobs)

        td["action"] = chosen
        return td

    @torch.no_grad()
    def generate(self, td, env=None, phase: str = "train", **kwargs) -> dict:
        """Run the inherited policy call without gradients (non-training phases only)."""
        assert phase != "train", "dont use generate() in training mode"
        # the decorator already disables gradient tracking for the whole call
        return super().__call__(td, env, phase=phase, **kwargs)
class MatNetFFSPDecoder(AttentionModelDecoder):
    """Attention-model decoder configured for the "ffsp" environment.

    Uses an `FFSPContext` context embedding and holds a learnable `no_job_emb`
    that is appended to the job embeddings when the cache is precomputed.
    """

    def __init__(
        self,
        embed_dim: int,
        num_heads: int,
        linear_bias: bool = False,
        out_bias_pointer_attn: bool = True,
        use_graph_context: bool = False,
        **kwargs,
    ):
        super().__init__(
            env_name="ffsp",
            embed_dim=embed_dim,
            num_heads=num_heads,
            context_embedding=FFSPContext(embed_dim),
            out_bias_pointer_attn=out_bias_pointer_attn,
            linear_bias=linear_bias,
            use_graph_context=use_graph_context,
            **kwargs,
        )

        # extra embedding appended after the real jobs in `_precompute_cache`
        self.no_job_emb = nn.Parameter(torch.rand(1, 1, embed_dim), requires_grad=True)

    def _precompute_cache(self, embeddings: Tuple[Tensor, Tensor], **kwargs):
        """Build the `PrecomputedCache` from the (job, machine) embeddings."""
        job_emb, ma_emb = embeddings
        bs, _, emb_dim = job_emb.shape

        # append the "no job" embedding along dim 1
        no_job = self.no_job_emb.expand((bs, 1, emb_dim))
        job_emb_plus_one = torch.cat((job_emb, no_job), dim=1)

        projected = self.project_node_embeddings(job_emb_plus_one)
        glimpse_key_fixed, glimpse_val_fixed, logit_key = projected.chunk(3, dim=-1)

        # Optionally disable the graph context from the initial embedding as done in POMO
        graph_context = 0
        if self.use_graph_context:
            graph_context = self.project_fixed_context(job_emb_plus_one.mean(1))

        node_embeddings = TensorDict(
            {"job_embeddings": job_emb_plus_one, "machine_embeddings": ma_emb},
            batch_size=bs,
        )

        # Organize in a dataclass for easy access
        return PrecomputedCache(
            node_embeddings=node_embeddings,
            graph_context=graph_context,
            glimpse_key=glimpse_key_fixed,
            glimpse_val=glimpse_val_fixed,
            logit_key=logit_key,
        )
class MixedScoresSDPA(nn.Module):
    """Scaled dot-product attention with the MatNet scores mixer.

    The dot-product attention score of every (query, key) pair is concatenated
    with `num_scores` external scores taken from `dmat` and passed through a small
    per-head two-layer MLP (`mix_W1`/`mix_b1` -> ReLU -> `mix_W2`/`mix_b2`) that
    yields the final attention score.

    Args:
        num_heads: Number of attention heads
        num_scores: Number of external scores per (row, column) pair in `dmat`
        mixer_hidden_dim: Hidden width of the per-head mixer MLP
        mix1_init: Bound of the uniform init of the first mixer layer
        mix2_init: Bound of the uniform init of the second mixer layer
    """

    def __init__(
        self,
        num_heads: int,
        num_scores: int = 1,
        mixer_hidden_dim: int = 16,
        mix1_init: float = (1 / 2) ** (1 / 2),
        mix2_init: float = (1 / 16) ** (1 / 2),
    ):
        super().__init__()
        self.num_heads = num_heads
        self.num_scores = num_scores

        # Sampling order (W1, b1, W2, b2) is kept so seeded initialisation is unchanged
        mix1 = torch.distributions.Uniform(low=-mix1_init, high=mix1_init)
        mix_W1 = mix1.sample((num_heads, self.num_scores + 1, mixer_hidden_dim))
        mix_b1 = mix1.sample((num_heads, mixer_hidden_dim))
        self.mix_W1 = nn.Parameter(mix_W1)
        self.mix_b1 = nn.Parameter(mix_b1)

        mix2 = torch.distributions.Uniform(low=-mix2_init, high=mix2_init)
        mix_W2 = mix2.sample((num_heads, mixer_hidden_dim, 1))
        mix_b2 = mix2.sample((num_heads, 1))
        self.mix_W2 = nn.Parameter(mix_W2)
        self.mix_b2 = nn.Parameter(mix_b2)

    def forward(self, q, k, v, attn_mask=None, dmat=None, dropout_p=0.0):
        """Scaled Dot-Product Attention with MatNet Scores Mixer

        Args:
            q: Queries; presumably [b, h, m, d] given the score shape below
            k: Keys; presumably [b, h, n, d]
            v: Values; presumably [b, h, n, d]
            attn_mask: Optional mask broadcastable to [b, h, m, n]. A boolean mask
                marks the positions that may be attended (True = keep); any other
                dtype is added to the scores. The tensor is never modified
            dmat: External scores, reshaped to [b, m, n, num_scores]. Required
            dropout_p: Dropout probability applied to the attention weights
                whenever it is > 0

        Returns:
            Attention output `softmax(mixed_scores) @ v`
        """
        assert dmat is not None
        b, m, n = dmat.shape[:3]
        dmat = dmat.reshape(b, m, n, self.num_scores)

        # Calculate scaled dot product
        attn_scores = torch.matmul(q, k.transpose(-2, -1)) / (k.size(-1) ** 0.5)
        # [b, h, m, n, num_scores+1]
        mix_attn_scores = torch.cat(
            [
                attn_scores.unsqueeze(-1),
                dmat[:, None, ...].expand(b, self.num_heads, m, n, self.num_scores),
            ],
            dim=-1,
        )

        # Per-head mixer MLP; heads are moved next to the matrix dims for the matmul
        # [b, m, h, n, mixer_hidden_dim]
        hidden = F.relu(
            torch.matmul(mix_attn_scores.transpose(1, 2), self.mix_W1)
            + self.mix_b1[None, None, :, None, :]
        )
        # [b, m, h, n, 1]
        mixed = torch.matmul(hidden, self.mix_W2) + self.mix_b2[None, None, :, None, :]
        # [b, h, m, n]
        attn_scores = mixed.transpose(1, 2).squeeze(-1)

        # Apply the provided attention mask
        if attn_mask is not None:
            if attn_mask.dtype == torch.bool:
                # A row without any attendable key would softmax over -inf only and
                # produce NaNs, so such rows attend to everything. Done out-of-place:
                # the caller's mask may be reused (e.g. by other layers).
                attn_mask = attn_mask | ~attn_mask.any(-1, keepdim=True)
                attn_scores = attn_scores.masked_fill(~attn_mask, float("-inf"))
            else:
                attn_scores = attn_scores + attn_mask

        # Softmax to get attention weights
        attn_weights = F.softmax(attn_scores, dim=-1)

        # Apply dropout (same contract as before: active whenever dropout_p > 0,
        # the caller is expected to pass 0.0 outside of training)
        if dropout_p > 0.0:
            attn_weights = F.dropout(attn_weights, p=dropout_p)

        # Compute the weighted sum of values
        return torch.matmul(attn_weights, v)
class MatNetMHA(nn.Module):
    """Pair of MatNet cross-attention blocks: rows attend to columns and columns
    attend to rows, both starting from the same input embeddings."""

    def __init__(self, embed_dim: int, num_heads: int, bias: bool = False):
        super().__init__()
        self.row_encoding_block = MatNetCrossMHA(embed_dim, num_heads, bias)
        self.col_encoding_block = MatNetCrossMHA(embed_dim, num_heads, bias)

    def forward(self, row_emb, col_emb, dmat, attn_mask=None):
        """
        Args:
            row_emb (Tensor): [b, m, d]
            col_emb (Tensor): [b, n, d]
            dmat (Tensor): [b, m, n]
            attn_mask (Tensor, optional): mask for the row -> column direction; its
                transpose over the last two dims is used for the other direction

        Returns:
            Updated row_emb (Tensor): [b, m, d]
            Updated col_emb (Tensor): [b, n, d]
        """
        # the column block sees everything transposed: dmat as well as the mask
        if attn_mask is None:
            mask_for_cols = None
        else:
            mask_for_cols = attn_mask.transpose(-2, -1)

        new_rows = self.row_encoding_block(
            row_emb, col_emb, dmat=dmat, cross_attn_mask=attn_mask
        )
        new_cols = self.col_encoding_block(
            col_emb,
            row_emb,
            dmat=dmat.transpose(-2, -1),
            cross_attn_mask=mask_for_cols,
        )
        return new_rows, new_cols
class MatNetEncoder(nn.Module):
    """Stack of `MatNetLayer`s applied on top of an initial (row, column) embedding.

    Args:
        embed_dim: Embedding dimension
        num_heads: Number of attention heads per layer
        num_layers: Number of `MatNetLayer`s
        normalization: Normalization type passed to every layer
        feedforward_hidden: Hidden size of the feed-forward part of every layer
        init_embedding: Callable mapping `td` to `(row_emb, col_emb, dmat)`. When
            None, the "matnet" init embedding is created via `env_init_embedding`
        init_embedding_kwargs: Extra arguments for the default init embedding
        bias: Whether the attention projections use a bias
        mask_non_neighbors: If True and no mask is passed to `forward`, attention is
            restricted to the non-zero entries of `dmat`
    """

    def __init__(
        self,
        embed_dim: int = 256,
        num_heads: int = 16,
        num_layers: int = 3,
        normalization: str = "batch",
        feedforward_hidden: int = 512,
        init_embedding: nn.Module = None,
        init_embedding_kwargs: dict = {},
        bias: bool = False,
        mask_non_neighbors: bool = False,
    ):
        super().__init__()

        if init_embedding is None:
            embedding_cfg = {"embed_dim": embed_dim, **init_embedding_kwargs}
            init_embedding = env_init_embedding("matnet", embedding_cfg)

        self.init_embedding = init_embedding
        self.mask_non_neighbors = mask_non_neighbors

        self.layers = nn.ModuleList()
        for _ in range(num_layers):
            self.layers.append(
                MatNetLayer(
                    embed_dim=embed_dim,
                    num_heads=num_heads,
                    bias=bias,
                    feedforward_hidden=feedforward_hidden,
                    normalization=normalization,
                )
            )

    def forward(self, td, attn_mask: torch.Tensor = None):
        """Encode `td` and return `((row_emb, col_emb), None)`.

        The second element is always None; it only exists to match the output
        signature expected by the AR policy class.
        """
        rows, cols, dmat = self.init_embedding(td)

        use_neighbor_mask = self.mask_non_neighbors and attn_mask is None
        if use_neighbor_mask:
            # attn_mask (keep 1s discard 0s) to only attend on neighborhood
            attn_mask = dmat.ne(0)

        for block in self.layers:
            rows, cols = block(rows, cols, dmat, attn_mask)

        return (rows, cols), None
class EfficientMixedScoreMultiHeadAttention(nn.Module):
    """Bidirectional cross-attention between two sets with one shared score matrix.

    `x1` provides the queries (and the values `v1`), `x2` the keys (and the values
    `v2`). The score matrix is computed once and used in both directions: as is for
    x1 -> x2 and transposed for x2 -> x1. When a cost matrix is given, the
    dot-product scores are mixed with it through `MixedScoreFF`.

    Args:
        embed_dim: Embedding dimension; split evenly across `num_heads`
        num_heads: Number of attention heads
        bias: Whether the linear projections use a bias
    """

    def __init__(self, embed_dim: int, num_heads: int, bias: bool = False):
        super().__init__()

        qkv_dim = embed_dim // num_heads

        self.num_heads = num_heads
        self.qkv_dim = qkv_dim
        self.norm_factor = 1 / math.sqrt(qkv_dim)

        # joint projections: (query, value) for x1 and (key, value) for x2
        self.Wqv1 = nn.Linear(embed_dim, 2 * embed_dim, bias=bias)
        self.Wkv2 = nn.Linear(embed_dim, 2 * embed_dim, bias=bias)

        self.mixed_scores_layer = MixedScoreFF(num_heads, qkv_dim, bias)

        self.out_proj1 = nn.Linear(embed_dim, embed_dim, bias=bias)
        self.out_proj2 = nn.Linear(embed_dim, embed_dim, bias=bias)

    def forward(self, x1, x2, attn_mask=None, cost_mat=None):
        """
        Args:
            x1: First set of embeddings; `x1.size(-2)` is the row count
            x2: Second set of embeddings; `x2.size(-2)` is the column count
            attn_mask: Optional boolean mask (True = keep), viewed as
                (batch, 1, row_cnt, col_cnt)
            cost_mat: Optional cost matrix, indexed as (batch, row_cnt, col_cnt)

        Returns:
            Tuple `(h1, h2)`: updated representations for `x1` and `x2`
        """
        batch_size = x1.size(0)
        row_cnt = x1.size(-2)
        col_cnt = x2.size(-2)

        # Project x1 to query and value
        q, v1 = rearrange(
            self.Wqv1(x1), "b s (two h d) -> two b h s d", two=2, h=self.num_heads
        ).unbind(dim=0)

        # Project x2 to key and value.
        # NOTE: this previously reused `Wqv1`, which left `Wkv2` without any use (and
        # without gradient). Checkpoints trained with the old projection will produce
        # different outputs and need fine-tuning or retraining.
        k, v2 = rearrange(
            self.Wkv2(x2), "b s (two h d) -> two b h s d", two=2, h=self.num_heads
        ).unbind(dim=0)

        # shape: (batch, num_heads, row_cnt, col_cnt)
        dot = self.norm_factor * torch.matmul(q, k.transpose(-2, -1))

        if cost_mat is not None:
            # shape: (batch, num_heads, row_cnt, col_cnt)
            cost_mat_score = cost_mat[:, None, :, :].expand_as(dot)
            dot = self.mixed_scores_layer(dot, cost_mat_score)

        if attn_mask is not None:
            attn_mask = attn_mask.view(batch_size, 1, row_cnt, col_cnt).expand_as(dot)
            dot.masked_fill_(~attn_mask, float("-inf"))

        # same scores for both directions, transposed for the x2 -> x1 update
        h1 = self.out_proj1(apply_weights_and_combine(dot, v2))
        h2 = self.out_proj2(apply_weights_and_combine(dot.transpose(-2, -1), v1))

        return h1, h2
class Encoder(nn.Module):
    """Stack of `EncoderLayer`s over operation and machine embeddings.

    Args:
        embed_dim: Embedding dimension (also stored as `d_model`)
        num_heads: Number of attention heads per layer
        num_layers: Number of `EncoderLayer`s
        normalization: Normalization type passed to every layer
        feedforward_hidden: Hidden size of the feed-forward part of every layer
        init_embedding: Callable mapping `td` to `(ops_embed, ma_embed, edge_feat)`.
            When None, the "matnet" init embedding is created via `env_init_embedding`
        init_embedding_kwargs: Extra arguments for the default init embedding
        bias: Whether the attention projections use a bias
    """

    def __init__(
        self,
        embed_dim: int = 256,
        num_heads: int = 16,
        num_layers: int = 5,
        normalization: str = "batch",
        feedforward_hidden: int = 512,
        init_embedding: nn.Module = None,
        init_embedding_kwargs: dict = {},
        bias: bool = False,
    ):
        super().__init__()
        self.d_model = embed_dim

        if init_embedding is None:
            embedding_cfg = {"embed_dim": embed_dim, **init_embedding_kwargs}
            init_embedding = env_init_embedding("matnet", embedding_cfg)
        self.init_embedding = init_embedding

        self.layers = nn.ModuleList()
        for _ in range(num_layers):
            self.layers.append(
                EncoderLayer(
                    embed_dim=embed_dim,
                    num_heads=num_heads,
                    feedforward_hidden=feedforward_hidden,
                    normalization=normalization,
                    bias=bias,
                )
            )

    def forward(self, td, attn_mask: torch.Tensor = None):
        """Encode `td` and return `((ops_embed, ma_embed), None)`.

        `attn_mask` is accepted but not used; the only mask applied is the inverted
        `td["pad_mask"]`, if that key is present.
        """
        ops, machines, edge_feat = self.init_embedding(td)

        try:
            pad_mask = td["pad_mask"]
        except KeyError:
            op_mask = None
        else:
            # mask padded ops; shape=(bs, ops)
            op_mask = ~pad_mask

        for block in self.layers:
            ops, machines = block(
                ops,
                machines,
                cost_mat=edge_feat,
                op_mask=op_mask,  # mask padded operations in attention
                ma_mask=None,  # no padding for machines
                cross_mask=None,
            )

        return (ops, machines), None
class MatNetPolicy(AutoregressivePolicy):
    """MatNet Policy from Kwon et al., 2021.
    Reference: https://arxiv.org/abs/2106.11113

    Warning:
        This implementation is under development and subject to change.

    Args:
        env_name: Name of the environment used to initialize embeddings. "ffsp"
            selects `MatNetFFSPDecoder`, every other name `MatNetDecoder`; an error
            is logged (but nothing is raised) for names other than "atsp" / "ffsp"
        embed_dim: Dimension of the node embeddings
        num_encoder_layers: Number of layers in the encoder
        num_heads: Number of heads in the attention layers
        normalization: Normalization type in the attention layers
        init_embedding_kwargs: Keyword arguments for the encoder's init embedding.
            Defaults to `{"mode": "RandomOneHot"}` when None
        use_graph_context: Forwarded to the decoder
        bias: Forwarded to the encoder
        **kwargs: keyword arguments passed to the `AutoregressivePolicy`

    Default parameters are adopted from the original implementation.
    """

    def __init__(
        self,
        env_name: str = "atsp",
        embed_dim: int = 256,
        num_encoder_layers: int = 5,
        num_heads: int = 16,
        normalization: str = "instance",
        init_embedding_kwargs: dict = None,
        use_graph_context: bool = False,
        bias: bool = False,
        **kwargs,
    ):
        if init_embedding_kwargs is None:
            # built per call: a dict literal in the signature would be one object
            # shared by every policy instance
            init_embedding_kwargs = {"mode": "RandomOneHot"}

        if env_name not in ["atsp", "ffsp"]:
            log.error(f"env_name {env_name} is not originally implemented in MatNet")

        # NOTE: the decoder is created before the encoder, as before, so that seeded
        # parameter initialisation stays reproducible
        if env_name == "ffsp":
            decoder = MatNetFFSPDecoder(
                embed_dim=embed_dim,
                num_heads=num_heads,
                use_graph_context=use_graph_context,
                out_bias=True,
            )
        else:
            decoder = MatNetDecoder(
                env_name=env_name,
                embed_dim=embed_dim,
                num_heads=num_heads,
                use_graph_context=use_graph_context,
            )

        encoder = MatNetEncoder(
            embed_dim=embed_dim,
            num_heads=num_heads,
            num_layers=num_encoder_layers,
            normalization=normalization,
            init_embedding_kwargs=init_embedding_kwargs,
            bias=bias,
        )

        super().__init__(
            env_name=env_name,
            encoder=encoder,
            decoder=decoder,
            embed_dim=embed_dim,
            num_encoder_layers=num_encoder_layers,
            num_heads=num_heads,
            normalization=normalization,
            **kwargs,
        )
This requires the 'while not td["done"].all()'-loop to be on policy level + (instead of decoder level).""" + + def __init__( + self, + stage_cnt: int, + embed_dim: int = 512, + num_heads: int = 16, + num_encoder_layers: int = 5, + use_graph_context: bool = False, + normalization: str = "instance", + feedforward_hidden: int = 512, + bias: bool = False, + train_decode_type: str = "sampling", + val_decode_type: str = "sampling", + test_decode_type: str = "sampling", + ): + super().__init__() + self.stage_cnt = stage_cnt + + self.encoders: List[MatNetEncoder] = nn.ModuleList( + [ + MatNetEncoder( + embed_dim=embed_dim, + num_heads=num_heads, + num_layers=num_encoder_layers, + normalization=normalization, + feedforward_hidden=feedforward_hidden, + bias=bias, + init_embedding_kwargs={"mode": "RandomOneHot"}, + ) + for _ in range(self.stage_cnt) + ] + ) + self.decoders: List[MultiStageFFSPDecoder] = nn.ModuleList( + [ + MultiStageFFSPDecoder(embed_dim, num_heads, use_graph_context) + for _ in range(self.stage_cnt) + ] + ) + + self.train_decode_type = train_decode_type + self.val_decode_type = val_decode_type + self.test_decode_type = test_decode_type + + def pre_forward(self, td: TensorDict, env: FFSPEnv, num_starts: int): + run_time_list = td["run_time"].chunk(env.num_stage, dim=-1) + for stage_idx in range(self.stage_cnt): + td["cost_matrix"] = run_time_list[stage_idx] + encoder = self.encoders[stage_idx] + embeddings, _ = encoder(td) + decoder = self.decoders[stage_idx] + decoder._precompute_cache(embeddings) + + if num_starts > 1: + # repeat num_start times + td = batchify(td, num_starts) + # update machine idx and action mask + td = env.pre_step(td) + + return td + + def forward( + self, + td: TensorDict, + env: FFSPEnv, + phase="train", + num_starts=1, + return_actions: bool = True, + **decoder_kwargs, + ): + assert not env.flatten_stages, "Multistage model only supports unflattened env" + assert num_starts <= factorial(env.num_machine) + + # Get decode type 
depending on phase + decode_type = getattr(self, f"{phase}_decode_type") + device = td.device + + td = self.pre_forward(td, env, num_starts) + + # NOTE: this must come after pre_forward due to batchify op + batch_size = td.size(0) + logp_list = torch.zeros(size=(batch_size, 0), device=device) + action_list = [] + + while not td["done"].all(): + action_stack = torch.empty( + size=(batch_size, self.stage_cnt), dtype=torch.long, device=device + ) + logp_stack = torch.empty(size=(batch_size, self.stage_cnt), device=device) + + for stage_idx in range(self.stage_cnt): + decoder = self.decoders[stage_idx] + action, logp = decoder(td, decode_type, num_starts, **decoder_kwargs) + action_stack[:, stage_idx] = action + logp_stack[:, stage_idx] = logp + + gathering_index = td["stage_idx"][:, None] + # shape: (batch, 1) + action = action_stack.gather(dim=1, index=gathering_index).squeeze(dim=1) + logp = logp_stack.gather(dim=1, index=gathering_index).squeeze(dim=1) + # shape: (batch) + action_list.append(action) + # transition + td.set("action", action) + td = env.step(td)["next"] + + logp_list = torch.cat((logp_list, logp[:, None]), dim=1) + + out = { + "reward": td["reward"], + "log_likelihood": logp_list.sum(1), + } + + if return_actions: + out["actions"] = torch.stack(action_list, 1) + + return out diff --git a/rl4co/models/zoo/mdam/__init__.py b/rl4co/models/zoo/mdam/__init__.py new file mode 100644 index 00000000..2b7a14da --- /dev/null +++ b/rl4co/models/zoo/mdam/__init__.py @@ -0,0 +1,2 @@ +from .model import MDAM +from .policy import MDAMPolicy diff --git a/rl4co/models/zoo/mdam/decoder.py b/rl4co/models/zoo/mdam/decoder.py new file mode 100644 index 00000000..7764fc12 --- /dev/null +++ b/rl4co/models/zoo/mdam/decoder.py @@ -0,0 +1,331 @@ +import math + +from dataclasses import dataclass +from typing import Union + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from tensordict import TensorDict + +from rl4co.envs import RL4COEnvBase +from 
# ---- rl4co/models/zoo/mdam/decoder.py ----


@dataclass
class PrecomputedCache:
    """Projections of the encoder output computed once per path by ``_precompute``."""

    # Encoder output the other fields were derived from.
    node_embeddings: torch.Tensor
    # Projected mean node embedding with a singleton step axis inserted.
    graph_context: torch.Tensor
    # Glimpse keys / values after ``_make_heads``:
    # (n_heads, batch_size, num_steps, graph_size, head_dim).
    glimpse_key: torch.Tensor
    glimpse_val: torch.Tensor
    # Keys for the final pointer logits (not split into heads).
    logit_key: torch.Tensor


class MDAMDecoder(nn.Module):
    """Multi-path decoder: ``num_paths`` independent sets of projections decode one instance.

    Args:
        embed_dim: Width of the node embeddings and of every projection layer.
        num_heads: Number of heads used by the glimpse attention.
        num_paths: Number of decoding paths; each path owns its context embedding
            and projection layers.
        env_name: Forwarded to ``env_context_embedding`` / ``env_dynamic_embedding``.
        mask_inner: Mask infeasible nodes inside the glimpse attention
            (requires ``mask_logits``).
        mask_logits: Set the logits of infeasible nodes to ``-inf``.
        eg_step_gap: Every ``eg_step_gap`` steps the node embeddings are recomputed
            through ``encoder.change``.
        tanh_clipping: When positive, logits are squashed to ``[-c, c]`` with tanh.
        shrink_size: Stored on the module; not used by the code in this class.
        train_decode_type: Stored on the module.
        val_decode_type: Stored on the module.
        test_decode_type: Stored on the module.
    """

    def __init__(
        self,
        embed_dim: int = 128,
        num_heads: int = 8,
        num_paths: int = 5,
        env_name: str = "tsp",
        mask_inner: bool = True,
        mask_logits: bool = True,
        eg_step_gap: int = 200,
        tanh_clipping: float = 10.0,
        shrink_size=None,
        train_decode_type: str = "sampling",
        val_decode_type: str = "greedy",
        test_decode_type: str = "greedy",
    ):
        super(MDAMDecoder, self).__init__()
        # Built once (the original constructed this module twice and threw one away).
        self.dynamic_embedding = env_dynamic_embedding(env_name, {"embed_dim": embed_dim})

        self.train_decode_type = train_decode_type
        self.val_decode_type = val_decode_type
        self.test_decode_type = test_decode_type

        self.W_placeholder = nn.Parameter(torch.Tensor(2 * embed_dim))
        # Placeholder should be in range of activations
        self.W_placeholder.data.uniform_(-1, 1)

        # One set of layers per decoding path.
        self.context = nn.ModuleList(
            [
                env_context_embedding(env_name, {"embed_dim": embed_dim})
                for _ in range(num_paths)
            ]
        )
        self.project_node_embeddings = nn.ModuleList(
            [nn.Linear(embed_dim, 3 * embed_dim, bias=False) for _ in range(num_paths)]
        )
        self.project_fixed_context = nn.ModuleList(
            [nn.Linear(embed_dim, embed_dim, bias=False) for _ in range(num_paths)]
        )
        self.project_step_context = nn.ModuleList(
            [nn.Linear(2 * embed_dim, embed_dim, bias=False) for _ in range(num_paths)]
        )
        self.project_out = nn.ModuleList(
            [nn.Linear(embed_dim, embed_dim, bias=False) for _ in range(num_paths)]
        )

        # MHA with Pointer mechanism (https://arxiv.org/abs/1506.03134)
        # NOTE(review): kept as a plain list exactly like the original, so these
        # modules are NOT registered (no parameters in state_dict, not moved by
        # `.to()`), and nothing in this class calls them. Wrapping them in
        # nn.ModuleList would change the checkpoint layout - decide deliberately.
        self.pointer = [
            PointerAttention(
                embed_dim,
                num_heads,
                mask_inner=mask_inner,
            )
            for _ in range(num_paths)
        ]

        self.env_name = env_name
        # `forward` reads this flag in the embedding-glimpse branch, but the
        # original never assigned it (AttributeError once an episode reached
        # `eg_step_gap` steps).
        # NOTE(review): the env list follows the reference MDAM implementation's
        # cvrp/sdvrp split - confirm it is the right set for RL4CO env names.
        self.is_vrp = env_name in ("cvrp", "sdvrp")
        self.mask_inner = mask_inner
        self.mask_logits = mask_logits
        self.num_heads = num_heads
        self.num_paths = num_paths
        self.eg_step_gap = eg_step_gap
        self.tanh_clipping = tanh_clipping
        self.shrink_size = shrink_size

    def forward(
        self,
        td: "TensorDict",
        encoded_inputs: torch.Tensor,
        env: "Union[str, RL4COEnvBase]",
        attn,
        V,
        h_old,
        encoder,  # note: used because of different paths, could be better modularized
        **decoder_kwargs,
    ):
        """Roll out every decoding path and compute the path-diversity (KL) term.

        Args:
            td: Initial state; cloned once per path so paths do not share state.
            encoded_inputs: Node embeddings produced by the encoder.
            env: Environment object; ``step`` and ``get_reward`` are called on it.
            attn: Attention weights of the encoder's last layer (for ``encoder.change``).
            V: Value tensor of the encoder's last layer (for ``encoder.change``).
            h_old: Input of the encoder's last attention layer (for ``encoder.change``).
            encoder: Object providing ``change(attn, V, h_old, mask)``.
            **decoder_kwargs: Must contain ``decode_type``.

        Returns:
            Tuple ``(reward, log_likelihood, loss_kl_divergence, actions)``. Rewards and
            log-likelihoods are stacked over paths on dim 1. ``actions`` are those of
            the LAST path only (unchanged from the original implementation).
        """
        # SECTION: Decoder first step: calculate for the decoder divergence loss
        first_step_logprobs = []
        td_list = [td.clone() for _ in range(self.num_paths)]
        for i in range(self.num_paths):
            # Clone the encoded features for this path
            _encoded_inputs = encoded_inputs.clone()

            # Compute keys, values for the glimpse and keys for the logits once as
            # they can be reused in every step
            fixed = self._precompute(_encoded_inputs, path_index=i)
            logprobs, _ = self._get_logprobs(fixed, td_list[i], i)

            # Floor -inf (masked nodes) at -1e9 so the KL term below stays finite.
            first_step_logprobs.append(logprobs[:, 0, :].clamp(min=-1e9))

        # With a single path there is nothing to diverge from; the original left the
        # variable unbound in that case and crashed at the return statement.
        loss_kl_divergence = encoded_inputs.new_zeros(())
        if self.num_paths > 1:
            kl_divergences = []
            for _i in range(self.num_paths):
                for _j in range(self.num_paths):
                    if _i == _j:
                        continue
                    kl_divergence = torch.sum(
                        torch.exp(first_step_logprobs[_i])
                        * (first_step_logprobs[_i] - first_step_logprobs[_j]),
                        -1,
                    )
                    kl_divergences.append(kl_divergence)
            loss_kl_divergence = torch.stack(kl_divergences, 0).mean()

        # SECTION: Decoder rest step: full rollout of every path
        reward_list = []
        ll_list = []
        td_list = [td.clone() for _ in range(self.num_paths)]
        for i in range(self.num_paths):
            # Clone the encoded features for this path
            _encoded_inputs = encoded_inputs.clone()
            _attn = attn.clone()
            _V = V.clone()
            _h_old = h_old.clone()

            outputs, actions = [], []
            fixed = self._precompute(_encoded_inputs, path_index=i)

            j = 0
            mask, mask_first = None, None  # dummy, we get them during the steps
            # The original condition `not (shrink_size is None and done.all())` could
            # never become False when `shrink_size` was set; shrinking is not
            # implemented here, so stop as soon as every instance is done.
            while not td_list[i]["done"].all():
                if j > 1 and j % self.eg_step_gap == 0:
                    # Embedding glimpse: re-encode with attention restricted by mask.
                    # NOTE(review): `mask_first` is never populated (the original had
                    # a bare `pass` placeholder), so the XOR variant for non-VRP envs
                    # cannot run yet; fall back to the current action mask instead of
                    # raising. TODO: modularize / wire up `mask_first`.
                    if self.is_vrp or mask_first is None:
                        mask_attn = mask
                    else:
                        mask_attn = mask ^ mask_first

                    # TODO: decoder
                    _encoded_inputs, _ = encoder.change(_attn, _V, _h_old, mask_attn)
                    fixed = self._precompute(_encoded_inputs, path_index=i)
                logprobs, mask = self._get_logprobs(fixed, td_list[i], i)

                # Select the indices of the next nodes in the sequences, result (batch_size) long
                action = decode_logprobs(
                    logprobs[:, 0, :],
                    mask,
                    decode_type=decoder_kwargs["decode_type"],
                )

                td_list[i].set("action", action)
                td_list[i] = env.step(td_list[i])["next"]

                # Collect output of step
                outputs.append(logprobs[:, 0, :])
                actions.append(action)
                j += 1

            assert len(outputs) > 0, "No outputs were generated, check if envs were done"
            outputs, actions = torch.stack(outputs, 1), torch.stack(actions, 1)
            reward = env.get_reward(td, actions)
            ll = get_log_likelihood(outputs, actions, mask=None)

            reward_list.append(reward)
            ll_list.append(ll)

        reward = torch.stack(reward_list, 1)
        log_likelihood = torch.stack(ll_list, 1)
        return reward, log_likelihood, loss_kl_divergence, actions

    def _precompute(self, embeddings, num_steps=1, path_index=None):
        """Project the node embeddings once for path ``path_index``."""
        # The fixed context projection of the graph embedding is calculated only once for efficiency
        graph_embed = embeddings.mean(1)

        # Fixed context = (batch_size, 1, embed_dim) to make broadcastable with parallel timesteps
        fixed_context = self.project_fixed_context[path_index](graph_embed)[:, None, :]

        # The projection of the node embeddings for the attention is calculated once up front
        (
            glimpse_key_fixed,
            glimpse_val_fixed,
            logit_key_fixed,
        ) = self.project_node_embeddings[path_index](embeddings[:, None, :, :]).chunk(
            3, dim=-1
        )

        return PrecomputedCache(
            node_embeddings=embeddings,
            graph_context=fixed_context,
            glimpse_key=self._make_heads(glimpse_key_fixed, num_steps),
            glimpse_val=self._make_heads(glimpse_val_fixed, num_steps),
            logit_key=logit_key_fixed.contiguous(),
        )

    def _make_heads(self, v, num_steps=None):
        """Split the last dim of ``v`` into heads and move the head axis to the front."""
        assert num_steps is None or v.size(1) == 1 or v.size(1) == num_steps
        return (
            v.contiguous()
            .view(v.size(0), v.size(1), v.size(2), self.num_heads, -1)
            .expand(
                v.size(0),
                v.size(1) if num_steps is None else num_steps,
                v.size(2),
                self.num_heads,
                -1,
            )
            .permute(
                3, 0, 1, 2, 4
            )  # (n_heads, batch_size, num_steps, graph_size, head_dim)
        )

    def _get_logprobs(self, fixed, td, path_index, normalize=True):
        """Score every node for the current step of path ``path_index``.

        Args:
            fixed: ``PrecomputedCache`` for this path.
            td: Current state; ``td["action_mask"]`` is read.
            path_index: Which path's layers to use.
            normalize: If True (default) return log-probabilities (log-softmax of the
                masked logits); if False return the masked, tanh-clipped logits.

        Returns:
            Tuple ``(scores, mask)`` where ``mask`` is ``td["action_mask"]``.
        """
        step_context = self.context[path_index](
            fixed.node_embeddings, td
        )  # [batch, embed_dim]
        glimpse_q = fixed.graph_context + step_context.unsqueeze(1).to(
            fixed.graph_context.device
        )

        # Compute keys and values for the nodes
        (
            glimpse_key_dynamic,
            glimpse_val_dynamic,
            logit_key_dynamic,
        ) = self.dynamic_embedding(td)
        glimpse_k = fixed.glimpse_key + glimpse_key_dynamic
        glimpse_v = fixed.glimpse_val + glimpse_val_dynamic
        logit_k = fixed.logit_key + logit_key_dynamic

        # Compute the action mask
        mask = td["action_mask"]

        # Compute logits (unnormalized logprobs)
        logits, _ = self._one_to_many_logits(
            glimpse_q, glimpse_k, glimpse_v, logit_k, mask, path_index
        )

        # Callers exponentiate these values (KL term) and gather them as action
        # log-likelihoods, so they must be normalised. The original accepted
        # `normalize` but never applied it and returned raw logits.
        if normalize:
            logits = torch.log_softmax(logits, dim=-1)
        return logits, mask

    def _one_to_many_logits(self, query, glimpse_K, glimpse_V, logit_K, mask, path_index):
        """Glimpse attention followed by pointer logits; returns ``(logits, glimpse)``."""
        batch_size, num_steps, embed_dim = query.size()
        key_size = val_size = embed_dim // self.num_heads

        # Compute the glimpse, rearrange dimensions so the dimensions are (n_heads, batch_size, num_steps, 1, key_size)
        glimpse_Q = query.view(
            batch_size, num_steps, self.num_heads, 1, key_size
        ).permute(2, 0, 1, 3, 4)

        # Batch matrix multiplication to compute compatibilities (n_heads, batch_size, num_steps, graph_size)
        compatibility = torch.matmul(glimpse_Q, glimpse_K.transpose(-2, -1)) / math.sqrt(
            glimpse_Q.size(-1)
        )
        if self.mask_inner:
            assert self.mask_logits, "Cannot mask inner without masking logits"
            compatibility[
                ~mask[None, :, None, None, :].expand_as(compatibility)
            ] = -math.inf

        # Batch matrix multiplication to compute heads (n_heads, batch_size, num_steps, val_size)
        heads = torch.matmul(F.softmax(compatibility, dim=-1), glimpse_V)

        # Project to get glimpse/updated context node embedding (batch_size, num_steps, embed_dim)
        glimpse = self.project_out[path_index](
            heads.permute(1, 2, 3, 0, 4)
            .contiguous()
            .view(-1, num_steps, 1, self.num_heads * val_size)
        )

        # Projecting the glimpse is not needed since this can be absorbed into project_out
        final_Q = glimpse

        # Batch matrix multiplication to compute logits (batch_size, num_steps, graph_size)
        logits = torch.matmul(final_Q, logit_K.transpose(-2, -1)).squeeze(-2) / math.sqrt(
            final_Q.size(-1)
        )

        # Clip and mask the logits; normalisation is done by the caller
        if self.tanh_clipping > 0:
            logits = torch.tanh(logits) * self.tanh_clipping
        if self.mask_logits:
            logits[~mask[:, None, :]] = -math.inf

        return logits, glimpse.squeeze(-2)


# ---- rl4co/models/zoo/mdam/encoder.py ----


class MDAMGraphAttentionEncoder(nn.Module):
    """Attention encoder whose last layer exposes its attention weights and values.

    The first ``num_layers - 1`` layers are standard ``MultiHeadAttentionLayer``s; the
    last attention layer is a ``MultiHeadAttentionMDAM`` so that ``change`` can later
    re-weight its attention under a mask.
    """

    def __init__(
        self,
        num_heads,
        embed_dim,
        num_layers,
        node_dim=None,
        normalization="batch",
        feedforward_hidden=512,
        sdpa_fn: Optional[Callable] = None,
    ):
        super(MDAMGraphAttentionEncoder, self).__init__()

        # To map input to embedding space (created here, not applied in `forward`)
        self.init_embed = nn.Linear(node_dim, embed_dim) if node_dim is not None else None

        self.layers = nn.Sequential(
            *(
                MultiHeadAttentionLayer(
                    embed_dim,
                    num_heads,
                    feedforward_hidden,
                    normalization,
                    sdpa_fn=sdpa_fn,
                )
                for _ in range(num_layers - 1)  # because last layer is different
            )
        )
        self.attention_layer = MultiHeadAttentionMDAM(
            embed_dim, num_heads, sdpa_fn=sdpa_fn, last_one=True
        )
        self.BN1 = Normalization(embed_dim, normalization)
        self.projection = SkipConnection(
            nn.Sequential(
                nn.Linear(embed_dim, feedforward_hidden),
                nn.ReLU(),
                nn.Linear(feedforward_hidden, embed_dim),
            )
            if feedforward_hidden > 0
            else nn.Linear(embed_dim, embed_dim)
        )
        self.BN2 = Normalization(embed_dim, normalization)

    def forward(self, x, mask=None, return_transform_loss=False):
        """Encode already-embedded nodes.

        ``mask`` must be None (not supported yet); ``return_transform_loss`` is unused.

        Returns:
            Tuple of five tensors:
            - h [batch_size, graph_size, embed_dim]
            - h.mean(dim=1), the mean of ``h`` over the node axis
            - attn [num_head, batch_size, graph_size, graph_size]
            - V [num_head, batch_size, graph_size, key_dim]
            - h_old [batch_size, graph_size, embed_dim]
        """
        assert mask is None, "TODO mask not yet supported!"

        h_embeded = x
        h_old = self.layers(h_embeded)
        h_new, attn, V = self.attention_layer(h_old)
        h = h_new + h_old
        h = self.BN1(h)
        h = self.projection(h)
        h = self.BN2(h)

        return (h, h.mean(dim=1), attn, V, h_old)

    def change(self, attn, V, h_old, mask):
        """Redo the last layer with attention restricted to nodes where ``mask`` is set.

        Args:
            attn: Attention weights returned by ``forward``.
            V: Value tensor returned by ``forward``.
            h_old: Last-layer input returned by ``forward``.
            mask: Per-node mask viewed as (batch_size, graph_size); entries that are
                zero/False remove the corresponding node as an attention target.

        Returns:
            Tuple ``(h, h.mean(dim=1))``.
        """
        num_heads, batch_size, graph_size, feat_size = V.size()
        # Zero the masked columns (broadcast over heads and query nodes), then
        # renormalise each row; 1e-9 guards rows whose weights all became zero.
        attn = mask.float().view(1, batch_size, 1, graph_size) * attn
        attn = attn / (attn.sum(dim=-1, keepdim=True) + 1e-9)
        heads = torch.matmul(attn, V)

        # Sizes are taken from `V` itself: the attention layer defines `n_heads` and
        # `embed_dim` but no `num_heads` / `val_dim`, which the original code read.
        embed_dim = self.attention_layer.embed_dim
        h_new = torch.mm(
            heads.permute(1, 2, 0, 3).contiguous().view(-1, num_heads * feat_size),
            self.attention_layer.W_out.view(-1, embed_dim),
        ).view(batch_size, graph_size, embed_dim)
        h = h_new + h_old
        h = self.BN1(h)
        h = self.projection(h)
        h = self.BN2(h)

        return (h, h.mean(dim=1))


# ---- rl4co/models/zoo/mdam/mha.py ----


class MultiHeadAttentionMDAM(nn.Module):
    """Multi-head attention with explicit weight tensors.

    Every head projects to ``embed_dim`` features. With ``last_one=True`` the forward
    pass also returns the attention weights and the value tensor.

    Args:
        embed_dim: Input and per-head feature size.
        n_heads: Number of attention heads.
        last_one: If True, ``forward`` returns ``(out, attn, V)`` instead of ``out``.
        sdpa_fn: Not used by this implementation; a warning is logged if given.
    """

    def __init__(self, embed_dim, n_heads, last_one=False, sdpa_fn=None):
        super(MultiHeadAttentionMDAM, self).__init__()

        if sdpa_fn is not None:
            log.warning("sdpa_fn is not used in this implementation")

        self.embed_dim = embed_dim
        self.n_heads = n_heads

        self.norm_factor = 1 / math.sqrt(embed_dim)  # See Attention is all you need

        self.W_query = nn.Parameter(torch.Tensor(n_heads, embed_dim, embed_dim))
        self.W_key = nn.Parameter(torch.Tensor(n_heads, embed_dim, embed_dim))
        self.W_val = nn.Parameter(torch.Tensor(n_heads, embed_dim, embed_dim))
        self.W_out = nn.Parameter(torch.Tensor(n_heads, embed_dim, embed_dim))

        self.init_parameters()
        self.last_one = last_one

    def init_parameters(self):
        """Initialise every parameter uniformly in ``[-1/sqrt(d), 1/sqrt(d)]``, d = last dim."""
        for param in self.parameters():
            stdv = 1.0 / math.sqrt(param.size(-1))
            param.data.uniform_(-stdv, stdv)

    def forward(self, q, h=None, mask=None):
        """Attend from ``q`` to ``h`` (self-attention when ``h`` is None).

        Args:
            q: Queries (batch_size, n_query, embed_dim).
            h: Keys/values source (batch_size, graph_size, embed_dim); defaults to ``q``.
            mask: Optional boolean tensor viewable as (batch_size, n_query, graph_size);
                True entries are excluded from attention.

        Returns:
            ``out`` (batch_size, n_query, embed_dim), or ``(out, attn, V)`` when the
            layer was built with ``last_one=True``.
        """
        if h is None:
            h = q  # compute self-attention

        # h should be (batch_size, graph_size, input_dim)
        batch_size, graph_size, input_dim = h.size()
        n_query = q.size(1)
        assert q.size(0) == batch_size
        assert q.size(2) == input_dim
        assert input_dim == self.embed_dim, "Wrong embedding dimension of input"

        hflat = h.contiguous().view(-1, input_dim)
        qflat = q.contiguous().view(-1, input_dim)

        # last dimension can be different for keys and values
        shp = (self.n_heads, batch_size, graph_size, -1)
        shp_q = (self.n_heads, batch_size, n_query, -1)

        # Calculate queries, (n_heads, batch_size, n_query, key/val_size)
        Q = torch.matmul(qflat, self.W_query).view(shp_q)
        # Calculate keys and values (n_heads, batch_size, graph_size, key/val_size)
        K = torch.matmul(hflat, self.W_key).view(shp)
        V = torch.matmul(hflat, self.W_val).view(shp)

        # Calculate compatibility (n_heads, batch_size, n_query, graph_size)
        compatibility = self.norm_factor * torch.matmul(Q, K.transpose(2, 3))

        # Optionally apply mask to prevent attention
        if mask is not None:
            mask = mask.view(1, batch_size, n_query, graph_size).expand_as(compatibility)
            compatibility[mask] = float("-inf")

        attn = F.softmax(compatibility, dim=-1)

        # If there are nodes with no neighbours then softmax returns nan so we fix them to 0
        if mask is not None:
            attnc = attn.clone()
            attnc[mask] = 0
            attn = attnc

        heads = torch.matmul(attn, V)

        out = torch.mm(
            heads.permute(1, 2, 0, 3)
            .contiguous()
            .view(-1, self.n_heads * self.embed_dim),
            self.W_out.view(-1, self.embed_dim),
        ).view(batch_size, n_query, self.embed_dim)
        if self.last_one:
            return (out, attn, V)
        return out
# ---- rl4co/models/zoo/mdam/model.py ----


def rollout(self, model, env, batch_size=64, device="cpu", dataset=None):
    """Greedy rollout used as the baseline for MDAM.

    In this case the reward from the model is [batch, num_paths]
    and the baseline takes the maximum reward from the model as the baseline.
    https://github.com/liangxinedu/MDAM/blob/19b0bf813fb2dbec2fcde9e22eb50e04675400cd/train.py#L38C29-L38C33

    Args:
        self: Baseline object this function is bound to with ``functools.partial``;
            only ``self.dataset`` is read.
        model: Policy to evaluate; switched to eval mode and moved to ``device``.
        env: Environment used to reset each batch.
        batch_size: Batch size of the evaluation data loader.
        device: Device on which the rollout runs.
        dataset: Dataset to evaluate on; defaults to ``self.dataset``.

    Returns:
        The per-instance maximum reward over paths, concatenated over all batches.
    """
    # if dataset is None, use the dataset of the baseline
    dataset = self.dataset if dataset is None else dataset

    model.eval()
    model = model.to(device)

    def eval_model(batch):
        with torch.inference_mode():
            batch = env.reset(batch.to(device))
            return model(batch, env, decode_type="greedy")["reward"].max(1).values

    dl = DataLoader(dataset, batch_size=batch_size, collate_fn=dataset.collate_fn)

    rewards = torch.cat([eval_model(batch) for batch in dl], 0)
    return rewards


class MDAM(REINFORCE):
    """Multi-Decoder Attention Model (MDAM) is a model
    to train multiple diverse policies, which effectively increases the chance of finding
    good solutions compared with existing methods that train only one policy.
    Reference link: https://arxiv.org/abs/2012.10638;
    Implementation reference: https://github.com/liangxinedu/MDAM.

    Args:
        env: Environment to use for the algorithm
        policy: Policy to use for the algorithm
        baseline: REINFORCE baseline. Defaults to rollout (1 epoch of exponential, then greedy rollout baseline)
        policy_kwargs: Keyword arguments for policy (``None`` means no extra arguments)
        baseline_kwargs: Keyword arguments for baseline (``None`` means no extra arguments)
        **kwargs: Keyword arguments passed to the superclass
    """

    def __init__(
        self,
        env: RL4COEnvBase,
        policy: MDAMPolicy = None,
        baseline: Union[REINFORCEBaseline, str] = "rollout",
        policy_kwargs=None,
        baseline_kwargs=None,
        **kwargs,
    ):
        # Fresh dicts per call: a `{}` default is created once and shared by every
        # instantiation, so anything downstream that mutates it leaks across models.
        policy_kwargs = {} if policy_kwargs is None else policy_kwargs
        baseline_kwargs = {} if baseline_kwargs is None else baseline_kwargs

        if policy is None:
            policy = MDAMPolicy(env_name=env.name, **policy_kwargs)

        super().__init__(env, policy, baseline, baseline_kwargs, **kwargs)

        # Change rollout of baseline to the rollout function
        if isinstance(self.baseline, WarmupBaseline):
            if isinstance(self.baseline.baseline, RolloutBaseline):
                self.baseline.baseline.rollout = partial(rollout, self.baseline.baseline)
        elif isinstance(self.baseline, RolloutBaseline):
            self.baseline.rollout = partial(rollout, self.baseline)

    def calculate_loss(
        self,
        td,
        batch,
        policy_out,
        reward=None,
        log_likelihood=None,
    ):
        """Calculate loss for REINFORCE algorithm.
        Same as in :class:`REINFORCE`, except that a non-scalar tensor baseline value
        is unsqueezed on dim 1 so that it broadcasts against the reward
        (i.e., [batch, num_paths]).

        Args:
            td: TensorDict containing the current state of the environment
            batch: Batch of data. This is used to get the extra loss terms, e.g., REINFORCE baseline
            policy_out: Output of the policy network
            reward: Reward tensor. If None, it is taken from `policy_out`
            log_likelihood: Log-likelihood tensor. If None, it is taken from `policy_out`

        Returns:
            ``policy_out`` updated in place with ``loss``, ``reinforce_loss``,
            ``bl_loss`` and ``bl_val``.
        """
        # Extra: this is used for additional loss terms, e.g., REINFORCE baseline
        extra = batch.get("extra", None)
        reward = reward if reward is not None else policy_out["reward"]
        log_likelihood = (
            log_likelihood if log_likelihood is not None else policy_out["log_likelihood"]
        )

        # REINFORCE baseline
        bl_val, bl_loss = (
            self.baseline.eval(td, reward, self.env) if extra is None else (extra, 0)
        )

        # Main loss function
        # reward: [batch, num_paths]. Note that the baseline value is the max reward
        # if bl_val is a tensor, unsqueeze it to match the reward shape
        if isinstance(bl_val, torch.Tensor):
            if len(bl_val.shape) > 0:
                bl_val = bl_val.unsqueeze(1)
        advantage = reward - bl_val  # advantage = reward - baseline
        reinforce_loss = -(advantage * log_likelihood).mean()
        loss = reinforce_loss + bl_loss
        policy_out.update(
            {
                "loss": loss,
                "reinforce_loss": reinforce_loss,
                "bl_loss": bl_loss,
                "bl_val": bl_val,
            }
        )
        return policy_out


# ---- rl4co/models/zoo/mdam/policy.py ----


class MDAMPolicy(AutoregressivePolicy):
    """Multi-Decoder Attention Model (MDAM) policy.

    Args:
        encoder: Encoder to use. If None, an ``MDAMGraphAttentionEncoder`` is built
            from ``num_heads``, ``embed_dim``, ``num_encoder_layers`` and ``normalization``.
        decoder: Decoder to use. If None, an ``MDAMDecoder`` is built from ``env_name``,
            ``embed_dim``, ``num_heads`` and ``**decoder_kwargs``.
        embed_dim: Embedding dimension shared by init embedding, encoder and decoder.
        env_name: Name of the environment; selects the init embedding.
        num_encoder_layers: Number of layers of the default encoder.
        num_heads: Number of attention heads of the default encoder and decoder.
        normalization: Normalization type of the default encoder.
        **decoder_kwargs: Extra keyword arguments for the default ``MDAMDecoder``.
    """

    def __init__(
        self,
        encoder: MDAMGraphAttentionEncoder = None,
        decoder: MDAMDecoder = None,
        embed_dim: int = 128,
        env_name: str = "tsp",
        num_encoder_layers: int = 3,
        num_heads: int = 8,
        normalization: str = "batch",
        **decoder_kwargs,
    ):
        encoder = (
            MDAMGraphAttentionEncoder(
                num_heads=num_heads,
                embed_dim=embed_dim,
                num_layers=num_encoder_layers,
                normalization=normalization,
            )
            if encoder is None
            else encoder
        )

        decoder = (
            MDAMDecoder(
                env_name=env_name,
                embed_dim=embed_dim,
                num_heads=num_heads,
                **decoder_kwargs,
            )
            if decoder is None
            else decoder
        )

        super(MDAMPolicy, self).__init__(
            env_name=env_name, encoder=encoder, decoder=decoder
        )

        self.init_embedding = env_init_embedding(env_name, {"embed_dim": embed_dim})

    def forward(
        self,
        td: TensorDict,
        env: Union[str, RL4COEnvBase] = None,
        phase: str = "train",
        return_actions: bool = True,
        **decoder_kwargs,
    ) -> TensorDict:
        """Embed, encode and decode ``td`` along every path.

        Args:
            td: Current (reset) state of the environment.
            env: Environment, environment name, or None (then ``self.env_name`` is
                instantiated).
            phase: Selects ``self.{phase}_decode_type`` when ``decode_type`` is not
                given in ``decoder_kwargs``.
            return_actions: Whether to include the decoder's actions in the output.
            **decoder_kwargs: Forwarded to the decoder.

        Returns:
            Dict with ``reward``, ``log_likelihood``, ``entropy`` and ``actions``.
            Note that ``entropy`` holds the decoder's KL-divergence term, and
            ``actions`` is None when ``return_actions`` is False.
        """
        embedding = self.init_embedding(td)
        encoded_inputs, _, attn, V, h_old = self.encoder(embedding)

        # Instantiate environment if needed
        if isinstance(env, str) or env is None:
            env_name = self.env_name if env is None else env
            log.info(f"Instantiated environment not provided; instantiating {env_name}")
            env = get_env(env_name)

        # Get decode type depending on phase
        if decoder_kwargs.get("decode_type", None) is None:
            decoder_kwargs["decode_type"] = getattr(self, f"{phase}_decode_type")

        reward, log_likelihood, kl_divergence, actions = self.decoder(
            td, encoded_inputs, env, attn, V, h_old, self.encoder, **decoder_kwargs
        )
        out = {
            "reward": reward,
            "log_likelihood": log_likelihood,
            "entropy": kl_divergence,
            "actions": actions if return_actions else None,
        }
        return out
class MVMoE_POMO(POMO):
    """MVMoE model for neural combinatorial optimization based on POMO and REINFORCE.

    Please refer to Zhou et al. (2024).

    Args:
        env: Environment to use for the algorithm
        policy: Policy to use for the algorithm. If None, an `AttentionModelPolicy`
            is built from `policy_kwargs` merged with the MVMoE settings
        policy_kwargs: Keyword arguments for the policy. The dict passed by the
            caller is copied and never modified. When the policy is built here,
            the MVMoE settings override entries that use the same key
        baseline: Forwarded to `POMO.__init__`
        num_augment: Forwarded to `POMO.__init__`
        augment_fn: Forwarded to `POMO.__init__`
        first_aug_identity: Forwarded to `POMO.__init__`
        feats: Forwarded to `POMO.__init__`
        num_starts: Forwarded to `POMO.__init__`
        moe_kwargs: Mixture-of-experts settings with an "encoder" and a "decoder"
            entry. If None, the defaults defined below are used
        **kwargs: Extra keyword arguments forwarded to `POMO.__init__`
    """

    def __init__(
        self,
        env: RL4COEnvBase,
        policy: nn.Module = None,
        policy_kwargs: dict = None,
        baseline: str = "shared",
        num_augment: int = 8,
        augment_fn: Union[str, callable] = "dihedral8",
        first_aug_identity: bool = True,
        feats: list = None,
        num_starts: int = None,
        moe_kwargs: dict = None,
        **kwargs,
    ):
        # Work on a private copy: the previous `{}` default was shared between
        # calls and mutated in place, leaking settings from one model to the next.
        policy_kwargs = {} if policy_kwargs is None else dict(policy_kwargs)

        if moe_kwargs is None:
            moe_kwargs = {
                "encoder": {
                    "hidden_act": "ReLU",
                    "num_experts": 4,
                    "k": 2,
                    "noisy_gating": True,
                },
                "decoder": {
                    "light_version": True,
                    "num_experts": 4,
                    "k": 2,
                    "noisy_gating": True,
                },
            }

        if policy is None:
            # Same precedence as before: these settings win over user entries.
            policy_kwargs.update(
                {
                    "num_encoder_layers": 6,
                    "normalization": "instance",
                    "use_graph_context": False,
                    "moe_kwargs": moe_kwargs,
                }
            )
            policy = AttentionModelPolicy(env_name=env.name, **policy_kwargs)

        # Initialize with the shared baseline
        super(MVMoE_POMO, self).__init__(
            env,
            policy,
            policy_kwargs,
            baseline,
            num_augment,
            augment_fn,
            first_aug_identity,
            feats,
            num_starts,
            **kwargs,
        )
+ """ + + def __init__( + self, + env: RL4COEnvBase, + policy: AttentionModelPolicy = None, + baseline: Union[REINFORCEBaseline, str] = "rollout", + policy_kwargs={}, + baseline_kwargs={}, + moe_kwargs: dict = None, + **kwargs, + ): + if moe_kwargs is None: + moe_kwargs = {"encoder": {"hidden_act": "ReLU", "num_experts": 4, "k": 2, "noisy_gating": True}, + "decoder": {"light_version": True, "out_bias": False, "num_experts": 4, "k": 2, "noisy_gating": True}} + + if policy is None: + policy_kwargs_ = { + "moe_kwargs": moe_kwargs, + } + policy_kwargs.update(policy_kwargs_) + policy = AttentionModelPolicy(env_name=env.name, **policy_kwargs) + + # Initialize with the shared baseline + super(MVMoE_AM, self).__init__(env, policy, baseline, policy_kwargs, baseline_kwargs, **kwargs) diff --git a/rl4co/models/zoo/n2s/__init__.py b/rl4co/models/zoo/n2s/__init__.py new file mode 100644 index 00000000..77085511 --- /dev/null +++ b/rl4co/models/zoo/n2s/__init__.py @@ -0,0 +1,2 @@ +from .model import N2S +from .policy import N2SPolicy diff --git a/rl4co/models/zoo/n2s/decoder.py b/rl4co/models/zoo/n2s/decoder.py new file mode 100644 index 00000000..2c843a8b --- /dev/null +++ b/rl4co/models/zoo/n2s/decoder.py @@ -0,0 +1,261 @@ +import math + +import torch +import torch.nn as nn + +from tensordict import TensorDict +from torch import Tensor + +from rl4co.models.common.improvement.base import ImprovementDecoder +from rl4co.models.nn.attention import MultiHeadCompat +from rl4co.models.nn.mlp import MLP +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class NodePairRemovalDecoder(ImprovementDecoder): + """ + N2S Node-Pair Removal decoder based on Ma et al. 
(2022) + Given the environment state and the node embeddings (positional embeddings are discarded), compute the logits for + selecting a pair of pickup and delivery nodes for node pair removal from the current solution + + + Args: + embed_dim: Embedding dimension + num_heads: Number of attention heads + """ + + def __init__( + self, + embed_dim: int = 128, + num_heads: int = 4, + ): + super().__init__() + self.input_dim = embed_dim + self.n_heads = num_heads + self.hidden_dim = embed_dim + + assert embed_dim % num_heads == 0 + + self.W_Q = nn.Parameter( + torch.Tensor(self.n_heads, self.input_dim, self.hidden_dim) + ) + self.W_K = nn.Parameter( + torch.Tensor(self.n_heads, self.input_dim, self.hidden_dim) + ) + + self.agg = MLP(input_dim=2 * self.n_heads + 4, output_dim=1, num_neurons=[32, 32]) + + self.init_parameters() + + def init_parameters(self) -> None: + for param in self.parameters(): + stdv = 1.0 / math.sqrt(param.size(-1)) + param.data.uniform_(-stdv, stdv) + + def forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> Tensor: + """Compute the logits of the removing a node pair from the current solution + + Args: + td: TensorDict with the current environment state + final_h: final node embeddings + final_p: final positional embeddings + """ + + selection_recent = torch.cat( + (td["action_record"][:, -3:], td["action_record"].mean(1, True)), 1 + ) + solution = td["rec_current"] + + pre = solution.argsort() # pre=[1,2,0] + post = solution.gather( + 1, solution + ) # post=[1,2,0] # the second neighbour works better + batch_size, graph_size_plus1, input_dim = final_h.size() + + hflat = final_h.contiguous().view(-1, input_dim) ################# reshape + + shp = (self.n_heads, batch_size, graph_size_plus1, self.hidden_dim) + + # Calculate queries, (n_heads, batch_size, graph_size+1, key_size) + hidden_Q = torch.matmul(hflat, self.W_Q).view(shp) + hidden_K = torch.matmul(hflat, self.W_K).view(shp) + + Q_pre = hidden_Q.gather( + 2, pre.view(1, 
batch_size, graph_size_plus1, 1).expand_as(hidden_Q) + ) + K_post = hidden_K.gather( + 2, post.view(1, batch_size, graph_size_plus1, 1).expand_as(hidden_Q) + ) + + compatibility = ( + (Q_pre * hidden_K).sum(-1) + + (hidden_Q * K_post).sum(-1) + - (Q_pre * K_post).sum(-1) + )[ + :, :, 1: + ] # (n_heads, batch_size, graph_size) (12) + + compatibility_pairing = torch.cat( + ( + compatibility[:, :, : graph_size_plus1 // 2], + compatibility[:, :, graph_size_plus1 // 2 :], + ), + 0, + ) # (n_heads*2, batch_size, graph_size/2) + + compatibility_pairing = self.agg( + torch.cat( + ( + compatibility_pairing.permute(1, 2, 0), + selection_recent.permute(0, 2, 1), + ), + -1, + ) + ).squeeze() # (batch_size, graph_size/2) + + return compatibility_pairing + + +class NodePairReinsertionDecoder(ImprovementDecoder): + """ + N2S Node-Pair Reinsertion decoder based on Ma et al. (2022) + Given the environment state, the node embeddings (positional embeddings are discarded), and the removed node from the NodePairRemovalDecoder, + compute the logits for finding places to re-insert the removed pair of pickup and delivery nodes to form a new solution + + + Args: + embed_dim: Embedding dimension + num_heads: Number of attention heads + """ + + def __init__( + self, + embed_dim: int = 128, + num_heads: int = 4, + ): + super().__init__() + self.input_dim = embed_dim + self.n_heads = num_heads + self.hidden_dim = embed_dim + + assert embed_dim % num_heads == 0 + + self.compater_insert1 = MultiHeadCompat( + num_heads, embed_dim, embed_dim, embed_dim, embed_dim + ) + + self.compater_insert2 = MultiHeadCompat( + num_heads, embed_dim, embed_dim, embed_dim, embed_dim + ) + + self.agg = MLP(input_dim=4 * self.n_heads, output_dim=1, num_neurons=[32, 32]) + + def forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> torch.Tensor: + action_removal = td["action"] + solution = td["rec_current"] + + pos_pickup = (1 + action_removal).view(-1) + pos_delivery = pos_pickup + solution.size(-1) // 
2 + + batch_size, graph_size_plus1, input_dim = final_h.size() + shp = (batch_size, graph_size_plus1, graph_size_plus1, self.n_heads) + shp_p = (batch_size, -1, 1, self.n_heads) + shp_d = (batch_size, 1, -1, self.n_heads) + + arange = torch.arange(batch_size, device=final_h.device) + h_pickup = final_h[arange, pos_pickup].unsqueeze(1) # (batch_size, 1, input_dim) + h_delivery = final_h[arange, pos_delivery].unsqueeze( + 1 + ) # (batch_size, 1, input_dim) + h_K_neibour = final_h.gather( + 1, solution.view(batch_size, graph_size_plus1, 1).expand_as(final_h) + ) # (batch_size, graph_size+1, input_dim) + + compatibility_pickup_pre = ( + self.compater_insert1( + h_pickup, final_h + ) # (n_heads, batch_size, 1, graph_size+1) + .permute(1, 2, 3, 0) # (batch_size, 1, graph_size+1, n_heads) + .view(shp_p) # (batch_size, graph_size+1, 1, n_heads) + .expand(shp) # (batch_size, graph_size+1, graph_size+1, n_heads) + ) + compatibility_pickup_post = ( + self.compater_insert2(h_pickup, h_K_neibour) + .permute(1, 2, 3, 0) + .view(shp_p) + .expand(shp) + ) + compatibility_delivery_pre = ( + self.compater_insert1( + h_delivery, final_h + ) # (n_heads, batch_size, 1, graph_size+1) + .permute(1, 2, 3, 0) # (batch_size, 1, graph_size+1, n_heads) + .view(shp_d) # (batch_size, 1, graph_size+1, n_heads) + .expand(shp) # (batch_size, graph_size+1, graph_size+1, n_heads) + ) + compatibility_delivery_post = ( + self.compater_insert2(h_delivery, h_K_neibour) + .permute(1, 2, 3, 0) + .view(shp_d) + .expand(shp) + ) + + compatibility = self.agg( + torch.cat( + ( + compatibility_pickup_pre, + compatibility_pickup_post, + compatibility_delivery_pre, + compatibility_delivery_post, + ), + -1, + ) + ).squeeze() + + return compatibility # (batch_size, graph_size+1, graph_size+1) + + +class CriticDecoder(nn.Module): + def __init__(self, input_dim: int, dropout_rate=0.01) -> None: + super().__init__() + self.input_dim = input_dim + + self.project_graph = nn.Linear(self.input_dim, self.input_dim // 2) + 
self.project_node = nn.Linear(self.input_dim, self.input_dim // 2) + + self.MLP = MLP( + input_dim=input_dim + 1, + output_dim=1, + num_neurons=[input_dim, input_dim // 2], + dropout_probs=[dropout_rate, 0.0], + ) + + def forward(self, x: torch.Tensor, best_cost: torch.Tensor) -> torch.Tensor: + # h_wave: (batch_size, graph_size+1, input_size) + mean_pooling = x.mean(1) # mean Pooling (batch_size, input_size) + graph_feature: torch.Tensor = self.project_graph(mean_pooling)[ + :, None, : + ] # (batch_size, 1, input_dim/2) + node_feature: torch.Tensor = self.project_node( + x + ) # (batch_size, graph_size+1, input_dim/2) + + # pass through value_head, get estimated value + fusion = node_feature + graph_feature.expand_as( + node_feature + ) # (batch_size, graph_size+1, input_dim/2) + + fusion_feature = torch.cat( + ( + fusion.mean(1), + fusion.max(1)[0], # max_pooling + best_cost.to(x.device), + ), + -1, + ) # (batch_size, input_dim + 1) + + value = self.MLP(fusion_feature) + + return value diff --git a/rl4co/models/zoo/n2s/encoder.py b/rl4co/models/zoo/n2s/encoder.py new file mode 100644 index 00000000..c219c3c3 --- /dev/null +++ b/rl4co/models/zoo/n2s/encoder.py @@ -0,0 +1,217 @@ +import math + +from typing import Callable, Tuple + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from torch import Tensor + +from rl4co.models.common import ImprovementEncoder +from rl4co.models.nn.attention import MultiHeadCompat +from rl4co.models.nn.ops import AdaptiveSequential, Normalization +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class Synth_Attention(nn.Module): + def __init__(self, n_heads: int, input_dim: int) -> None: + super().__init__() + + hidden_dim = input_dim // n_heads + + self.n_heads = n_heads + self.input_dim = input_dim + self.hidden_dim = hidden_dim + + self.W_query = nn.Parameter(torch.Tensor(n_heads, input_dim, hidden_dim)) + self.W_key = nn.Parameter(torch.Tensor(n_heads, input_dim, 
hidden_dim)) + self.W_val = nn.Parameter(torch.Tensor(n_heads, input_dim, hidden_dim)) + + self.score_aggr = nn.Sequential( + nn.Linear(2 * n_heads, 2 * n_heads), + nn.ReLU(inplace=True), + nn.Linear(2 * n_heads, n_heads), + ) + + self.W_out = nn.Parameter(torch.Tensor(n_heads, hidden_dim, input_dim)) + + self.init_parameters() + + # used for init nn.Parameter + def init_parameters(self): + for param in self.parameters(): + stdv = 1.0 / math.sqrt(param.size(-1)) + param.data.uniform_(-stdv, stdv) + + def forward( + self, h_fea: torch.Tensor, aux_att_score: torch.Tensor + ) -> Tuple[torch.Tensor, torch.Tensor]: + # h should be (batch_size, n_query, input_dim) + batch_size, n_query, input_dim = h_fea.size() + + hflat = h_fea.contiguous().view(-1, input_dim) + + shp = (self.n_heads, batch_size, n_query, self.hidden_dim) + + # Calculate queries, (n_heads, batch_size, n_query, hidden_dim) + Q = torch.matmul(hflat, self.W_query).view(shp) + K = torch.matmul(hflat, self.W_key).view(shp) + V = torch.matmul(hflat, self.W_val).view(shp) + + # Calculate compatibility (n_heads, batch_size, n_query, n_key) + compatibility = torch.cat((torch.matmul(Q, K.transpose(2, 3)), aux_att_score), 0) + + attn_raw = compatibility.permute( + 1, 2, 3, 0 + ) # (batch_size, n_query, n_key, n_heads) + attn = self.score_aggr(attn_raw).permute( + 3, 0, 1, 2 + ) # (n_heads, batch_size, n_query, n_key) + heads = torch.matmul( + F.softmax(attn, dim=-1), V + ) # (n_heads, batch_size, n_query, hidden_dim) + + h_wave = torch.mm( + heads.permute(1, 2, 0, 3) # (batch_size, n_query, n_heads, hidden_dim) + .contiguous() + .view( + -1, self.n_heads * self.hidden_dim + ), # (batch_size * n_query, n_heads * hidden_dim) + self.W_out.view(-1, self.input_dim), # (n_heads * hidden_dim, input_dim) + ).view(batch_size, n_query, self.input_dim) + + return h_wave, aux_att_score + + +class SynthAttNormSubLayer(nn.Module): + def __init__(self, n_heads: int, input_dim: int, normalization: str) -> None: + 
class N2SEncoder(ImprovementEncoder):
    """Neural Neighborhood Search (N2S) encoder as in Ma et al. (2022).

    First embeds the input and then processes it with a graph attention network.

    Args:
        embed_dim: Dimension of the embedding space
        init_embedding: Module to use for the initialization of the node embeddings
        pos_embedding: Module to use for the initialization of the positional embeddings
        env_name: Name of the environment used to initialize embeddings
        pos_type: Name of the used positional encoding method (CPE or APE)
        num_heads: Number of heads in the attention layers
        num_layers: Number of layers in the attention network
        normalization: Normalization type in the attention layers
        feedforward_hidden: Hidden dimension in the feedforward layers
    """

    def __init__(
        self,
        embed_dim: int = 128,
        init_embedding: nn.Module = None,
        pos_embedding: nn.Module = None,
        env_name: str = "pdp_ruin_repair",
        pos_type: str = "CPE",
        num_heads: int = 4,
        num_layers: int = 3,
        normalization: str = "layer",
        feedforward_hidden: int = 128,
    ):
        # The base encoder receives every constructor argument unchanged
        super().__init__(
            embed_dim=embed_dim,
            init_embedding=init_embedding,
            pos_embedding=pos_embedding,
            env_name=env_name,
            pos_type=pos_type,
            num_heads=num_heads,
            num_layers=num_layers,
            normalization=normalization,
            feedforward_hidden=feedforward_hidden,
        )

        # Applied to the positional embeddings before the attention stack
        self.pos_net = MultiHeadCompat(num_heads, embed_dim, feedforward_hidden)

        # Stack of `num_layers` identical encoder layers
        encoder_layers = [
            N2SEncoderLayer(num_heads, embed_dim, feedforward_hidden, normalization)
            for _ in range(num_layers)
        ]
        self.net = AdaptiveSequential(*encoder_layers)

    def _encoder_forward(self, init_h: Tensor, init_p: Tensor) -> Tuple[Tensor, Tensor]:
        """Run the attention stack on the initial node and positional embeddings.

        Args:
            init_h: Initial node embeddings
            init_p: Initial positional embeddings

        Returns:
            The two outputs of the layer stack: final node embeddings and the
            second value carried through the layers alongside them.
        """
        # The output of `pos_net` is what each layer receives as `aux_att_score`
        aux_scores = self.pos_net(init_p)
        final_h, final_p = self.net(init_h, aux_scores)

        return final_h, final_p
class N2S(n_step_PPO):
    """N2S Model based on n_step Proximal Policy Optimization (PPO) with an N2S model policy.
    We default to the N2S model policy and the improvement Critic Network.

    Args:
        env: Environment to use for the algorithm
        policy: Policy to use for the algorithm. If None, an `N2SPolicy` is built
            from `policy_kwargs`
        critic: Critic to use for the algorithm. If None, a `CriticNetwork` with a
            `MultiHeadAttentionLayer` encoder and a `CriticDecoder` value head is built
        policy_kwargs: Keyword arguments for policy
        critic_kwargs: Keyword arguments for critic; the keys "num_heads",
            "feedforward_hidden" and "normalization" are read
        **kwargs: Extra keyword arguments forwarded to `n_step_PPO.__init__`
    """

    def __init__(
        self,
        env: RL4COEnvBase,
        policy: nn.Module = None,
        critic: CriticNetwork = None,
        policy_kwargs: dict = {},
        critic_kwargs: dict = {},
        **kwargs,
    ):
        # NOTE: both kwargs dicts are only read here, never modified.
        if policy is None:
            policy = N2SPolicy(env_name=env.name, **policy_kwargs)

        if critic is None:
            # the critic's embed_dim must be as policy's
            embed_dim = policy_kwargs.get("embed_dim", 128)

            critic = CriticNetwork(
                encoder=MultiHeadAttentionLayer(
                    embed_dim,
                    critic_kwargs.get("num_heads", 4),
                    critic_kwargs.get("feedforward_hidden", 128),
                    critic_kwargs.get("normalization", "layer"),
                    bias=False,
                ),
                value_head=CriticDecoder(embed_dim),
                customized=True,
            )

        super().__init__(env, policy, critic, **kwargs)
class N2SPolicy(ImprovementPolicy):
    """
    N2S Policy based on Ma et al. (2022)
    This model first encodes the input graph and current solution using a N2S encoder (:class:`N2SEncoder`)
    and then decodes the node-pair removal and reinsertion action using
    the Node-Pair Removal (:class:`NodePairRemovalDecoder`) and Reinsertion (:class:`NodePairReinsertionDecoder`) decoders

    Args:
        embed_dim: Dimension of the node embeddings
        num_encoder_layers: Number of layers in the encoder
        num_heads: Number of heads in the attention layers
        normalization: Normalization type in the attention layers
        feedforward_hidden: Dimension of the hidden layer in the feedforward network
        env_name: Name of the environment used to initialize embeddings
        pos_type: Name of the used positional encoding method (CPE or APE)
        init_embedding: Module to use for the initialization of the embeddings
        pos_embedding: Module to use for the initialization of the positional embeddings
        temperature: Temperature for the softmax
        tanh_clipping: Tanh clipping value (see Bello et al., 2016)
        train_decode_type: Type of decoding to use during training
        val_decode_type: Type of decoding to use during validation
        test_decode_type: Type of decoding to use during testing
    """

    def __init__(
        self,
        embed_dim: int = 128,
        num_encoder_layers: int = 3,
        num_heads: int = 4,
        normalization: str = "layer",
        feedforward_hidden: int = 128,
        env_name: str = "pdp_ruin_repair",
        pos_type: str = "CPE",
        init_embedding: nn.Module = None,
        pos_embedding: nn.Module = None,
        temperature: float = 1.0,
        tanh_clipping: float = 6.0,
        train_decode_type: str = "sampling",
        val_decode_type: str = "sampling",
        test_decode_type: str = "sampling",
    ):
        super(N2SPolicy, self).__init__()

        self.env_name = env_name

        # Encoder and decoder
        self.encoder = N2SEncoder(
            embed_dim=embed_dim,
            init_embedding=init_embedding,
            pos_embedding=pos_embedding,
            env_name=env_name,
            pos_type=pos_type,
            num_heads=num_heads,
            num_layers=num_encoder_layers,
            normalization=normalization,
            feedforward_hidden=feedforward_hidden,
        )

        self.removal_decoder = NodePairRemovalDecoder(
            embed_dim=embed_dim, num_heads=num_heads
        )

        self.reinsertion_decoder = NodePairReinsertionDecoder(
            embed_dim=embed_dim, num_heads=num_heads
        )

        # Bias-free projections combined in `forward` into the decoder input:
        # per-node projection plus a projection of the max-pooled embedding
        self.project_graph = nn.Linear(embed_dim, embed_dim, bias=False)
        self.project_node = nn.Linear(embed_dim, embed_dim, bias=False)

        # Decoding strategies
        self.temperature = temperature
        self.tanh_clipping = tanh_clipping
        self.train_decode_type = train_decode_type
        self.val_decode_type = val_decode_type
        self.test_decode_type = test_decode_type

    def forward(
        self,
        td: TensorDict,
        env: Union[str, RL4COEnvBase] = None,
        phase: str = "train",
        return_actions: bool = True,
        return_embeds: bool = False,
        only_return_embed: bool = False,
        actions=None,
        **decoding_kwargs,
    ) -> dict:
        """Forward pass of the policy.

        Note that `td` is modified in place: its "action" entry is first set to the
        removal action and finally to the full (removal, reinsertion) action.

        Args:
            td: TensorDict containing the environment state
            env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that
                it is more efficient to pass an already instantiated environment each time for fine-grained control
            phase: Phase of the algorithm (train, val, test)
            return_actions: Whether to return the actions
            return_embeds: Whether to add the detached encoder output under "embeds"
            only_return_embed: If True, return only the detached encoder output
                (under "embeds") right after encoding, without decoding any action
            actions: Actions to use for evaluating the policy.
                If passed, use these actions instead of sampling from the policy to calculate log likelihood
            decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.

        Returns:
            out: Dictionary containing "log_likelihood" and "cost_bsf", and optionally
                "embeds" and "actions". The log likelihood is only computed when
                `phase == "train"`; otherwise it is a zero tensor of size batch_size.
        """

        # Encoder: get encoder output and initial embeddings from initial state
        h_wave, final_p = self.encoder(td)
        if only_return_embed:
            return {"embeds": h_wave.detach()}
        # Node projection plus the projected max-pooled embedding, broadcast over nodes
        final_h = (
            self.project_node(h_wave) + self.project_graph(h_wave.max(1)[0])[:, None, :]
        )

        # Instantiate environment if needed
        if isinstance(env, str) or env is None:
            env_name = self.env_name if env is None else env
            log.info(f"Instantiated environment not provided; instantiating {env_name}")
            env = get_env(env_name)

        # Get decode type depending on phase and whether actions are passed for evaluation
        decode_type = decoding_kwargs.pop("decode_type", None)
        if actions is not None:
            decode_type = "evaluate"
        elif decode_type is None:
            decode_type = getattr(self, f"{phase}_decode_type")

        # Setup decoding strategy
        # we pop arguments that are not part of the decoding strategy
        decode_strategy: DecodingStrategy = get_decoding_strategy(
            decode_type,
            temperature=decoding_kwargs.pop("temperature", self.temperature),
            tanh_clipping=decoding_kwargs.pop("tanh_clipping", self.tanh_clipping),
            mask_logits=True,
            improvement_method_mode=True,
            **decoding_kwargs,
        )

        ## action 1

        # Perform the decoding
        logits = self.removal_decoder(td, final_h, final_p)

        # Get mask
        # Start from an all-True mask; if a previous action is stored in `td`,
        # the index in its first column is set to False
        mask = torch.ones_like(td["action_record"][:, 0], device=td.device).bool()
        if "action" in td.keys():
            mask = mask.scatter(1, td["action"][:, :1], 0)

        # Get action and log-likelihood
        logprob_removal, action_removal = decode_strategy.step(
            logits,
            mask,
            action=actions[:, 0] if actions is not None else None,
        )
        action_removal = action_removal.unsqueeze(-1)
        if phase == "train":
            selected_log_ll_action1 = logprob_removal.gather(1, action_removal)

        ## action 2
        # The reinsertion decoder reads the removal action from td["action"]
        td.set("action", action_removal)

        # Perform the decoding
        batch_size, seq_length = td["rec_current"].size()
        # Flatten the pairwise reinsertion logits to one row per batch element
        logits = self.reinsertion_decoder(td, final_h, final_p).view(batch_size, -1)

        # Get mask
        mask = env.get_mask(action_removal + 1, td).view(batch_size, -1)
        # Get action and log-likelihood
        # Given actions are encoded as a flat index: first * seq_length + second
        logprob_reinsertion, action_reinsertion = decode_strategy.step(
            logits,
            mask,
            action=(
                actions[:, 1] * seq_length + actions[:, 2]
                if actions is not None
                else None
            ),
        )
        action_reinsertion = action_reinsertion.unsqueeze(-1)
        if phase == "train":
            selected_log_ll_action2 = logprob_reinsertion.gather(1, action_reinsertion)

        ## return
        # Decode the flat reinsertion index back into its two positions
        N2S_action = torch.cat(
            (
                action_removal.view(batch_size, -1),
                action_reinsertion // seq_length,
                action_reinsertion % seq_length,
            ),
            -1,
        )
        if phase == "train":
            log_likelihood = selected_log_ll_action1 + selected_log_ll_action2
        else:
            log_likelihood = torch.zeros(batch_size, device=td.device)

        outdict = {"log_likelihood": log_likelihood, "cost_bsf": td["cost_bsf"]}
        td.set("action", N2S_action)

        if return_embeds:
            outdict["embeds"] = h_wave.detach()

        if return_actions:
            outdict["actions"] = N2S_action

        return outdict
class EdgeHeatmapGenerator(nn.Module):
    """MLP for converting edge embeddings to heatmaps.

    Args:
        embed_dim: Dimension of the embeddings
        num_layers: The number of linear layers in the network.
        act_fn: Activation function, given either as the name of a function in
            `torch.nn.functional` or as a callable. Defaults to "silu".
        linear_bias: Use bias in linear layers. Defaults to True.
        undirected_graph: Whether the graph is undirected. Defaults to True.
            Stored on the module; not used when building the heatmap.
    """

    def __init__(
        self,
        embed_dim: int,
        num_layers: int,
        act_fn: Union[str, Callable] = "silu",
        linear_bias: bool = True,
        undirected_graph: bool = True,
    ) -> None:
        super().__init__()

        # num_layers - 1 hidden layers followed by one scalar output layer
        hidden_layers = [
            nn.Linear(embed_dim, embed_dim, bias=linear_bias)
            for _ in range(num_layers - 1)
        ]
        self.linears = nn.ModuleList(hidden_layers)
        self.output = nn.Linear(embed_dim, 1, bias=linear_bias)

        # Resolve activation names against torch.nn.functional
        if isinstance(act_fn, str):
            act_fn = getattr(nn.functional, act_fn)
        self.act = act_fn

        self.undirected_graph = undirected_graph

    def forward(self, graph: Batch) -> Tensor:  # type: ignore
        """Turn the edge embeddings of `graph` into heatmap logits.

        The edge attributes of `graph` are overwritten with the per-edge sigmoid
        scores before the dense heatmap is assembled.
        """
        hidden = graph.edge_attr  # type: ignore
        for linear in self.linears:
            hidden = self.act(linear(hidden))
        graph.edge_attr = torch.sigmoid(self.output(hidden))  # type: ignore

        return self._make_heatmap_logits(graph)

    def _make_heatmap_logits(self, batch_graph: Batch) -> Tensor:  # type: ignore
        """Scatter per-edge scores into a dense (batch, nodes, nodes) log-heatmap.

        The number of nodes is taken from the first graph of the batch. Entries
        without an edge keep only the small positive offset added before the log.
        """
        members = batch_graph.to_data_list()
        reference = members[0]
        node_count = reference.x.shape[0]

        heatmap = torch.zeros(
            (len(members), node_count, node_count),
            device=reference.edge_attr.device,
            dtype=reference.edge_attr.dtype,
        )

        for row, member in enumerate(members):
            sources, targets = member.edge_index[0], member.edge_index[1]
            heatmap[row, sources, targets] = member.edge_attr.flatten()

        # The heatmap is deliberately not symmetrized for undirected graphs,
        # because that would undo some of the sparsification.

        # 3e-8 is the smallest positive number such that log(3e-8) is not -inf
        # in float16; other dtypes use 1e-10.
        offset = 3e-8 if heatmap.dtype == torch.float16 else 1e-10
        heatmap += offset

        return torch.log(heatmap)
If None, use the default network for the environment + heatmap_generator: Model to use for the heatmap generator. If None, use the default network for the environment + num_layers_heatmap_generator: Number of layers in the heatmap generator + num_layers_graph_encoder: Number of layers in the graph encoder + act_fn: The activation function to use in each GNNLayer, see https://pytorch.org/docs/stable/nn.functional.html#non-linear-activation-functions for available options. Defaults to 'silu'. + agg_fn: The aggregation function to use in each GNNLayer for pooling features. Options: 'add', 'mean', 'max'. Defaults to 'mean'. + linear_bias: Use bias in linear layers. Defaults to True. + k_sparse: Number of edges to keep for each node. Defaults to None. + """ + + def __init__( + self, + embed_dim: int = 64, + env_name: str = "tsp", + # TODO: pass network + init_embedding: Optional[nn.Module] = None, + edge_embedding: Optional[nn.Module] = None, + graph_network: Optional[nn.Module] = None, + heatmap_generator: Optional[nn.Module] = None, + num_layers_heatmap_generator: int = 5, + num_layers_graph_encoder: int = 15, + act_fn="silu", + agg_fn="mean", + linear_bias: bool = True, + k_sparse: Optional[int] = None, + ): + super(NonAutoregressiveEncoder, self).__init__() + self.env_name = env_name + + self.init_embedding = ( + env_init_embedding(self.env_name, {"embed_dim": embed_dim}) + if init_embedding is None + else init_embedding + ) + + self.edge_embedding = ( + env_edge_embedding(self.env_name, {"embed_dim": embed_dim, "k_sparse": k_sparse}) + if edge_embedding is None + else edge_embedding + ) + + self.graph_network = ( + GNNEncoder( + embed_dim=embed_dim, + num_layers=num_layers_graph_encoder, + act_fn=act_fn, + agg_fn=agg_fn, + ) + if graph_network is None + else graph_network + ) + + self.heatmap_generator = ( + EdgeHeatmapGenerator( + embed_dim=embed_dim, + num_layers=num_layers_heatmap_generator, + linear_bias=linear_bias, + ) + if heatmap_generator is None + else 
heatmap_generator + ) + + def forward(self, td: TensorDict): + """Forward pass of the encoder. + Transform the input TensorDict into the latent representation. + """ + # Transfer to embedding space + node_embed = self.init_embedding(td) + graph = self.edge_embedding(td, node_embed) + + # Process embedding into graph + # TODO: standardize? + graph.x, graph.edge_attr = self.graph_network( + graph.x, graph.edge_index, graph.edge_attr + ) + + # Generate heatmap logits + heatmap_logits = self.heatmap_generator(graph) + + # Return latent representation (i.e. heatmap logits) and initial embeddings + return heatmap_logits, node_embed + + +class NARGNNNodeEncoder(NARGNNEncoder): + """In this case, we just use the node embeddings from the graph + without transforming them into a heatmap. + """ + + def forward(self, td: TensorDict): + # Transfer to embedding space + node_embed = self.init_embedding(td) + graph = self.edge_embedding(td, node_embed) + + # Process embedding into graph + # TODO: standardize? + graph.x, graph.edge_attr = self.graph_network( + graph.x, graph.edge_index, graph.edge_attr + ) + + proc_embeds = graph.x + batch_size = node_embed.shape[0] + # reshape proc_embeds from [bs*n, h] to [bs, n, h] + proc_embeds = proc_embeds.reshape(batch_size, -1, proc_embeds.shape[1]) + return proc_embeds, node_embed diff --git a/rl4co/models/zoo/nargnn/policy.py b/rl4co/models/zoo/nargnn/policy.py new file mode 100644 index 00000000..5d83cb73 --- /dev/null +++ b/rl4co/models/zoo/nargnn/policy.py @@ -0,0 +1,107 @@ +from typing import Optional + +import torch.nn as nn + +from rl4co.models.common.constructive.nonautoregressive import ( + NonAutoregressiveDecoder, + NonAutoregressiveEncoder, + NonAutoregressivePolicy, +) +from rl4co.utils.pylogger import get_pylogger + +from .encoder import NARGNNEncoder + +log = get_pylogger(__name__) + + +class NARGNNPolicy(NonAutoregressivePolicy): + """ + Base Non-autoregressive policy for NCO construction methods. 
+ This creates a heatmap of NxN for N nodes (i.e., heuristic) that models the probability to go from one node to another for all nodes. + + The policy performs the following steps: + 1. Encode the environment initial state into node embeddings + 2. Decode (non-autoregressively) to construct the solution to the NCO problem + + Warning: + The effectiveness of the non-autoregressive approach can vary significantly across different problem types and configurations. + It may require careful tuning of the model architecture and decoding strategy to achieve competitive results. + + Args: + encoder: Encoder module. Can be passed by sub-classes + decoder: Decoder module. Note that this moule defaults to the non-autoregressive decoder + embed_dim: Dimension of the embeddings + env_name: Name of the environment used to initialize embeddings + init_embedding: Model to use for the initial embedding. If None, use the default embedding for the environment + edge_embedding: Model to use for the edge embedding. If None, use the default embedding for the environment + graph_network: Model to use for the graph network. If None, use the default embedding for the environment + heatmap_generator: Model to use for the heatmap generator. 
If None, use the default embedding for the environment + num_layers_heatmap_generator: Number of layers in the heatmap generator + num_layers_graph_encoder: Number of layers in the graph encoder + act_fn: Activation function to use in the encoder + agg_fn: Aggregation function to use in the encoder + linear_bias: Whether to use bias in the encoder + train_decode_type: Type of decoding during training + val_decode_type: Type of decoding during validation + test_decode_type: Type of decoding during testing + **constructive_policy_kw: Unused keyword arguments + """ + + def __init__( + self, + encoder: Optional[NonAutoregressiveEncoder] = None, + decoder: Optional[NonAutoregressiveDecoder] = None, + embed_dim: int = 64, + env_name: str = "tsp", + init_embedding: Optional[nn.Module] = None, + edge_embedding: Optional[nn.Module] = None, + graph_network: Optional[nn.Module] = None, + heatmap_generator: Optional[nn.Module] = None, + num_layers_heatmap_generator: int = 5, + num_layers_graph_encoder: int = 15, + act_fn="silu", + agg_fn="mean", + linear_bias: bool = True, + train_decode_type: str = "multistart_sampling", + val_decode_type: str = "multistart_greedy", + test_decode_type: str = "multistart_greedy", + **constructive_policy_kw, + ): + if len(constructive_policy_kw) > 0: + log.warn(f"Unused kwargs: {constructive_policy_kw}") + + if encoder is None: + encoder = NARGNNEncoder( + embed_dim=embed_dim, + env_name=env_name, + init_embedding=init_embedding, + edge_embedding=edge_embedding, + graph_network=graph_network, + heatmap_generator=heatmap_generator, + num_layers_heatmap_generator=num_layers_heatmap_generator, + num_layers_graph_encoder=num_layers_graph_encoder, + act_fn=act_fn, + agg_fn=agg_fn, + linear_bias=linear_bias, + ) + + # The decoder generates logits given the current td and heatmap + if decoder is None: + decoder = NonAutoregressiveDecoder() + else: + # check if the decoder has trainable parameters + if any(p.requires_grad for p in 
class RDSDecoder(ImprovementDecoder):
    """
    RDS Decoder for flexible k-opt based on Ma et al. (2023)
    Given the environment state and the node embeddings (positional embeddings are discarded), compute the logits for
    selecting a k-opt exchange on basis moves (S-move, I-move, E-move) from the current solution

    Args:
        embed_dim: Embedding dimension
    """

    def __init__(
        self,
        embed_dim: int = 128,
    ):
        super().__init__()
        self.embed_dim = embed_dim

        # Key projections applied to the node embeddings (two per stream)
        self.linear_K1 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)
        self.linear_K2 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)
        self.linear_K3 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)
        self.linear_K4 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)

        # Query projections applied to the recurrent states (two per stream)
        self.linear_Q1 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)
        self.linear_Q2 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)
        self.linear_Q3 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)
        self.linear_Q4 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)

        # NOTE: these vectors are allocated WITHOUT initialisation; whoever owns
        # the decoder must initialise them before the first forward pass.
        self.linear_V1 = nn.Parameter(torch.Tensor(self.embed_dim))
        self.linear_V2 = nn.Parameter(torch.Tensor(self.embed_dim))

        # One GRU cell per stream to carry the decoding state across steps
        self.rnn1 = nn.GRUCell(self.embed_dim, self.embed_dim)
        self.rnn2 = nn.GRUCell(self.embed_dim, self.embed_dim)

    def forward(self, h, q1, q2, input_q1, input_q2) -> "tuple[Tensor, Tensor, Tensor]":
        """Advance both recurrent streams one step and score every node.

        Args:
            h: Node embeddings; assumed [batch, num_nodes, embed_dim] (queries are
                broadcast against it along dim 1) — TODO confirm with caller
            q1: Previous hidden state of the first GRU cell
            q2: Previous hidden state of the second GRU cell
            input_q1: Input fed to the first GRU cell
            input_q2: Input fed to the second GRU cell

        Returns:
            Tuple `(logits, q1, q2)`: the summed scores of both streams (last
            dimension reduced) and the updated hidden states.
        """
        # GRUs
        q1 = self.rnn1(input_q1, q1)
        q2 = self.rnn2(input_q2, q2)

        # Dual-Stream Attention
        # The V vectors have shape [embed_dim] and broadcast over the leading
        # dimensions, so no explicit per-batch expand is required.
        mu_stream = (
            self.linear_V1
            * torch.tanh(
                self.linear_K1(h)
                + self.linear_Q1(q1).unsqueeze(1)
                + self.linear_K3(h) * self.linear_Q3(q1).unsqueeze(1)
            )
        ).sum(-1)  # \mu stream
        lambda_stream = (
            self.linear_V2
            * torch.tanh(
                self.linear_K2(h)
                + self.linear_Q2(q2).unsqueeze(1)
                + self.linear_K4(h) * self.linear_Q4(q2).unsqueeze(1)
            )
        ).sum(-1)  # \lambda stream

        return mu_stream + lambda_stream, q1, q2
class NeuOpt(n_step_PPO):
    """NeuOpt Model based on n_step Proximal Policy Optimization (PPO) with an NeuOpt model policy.
    We default to the NeuOpt model policy and the improvement Critic Network.

    Args:
        env: Environment to use for the algorithm
        policy: Policy to use for the algorithm. If None, a `NeuOptPolicy` is built from `policy_kwargs`
        critic: Critic to use for the algorithm. If None, a `CriticNetwork` is built from `critic_kwargs`
        policy_kwargs: Keyword arguments for policy. None is treated as an empty dict
        critic_kwargs: Keyword arguments for critic (`num_heads`, `feedforward_hidden`,
            `normalization` are read). None is treated as an empty dict
        **kwargs: Keyword arguments passed to the superclass
    """

    def __init__(
        self,
        env: RL4COEnvBase,
        policy: nn.Module = None,
        critic: CriticNetwork = None,
        policy_kwargs: dict = None,
        critic_kwargs: dict = None,
        **kwargs,
    ):
        # A `{}` default would be one dict object shared by every call; create a
        # fresh one per instantiation instead.
        policy_kwargs = {} if policy_kwargs is None else policy_kwargs
        critic_kwargs = {} if critic_kwargs is None else critic_kwargs

        if policy is None:
            policy = NeuOptPolicy(env_name=env.name, **policy_kwargs)

        if critic is None:
            # the critic's embed_dim must be as policy's
            embed_dim = policy_kwargs.get("embed_dim", 128)

            encoder = MultiHeadAttentionLayer(
                embed_dim,
                critic_kwargs.get("num_heads", 4),
                critic_kwargs.get("feedforward_hidden", 128),
                critic_kwargs.get("normalization", "layer"),
                bias=False,
            )
            value_head = CriticDecoder(embed_dim, dropout_rate=0.001)

            critic = CriticNetwork(
                encoder=encoder,
                value_head=value_head,
                customized=True,
            )

        super().__init__(env, policy, critic, **kwargs)
class CustomizeTSPInitEmbedding(nn.Module):
    """Initial embedding for the Traveling Salesman Problems (TSP).
    Embed the following node features to the embedding space:
        - locs: x, y coordinates of the cities

    Args:
        embed_dim: Output dimension of the embedding
        linear_bias: Whether the two linear layers use a bias term
    """

    def __init__(self, embed_dim, linear_bias=True):
        super(CustomizeTSPInitEmbedding, self).__init__()
        node_dim = 2  # x, y
        # Two-layer MLP: node_dim -> embed_dim // 2 -> embed_dim
        self.init_embed = nn.Sequential(
            nn.Linear(node_dim, embed_dim // 2, linear_bias),
            nn.ReLU(inplace=True),
            nn.Linear(embed_dim // 2, embed_dim, linear_bias),
        )

    def forward(self, td):
        """Embed `td["locs"]` with the MLP and return the result."""
        out = self.init_embed(td["locs"])
        return out


class NeuOptPolicy(ImprovementPolicy):
    """
    NeuOpt Policy based on Ma et al. (2023)
    This model first encodes the input graph and current solution using a N2S encoder (:class:`N2SEncoder`)
    and then decodes the k-opt action (:class:`RDSDecoder`)

    Args:
        embed_dim: Dimension of the node embeddings
        num_encoder_layers: Number of layers in the encoder
        num_heads: Number of heads in the attention layers
        normalization: Normalization type in the attention layers
        feedforward_hidden: Dimension of the hidden layer in the feedforward network
        env_name: Name of the environment used to initialize embeddings
        pos_type: Name of the used positional encoding method (CPE or APE)
        init_embedding: Module to use for the initialization of the embeddings
        pos_embedding: Module to use for the initialization of the positional embeddings
        temperature: Temperature for the softmax
        tanh_clipping: Tanh clipping value (see Bello et al., 2016)
        train_decode_type: Type of decoding to use during training
        val_decode_type: Type of decoding to use during validation
        test_decode_type: Type of decoding to use during testing
    """

    def __init__(
        self,
        embed_dim: int = 128,
        num_encoder_layers: int = 3,
        num_heads: int = 4,
        normalization: str = "layer",
        feedforward_hidden: int = 128,
        env_name: str = "tsp_kopt",
        pos_type: str = "CPE",
        init_embedding: nn.Module = None,
        pos_embedding: nn.Module = None,
        temperature: float = 1.0,
        tanh_clipping: float = 6.0,
        train_decode_type: str = "sampling",
        val_decode_type: str = "sampling",
        test_decode_type: str = "sampling",
    ):
        super(NeuOptPolicy, self).__init__()

        self.env_name = env_name
        self.embed_dim = embed_dim

        # Decoding strategies
        self.temperature = temperature
        self.tanh_clipping = tanh_clipping
        self.train_decode_type = train_decode_type
        self.val_decode_type = val_decode_type
        self.test_decode_type = test_decode_type

        # Encoder and decoder
        if init_embedding is None:
            init_embedding = CustomizeTSPInitEmbedding(self.embed_dim)

        self.encoder = N2SEncoder(
            embed_dim=embed_dim,
            init_embedding=init_embedding,
            pos_embedding=pos_embedding,
            env_name=env_name,
            pos_type=pos_type,
            num_heads=num_heads,
            num_layers=num_encoder_layers,
            normalization=normalization,
            feedforward_hidden=feedforward_hidden,
        )

        self.decoder = RDSDecoder(embed_dim=embed_dim)

        # Projection of the mean node embedding into the initial hidden state,
        # and a learnable first query; the latter is allocated uninitialised and
        # only receives values in init_parameters() below.
        self.init_hidden_W = nn.Linear(self.embed_dim, self.embed_dim)
        self.init_query_learnable = nn.Parameter(torch.Tensor(self.embed_dim))

        self.init_parameters()

    def init_parameters(self) -> None:
        """Re-initialise every parameter of the policy (encoder and decoder included).

        Each parameter is drawn uniformly from [-1/sqrt(d), 1/sqrt(d)], where d
        is the size of that parameter's last dimension. This overwrites any
        initialisation done by the sub-modules themselves.
        """
        for param in self.parameters():
            stdv = 1.0 / math.sqrt(param.size(-1))
            param.data.uniform_(-stdv, stdv)

    def forward(
        self,
        td: TensorDict,
        env: Union[str, RL4COEnvBase] = None,
        phase: str = "train",
        return_actions: bool = True,
        return_embeds: bool = False,
        only_return_embed: bool = False,
        actions=None,
        **decoding_kwargs,
    ) -> dict:
        """Forward pass of the policy.

        Args:
            td: TensorDict containing the environment state
            env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that
                it is more efficient to pass an already instantiated environment each time for fine-grained control
            phase: Phase of the algorithm (train, val, test)
            return_actions: Whether to return the actions
            return_embeds: Whether to add the detached encoder output to the result under "embeds"
            only_return_embed: If True, return `{"embeds": ...}` right after encoding and skip decoding
            actions: Actions to use for evaluating the policy.
                If passed, use these actions instead of sampling from the policy to calculate log likelihood
            decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.

        Returns:
            out: Dictionary containing "log_likelihood" and "cost_bsf", and optionally "embeds" and "actions".
                As a side effect the assembled action is also written to `td["action"]`.
        """

        # Encoder: get encoder output and initial embeddings from initial state
        nfe, _ = self.encoder(td)
        if only_return_embed:
            return {"embeds": nfe.detach()}

        # Instantiate environment if needed
        if isinstance(env, str) or env is None:
            env_name = self.env_name if env is None else env
            log.info(f"Instantiated environment not provided; instantiating {env_name}")
            env = get_env(env_name)
        assert not env.two_opt_mode, "NeuOpt only support k-opt with k > 2"

        # Get decode type depending on phase and whether actions are passed for evaluation
        decode_type = decoding_kwargs.pop("decode_type", None)
        if actions is not None:
            decode_type = "evaluate"
        elif decode_type is None:
            decode_type = getattr(self, f"{phase}_decode_type")

        # Setup decoding strategy
        # we pop arguments that are not part of the decoding strategy
        decode_strategy: DecodingStrategy = get_decoding_strategy(
            decode_type,
            temperature=decoding_kwargs.pop("temperature", self.temperature),
            tanh_clipping=decoding_kwargs.pop("tanh_clipping", self.tanh_clipping),
            mask_logits=True,
            improvement_method_mode=True,
            **decoding_kwargs,
        )

        # Perform the decoding
        # bs / gs are the first two sizes of the encoder output (third is unused);
        # ll accumulates the log-likelihood starting from 0.0.
        bs, gs, _, ll, action_sampled, rec, visited_time = (
            *nfe.size(),
            0.0,
            None,
            td["rec_current"],
            td["visited_time"],
        )
        # Per-step bookkeeping buffers; k_action_left has one extra column that
        # is trimmed back to env.k_max after the loop.
        action_index = torch.zeros(bs, env.k_max, dtype=torch.long).to(rec.device)
        k_action_left = torch.zeros(bs, env.k_max + 1, dtype=torch.long).to(rec.device)
        k_action_right = torch.zeros(bs, env.k_max, dtype=torch.long).to(rec.device)
        next_of_last_action = (
            torch.zeros_like(rec[:, :1], dtype=torch.long).to(rec.device) - 1
        )
        mask = torch.zeros_like(rec, dtype=torch.bool).to(rec.device)
        stopped = torch.ones(bs, dtype=torch.bool).to(rec.device)
        zeros = torch.zeros((bs, 1), device=td.device)

        # init queries
        h_mean = nfe.mean(1)
        init_query = self.init_query_learnable.repeat(bs, 1)
        input_q1 = input_q2 = init_query.clone()
        init_hidden = self.init_hidden_W(h_mean)
        q1 = q2 = init_hidden.clone()

        for i in range(env.k_max):
            # Pass RDS decoder
            logits, q1, q2 = self.decoder(nfe, q1, q2, input_q1, input_q2)

            # Calc probs
            if i == 0 and "action" in td.keys():
                mask = mask.scatter(1, td["action"][:, :1], 1)

            logprob, action_sampled = decode_strategy.step(
                logits,
                ~mask.clone(),
                action=actions[:, i : i + 1].squeeze() if actions is not None else None,
            )
            action_sampled = action_sampled.unsqueeze(-1)
            if i > 0:
                # Instances already stopped keep re-using their first action
                action_sampled = torch.where(
                    stopped.unsqueeze(-1), action_index[:, :1], action_sampled
                )
            # Log-probabilities are only accumulated in the "train" phase;
            # any other phase contributes zeros.
            if phase == "train":
                loss_now = logprob.gather(1, action_sampled)
            else:
                loss_now = zeros.clone()

            # Record log_likelihood and Entropy
            if i > 0:
                ll = ll + torch.where(stopped.unsqueeze(-1), zeros * 0, loss_now)
            else:
                ll = ll + loss_now

            # Store and Process actions
            next_of_new_action = rec.gather(1, action_sampled)
            action_index[:, i] = action_sampled.squeeze().clone()
            k_action_left[stopped, i] = action_sampled[stopped].squeeze().clone()
            k_action_right[~stopped, i - 1] = action_sampled[~stopped].squeeze().clone()
            k_action_left[:, i + 1] = next_of_new_action.squeeze().clone()

            # Prepare next RNN input
            input_q1 = nfe.gather(
                1, action_sampled.view(bs, 1, 1).expand(bs, 1, self.embed_dim)
            ).squeeze(1)
            # `% gs` maps the -1 placeholder onto a valid index; those rows are
            # the stopped ones, which take input_q1 via torch.where anyway.
            input_q2 = torch.where(
                stopped.view(bs, 1).expand(bs, self.embed_dim),
                input_q1.clone(),
                nfe.gather(
                    1,
                    (next_of_last_action % gs)
                    .view(bs, 1, 1)
                    .expand(bs, 1, self.embed_dim),
                ).squeeze(1),
            )

            # Process if k-opt close
            # assert (input_q1[stopped] == input_q2[stopped]).all()
            if i > 0:
                stopped = stopped | (action_sampled == next_of_last_action).squeeze()
            else:
                stopped = (action_sampled == next_of_last_action).squeeze()
            # assert (input_q1[stopped] == input_q2[stopped]).all()

            k_action_left[stopped, i] = k_action_left[stopped, i - 1]
            k_action_right[stopped, i] = k_action_right[stopped, i - 1]

            # Calc next basic masks
            if i == 0:
                # Computed once, relative to the first selected node, and
                # reused by all later iterations.
                visited_time_tag = (
                    visited_time - visited_time.gather(1, action_sampled)
                ) % gs
            mask &= False
            mask[(visited_time_tag <= visited_time_tag.gather(1, action_sampled))] = True
            if i == 0:
                mask[visited_time_tag > (gs - 2)] = True
            mask[stopped, action_sampled[stopped].squeeze()] = (
                False  # allow next k-opt starts immediately
            )
            # if True:#i == env.k_max - 2: # allow special case: close k-opt at the first selected node
            index_allow_first_node = (~stopped) & (
                next_of_new_action.squeeze() == action_index[:, 0]
            )
            mask[index_allow_first_node, action_index[index_allow_first_node, 0]] = False

            # Move to next
            # NOTE: plain assignment aliases the tensor, so the in-place write
            # below also changes next_of_new_action.
            next_of_last_action = next_of_new_action
            next_of_last_action[stopped] = -1

        # Form final action
        k_action_right[~stopped, -1] = k_action_left[~stopped, -1].clone()
        k_action_left = k_action_left[:, : env.k_max]
        action_all = torch.cat((action_index, k_action_left, k_action_right), -1)

        outdict = {"log_likelihood": ll, "cost_bsf": td["cost_bsf"]}
        td.set("action", action_all)

        if return_embeds:
            outdict["embeds"] = nfe.detach()

        if return_actions:
            outdict["actions"] = action_all

        return outdict
@dataclass
class PrecomputedCache:
    """Per-instance tensors computed once before decoding and reused at every step."""

    # Node embeddings kept for later lookup during decoding
    node_embeddings: Tensor
    # Projected graph context, or the scalar 0 when the graph context is disabled
    graph_context: Union[Tensor, float]
    # Three equal-width chunks of the projected node embeddings
    glimpse_key: Tensor
    glimpse_val: Tensor
    logit_key: Tensor


class PolyNetDecoder(AttentionModelDecoder):
    """
    PolyNet decoder for constructing diverse solutions for combinatorial optimization problems.
    Given the environment state and the embeddings, compute the logits and sample actions autoregressively until
    all the environments in the batch have reached a terminal state.
    We additionally include support for multi-starts as it is more efficient to do so in the decoder as we can
    natively perform the attention computation.

    Args:
        k: Number of strategies to learn ("K" in the PolyNet paper)
        encoder_type: Type of encoder that should be used. "AM" or "MatNet" are supported
        embed_dim: Embedding dimension
        poly_layer_dim: Dimension of the PolyNet layers
        num_heads: Number of attention heads
        env_name: Name of the environment used to initialize embeddings
        context_embedding: Context embedding module
        dynamic_embedding: Dynamic embedding module
        mask_inner: Whether to mask the inner loop
        out_bias_pointer_attn: Whether to use a bias in the pointer attention
        linear_bias: Whether to use a bias in the linear layer
        use_graph_context: Whether to use the graph context
        check_nan: Whether to check for nan values during decoding
        sdpa_fn: scaled_dot_product_attention function
        **unused_kwargs: Accepted and ignored
    """

    def __init__(
        self,
        k: int,
        encoder_type: str,
        embed_dim: int = 128,
        poly_layer_dim: int = 256,
        num_heads: int = 8,
        env_name: Union[str, RL4COEnvBase] = "tsp",
        context_embedding: nn.Module = None,
        dynamic_embedding: nn.Module = None,
        mask_inner: bool = True,
        out_bias_pointer_attn: bool = False,
        linear_bias: bool = False,
        use_graph_context: bool = True,
        check_nan: bool = True,
        sdpa_fn: callable = None,
        **unused_kwargs,
    ):
        super().__init__()

        # Accept either an environment instance or its name
        if isinstance(env_name, RL4COEnvBase):
            env_name = env_name.name
        self.env_name = env_name
        self.embed_dim = embed_dim
        self.num_heads = num_heads
        self.encoder_type = encoder_type

        assert embed_dim % num_heads == 0

        self.context_embedding = (
            env_context_embedding(self.env_name, {"embed_dim": embed_dim})
            if context_embedding is None
            else context_embedding
        )
        self.dynamic_embedding = (
            env_dynamic_embedding(self.env_name, {"embed_dim": embed_dim})
            if dynamic_embedding is None
            else dynamic_embedding
        )
        self.is_dynamic_embedding = not isinstance(
            self.dynamic_embedding, StaticEmbedding
        )

        # MHA with Pointer mechanism (https://arxiv.org/abs/1506.03134)
        self.pointer = PolyNetAttention(
            k,
            embed_dim,
            poly_layer_dim,
            num_heads,
            mask_inner=mask_inner,
            out_bias=out_bias_pointer_attn,
            check_nan=check_nan,
            sdpa_fn=sdpa_fn,
        )

        # For each node we compute (glimpse key, glimpse value, logit key) so 3 * embed_dim
        self.project_node_embeddings = nn.Linear(
            embed_dim, 3 * embed_dim, bias=linear_bias
        )
        self.project_fixed_context = nn.Linear(embed_dim, embed_dim, bias=linear_bias)
        self.use_graph_context = use_graph_context

    def _precompute_cache_matnet(
        self, embeddings: Tuple[Tensor, Tensor], *args, **kwargs
    ):
        """Build the cache from a `(col_emb, row_emb)` embedding pair.

        Keys, values and the graph context come from the column embeddings,
        while the row embeddings are stored as the node embeddings.
        """
        col_emb, row_emb = embeddings
        (
            glimpse_key_fixed,
            glimpse_val_fixed,
            logit_key,
        ) = self.project_node_embeddings(
            col_emb
        ).chunk(3, dim=-1)

        # Optionally disable the graph context from the initial embedding as done in POMO
        if self.use_graph_context:
            graph_context = self.project_fixed_context(col_emb.mean(1))
        else:
            graph_context = 0

        # Organize in a dataclass for easy access
        return PrecomputedCache(
            node_embeddings=row_emb,
            graph_context=graph_context,
            glimpse_key=glimpse_key_fixed,
            glimpse_val=glimpse_val_fixed,
            logit_key=logit_key,
        )

    def _precompute_cache(self, embeddings: Tuple[Tensor, Tensor], *args, **kwargs):
        """Dispatch cache construction on `self.encoder_type`.

        Raises:
            ValueError: If `encoder_type` is neither "AM" nor "MatNet". Previously
                this case fell through and returned None, which only failed
                later with an unrelated error.
        """
        if self.encoder_type == "AM":
            return super()._precompute_cache(embeddings, *args, **kwargs)
        if self.encoder_type == "MatNet":
            return self._precompute_cache_matnet(embeddings, *args, **kwargs)
        raise ValueError(
            f"Unsupported encoder_type {self.encoder_type!r}; expected 'AM' or 'MatNet'"
        )
class PolyNet(REINFORCE):
    """PolyNet
    Based on Hottung et al. (2024) https://arxiv.org/abs/2402.14048.

    Note:
        PolyNet allows to learn diverse solution strategies with a single model. This is achieved
        through a modified decoder and the Poppy loss (Grinsztajn et al. (2021)). PolyNet can be used with the attention model encoder or the MatNet encoder by
        setting encoder_type to "AM" or "MatNet", respectively.

    Args:
        env: TorchRL Environment
        policy: Policy to use for the algorithm
        k: Number of strategies to learn ("K" in the paper)
        val_num_solutions: Number of solutions that are generated per instance during validation
        encoder_type: Type of encoder that should be used. "AM" or "MatNet" are supported
        base_model_checkpoint_path: Optional checkpoint whose `state_dict` is loaded
            (non-strictly, after stripping a leading "policy." from each key) into the policy
        policy_kwargs: Keyword arguments for policy. None is treated as an empty dict
        baseline: Baseline to use for the algorithm. Note that PolyNet only supports shared baseline,
            so we will throw an error if anything else is passed.
        num_augment: Number of augmentations (used only for validation and test)
        augment_fn: Function to use for augmentation, defaulting to dihedral8
        first_aug_identity: Whether to include the identity augmentation in the first position
        feats: List of features to augment
        **kwargs: Keyword arguments passed to the superclass
    """

    def __init__(
        self,
        env: RL4COEnvBase,
        policy: PolyNetPolicy = None,
        k: int = 128,
        val_num_solutions: int = 800,
        encoder_type="AM",
        base_model_checkpoint_path: str = None,
        policy_kwargs=None,
        baseline: str = "shared",
        num_augment: int = 8,
        augment_fn: Union[str, callable] = "dihedral8",
        first_aug_identity: bool = True,
        feats: list = None,
        **kwargs,
    ):
        # A `{}` default would be shared across instantiations; build a fresh
        # dict instead. Done before save_hyperparameters() so the value it is
        # expected to snapshot remains a dict — TODO confirm against Lightning.
        policy_kwargs = {} if policy_kwargs is None else policy_kwargs

        self.save_hyperparameters(logger=False)

        self.k = k
        self.val_num_solutions = val_num_solutions

        assert encoder_type in [
            "AM",
            "MatNet",
        ], "Supported encoder types are 'AM' and 'MatNet'"

        assert baseline == "shared", "PolyNet only supports shared baseline"

        if (
            policy_kwargs.get("val_decode_type") == "greedy"
            or policy_kwargs.get("test_decode_type") == "greedy"
        ):
            assert (
                val_num_solutions <= k
            ), "If greedy decoding is used val_num_solutions must be <= k"

        if encoder_type == "MatNet":
            assert (
                num_augment == 1
            ), "MatNet does not use symmetric or dihedral augmentation"

        if policy is None:
            policy = PolyNetPolicy(
                env_name=env.name, k=k, encoder_type=encoder_type, **policy_kwargs
            )

        if base_model_checkpoint_path is not None:
            # Use the module logger for consistency with the rest of the package
            log.info(
                f"Trying to load weights from baseline model {base_model_checkpoint_path}"
            )
            checkpoint = torch.load(base_model_checkpoint_path)
            # Strip only the first "policy." so keys match the bare policy module;
            # `key` (not `k`) avoids confusion with the strategy count above.
            state_dict = {
                key.replace("policy.", "", 1): value
                for key, value in checkpoint["state_dict"].items()
            }
            # strict=False: missing / unexpected keys are tolerated
            policy.load_state_dict(state_dict, strict=False)

        # Validation and test batch sizes default to the training batch size
        train_batch_size = kwargs.get("batch_size", 64)
        kwargs_with_defaults = {
            "val_batch_size": train_batch_size,
            "test_batch_size": train_batch_size,
        }
        kwargs_with_defaults.update(kwargs)

        # Initialize with the shared baseline
        super(PolyNet, self).__init__(env, policy, baseline, **kwargs_with_defaults)

        self.num_augment = num_augment
        if self.num_augment > 1:
            self.augment = StateAugmentation(
                num_augment=self.num_augment,
                augment_fn=augment_fn,
                first_aug_identity=first_aug_identity,
                feats=feats,
            )
        else:
            self.augment = None

        # Add `_multistart` to decode type for train, val and test in policy
        # for phase in ["train", "val", "test"]:
        #     self.set_decode_type_multistart(phase)

    def shared_step(
        self, batch: Any, batch_idx: int, phase: str, dataloader_idx: int = None
    ):
        """Run one train / val / test step.

        Resets the environment, rolls out the policy with `k` starts during
        training or `val_num_solutions` otherwise, computes the loss in the
        train phase and the best multi-start / augmentation results otherwise.

        Returns:
            Dict with "loss" (None outside training) merged with the logged metrics.
        """
        td = self.env.reset(batch)
        n_aug = self.num_augment

        # During training, we do not augment the data
        if phase == "train":
            n_aug = 0
        elif n_aug > 1:
            td = self.augment(td)

        n_start = self.k if phase == "train" else self.val_num_solutions

        # Evaluate policy
        out = self.policy(
            td,
            self.env,
            phase=phase,
            num_starts=n_start,
            multisample=True,
        )

        # Unbatchify reward to [batch_size, num_augment, num_starts].
        reward = unbatchify(out["reward"], (n_aug, n_start))

        # Training phase
        if phase == "train":
            assert n_start > 1, "num_starts must be > 1 during training"
            log_likelihood = unbatchify(out["log_likelihood"], (n_aug, n_start))
            self.calculate_loss(td, batch, out, reward, log_likelihood)
            max_reward, max_idxs = reward.max(dim=-1)
            out.update({"max_reward": max_reward})
        # Get multi-start (=POMO) rewards and best actions only during validation and test
        else:
            if n_start > 1:
                # max multi-start reward
                max_reward, max_idxs = reward.max(dim=-1)
                out.update({"max_reward": max_reward})

                if out.get("actions", None) is not None:
                    # Reshape batch to [batch_size, num_augment, num_starts, ...]
                    actions = unbatchify(out["actions"], (n_aug, n_start))
                    out.update(
                        {
                            "best_multistart_actions": gather_by_index(
                                actions, max_idxs.unsqueeze(2), dim=2
                            )
                        }
                    )
                    out["actions"] = actions

            # Get augmentation score only during inference
            if n_aug > 1:
                # If multistart is enabled, we use the best multistart rewards
                reward_ = max_reward if n_start > 1 else reward
                max_aug_reward, max_idxs = reward_.max(dim=1)
                out.update({"max_aug_reward": max_aug_reward})

                if out.get("actions", None) is not None:
                    actions_ = (
                        out["best_multistart_actions"] if n_start > 1 else out["actions"]
                    )
                    out.update({"best_aug_actions": gather_by_index(actions_, max_idxs)})

        metrics = self.log_metrics(out, phase, dataloader_idx=dataloader_idx)
        return {"loss": out.get("loss", None), **metrics}

    def calculate_loss(
        self,
        td: TensorDict,
        batch: TensorDict,
        policy_out: dict,
        reward: Optional[torch.Tensor] = None,
        log_likelihood: Optional[torch.Tensor] = None,
    ):
        """Calculate loss following Poppy (https://arxiv.org/abs/2210.03475).

        Args:
            td: TensorDict containing the current state of the environment
            batch: Batch of data. This is used to get the extra loss terms, e.g., REINFORCE baseline
            policy_out: Output of the policy network
            reward: Reward tensor. If None, it is taken from `policy_out`
            log_likelihood: Log-likelihood tensor. If None, it is taken from `policy_out`

        Returns:
            `policy_out`, updated in place with "loss", "reinforce_loss",
            "bl_loss" and "bl_val".
        """
        # Extra: this is used for additional loss terms, e.g., REINFORCE baseline
        extra = batch.get("extra", None)
        reward = reward if reward is not None else policy_out["reward"]
        log_likelihood = (
            log_likelihood if log_likelihood is not None else policy_out["log_likelihood"]
        )

        # REINFORCE baseline
        bl_val, bl_loss = (
            self.baseline.eval(td, reward, self.env) if extra is None else (extra, 0)
        )

        # Log-likelihood mask. Mask everything but the best rollout per instance
        # (double argsort turns rewards into ranks along dim 1; rank 0 = best)
        best_idx = (-reward).argsort(1).argsort(1)
        mask = best_idx < 1

        # Main loss function
        advantage = reward - bl_val  # advantage = reward - baseline
        reinforce_loss = -(advantage * log_likelihood * mask).mean()
        loss = reinforce_loss + bl_loss
        policy_out.update(
            {
                "loss": loss,
                "reinforce_loss": reinforce_loss,
                "bl_loss": bl_loss,
                "bl_val": bl_val,
            }
        )
        return policy_out
+ + Note: The default arguments for the AttentionModel encoder follow the POMO paper. The default decoding type + during validation and testing is 'sampling'. + + Args: + k: Number of strategies to learn ("K" in the paper) + encoder_type: Type of encoder that should be used. "AM" or "MatNet" are supported. + embed_dim: Dimension of the node embeddings + num_encoder_layers: Number of layers in the encoder + num_heads: Number of heads in the attention layers + normalization: Normalization type in the attention layers + feedforward_hidden: Dimension of the hidden layer in the feedforward network + env_name: Name of the environment used to initialize embeddings + temperature: Temperature for the softmax + tanh_clipping: Tanh clipping value (see Bello et al., 2016) + mask_logits: Whether to mask the logits during decoding + train_decode_type: Type of decoding to use during training + val_decode_type: Type of decoding to use during validation + test_decode_type: Type of decoding to use during testing + **kwargs: keyword arguments passed to the encoder and decoder modules + """ + + def __init__( + self, + k: int, + encoder: nn.Module = None, + encoder_type: str = "AM", + embed_dim: int = 128, + num_encoder_layers: int = 6, + num_heads: int = 8, + normalization: str = "instance", + feedforward_hidden: int = 512, + env_name: Union[str, RL4COEnvBase] = "tsp", + temperature: float = 1.0, + tanh_clipping: float = 10.0, + mask_logits: bool = True, + train_decode_type: str = "sampling", + val_decode_type: str = "sampling", + test_decode_type: str = "sampling", + **kwargs, + ): + if encoder is None: + if encoder_type == "AM": + encoder = AttentionModelEncoder( + embed_dim=embed_dim, + num_heads=num_heads, + num_layers=num_encoder_layers, + env_name=env_name, + normalization=normalization, + feedforward_hidden=feedforward_hidden, + **kwargs, + ) + elif encoder_type == "MatNet": + kwargs_with_defaults = {"init_embedding_kwargs": {"mode": "RandomOneHot"}} + 
kwargs_with_defaults.update(kwargs) + encoder = MatNetEncoder( + embed_dim=embed_dim, + num_heads=num_heads, + num_layers=num_encoder_layers, + normalization=normalization, + **kwargs_with_defaults, + ) + + decoder = PolyNetDecoder( + k=k, + encoder_type=encoder_type, + embed_dim=embed_dim, + num_heads=num_heads, + env_name=env_name, + **kwargs, + ) + + super(PolyNetPolicy, self).__init__( + encoder=encoder, + decoder=decoder, + env_name=env_name, + temperature=temperature, + tanh_clipping=tanh_clipping, + mask_logits=mask_logits, + train_decode_type=train_decode_type, + val_decode_type=val_decode_type, + test_decode_type=test_decode_type, + **kwargs, + ) diff --git a/rl4co/models/zoo/pomo/__init__.py b/rl4co/models/zoo/pomo/__init__.py new file mode 100644 index 00000000..d16e98d7 --- /dev/null +++ b/rl4co/models/zoo/pomo/__init__.py @@ -0,0 +1 @@ +from .model import POMO diff --git a/rl4co/models/zoo/pomo/model.py b/rl4co/models/zoo/pomo/model.py new file mode 100644 index 00000000..bb361b36 --- /dev/null +++ b/rl4co/models/zoo/pomo/model.py @@ -0,0 +1,148 @@ +from typing import Any, Union + +import torch.nn as nn + +from rl4co.data.transforms import StateAugmentation +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl.reinforce.reinforce import REINFORCE +from rl4co.models.zoo.am import AttentionModelPolicy +from rl4co.utils.ops import gather_by_index, unbatchify +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class POMO(REINFORCE): + """POMO Model for neural combinatorial optimization based on REINFORCE + Based on Kwon et al. (2020) http://arxiv.org/abs/2010.16011. 
+ + Note: + If no policy kwargs is passed, we use the Attention Model policy with the following arguments: + Differently to the base class: + - `num_encoder_layers=6` (instead of 3) + - `normalization="instance"` (instead of "batch") + - `use_graph_context=False` (instead of True) + The latter is due to the fact that the paper does not use the graph context in the policy, which seems to be + helpful in overfitting to the training graph size. + + Args: + env: TorchRL Environment + policy: Policy to use for the algorithm + policy_kwargs: Keyword arguments for policy + baseline: Baseline to use for the algorithm. Note that POMO only supports shared baseline, + so we will throw an error if anything else is passed. + num_augment: Number of augmentations (used only for validation and test) + augment_fn: Function to use for augmentation, defaulting to dihedral8 + first_aug_identity: Whether to include the identity augmentation in the first position + feats: List of features to augment + num_starts: Number of starts for multi-start. 
If None, use the number of available actions + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: nn.Module = None, + policy_kwargs={}, + baseline: str = "shared", + num_augment: int = 8, + augment_fn: Union[str, callable] = "dihedral8", + first_aug_identity: bool = True, + feats: list = None, + num_starts: int = None, + **kwargs, + ): + self.save_hyperparameters(logger=False) + + if policy is None: + policy_kwargs_with_defaults = { + "num_encoder_layers": 6, + "normalization": "instance", + "use_graph_context": False, + } + policy_kwargs_with_defaults.update(policy_kwargs) + policy = AttentionModelPolicy( + env_name=env.name, **policy_kwargs_with_defaults + ) + + assert baseline == "shared", "POMO only supports shared baseline" + + # Initialize with the shared baseline + super(POMO, self).__init__(env, policy, baseline, **kwargs) + + self.num_starts = num_starts + self.num_augment = num_augment + if self.num_augment > 1: + self.augment = StateAugmentation( + num_augment=self.num_augment, + augment_fn=augment_fn, + first_aug_identity=first_aug_identity, + feats=feats, + ) + else: + self.augment = None + + # Add `_multistart` to decode type for train, val and test in policy + for phase in ["train", "val", "test"]: + self.set_decode_type_multistart(phase) + + def shared_step( + self, batch: Any, batch_idx: int, phase: str, dataloader_idx: int = None + ): + td = self.env.reset(batch) + n_aug, n_start = self.num_augment, self.num_starts + n_start = self.env.get_num_starts(td) if n_start is None else n_start + + # During training, we do not augment the data + if phase == "train": + n_aug = 0 + elif n_aug > 1: + td = self.augment(td) + + # Evaluate policy + out = self.policy(td, self.env, phase=phase, num_starts=n_start) + + # Unbatchify reward to [batch_size, num_augment, num_starts]. 
+ reward = unbatchify(out["reward"], (n_aug, n_start)) + + # Training phase + if phase == "train": + assert n_start > 1, "num_starts must be > 1 during training" + log_likelihood = unbatchify(out["log_likelihood"], (n_aug, n_start)) + self.calculate_loss(td, batch, out, reward, log_likelihood) + max_reward, max_idxs = reward.max(dim=-1) + out.update({"max_reward": max_reward}) + # Get multi-start (=POMO) rewards and best actions only during validation and test + else: + if n_start > 1: + # max multi-start reward + max_reward, max_idxs = reward.max(dim=-1) + out.update({"max_reward": max_reward}) + + if out.get("actions", None) is not None: + # Reshape batch to [batch_size, num_augment, num_starts, ...] + actions = unbatchify(out["actions"], (n_aug, n_start)) + out.update( + { + "best_multistart_actions": gather_by_index( + actions, max_idxs, dim=max_idxs.dim() + ) + } + ) + out["actions"] = actions + + # Get augmentation score only during inference + if n_aug > 1: + # If multistart is enabled, we use the best multistart rewards + reward_ = max_reward if n_start > 1 else reward + max_aug_reward, max_idxs = reward_.max(dim=1) + out.update({"max_aug_reward": max_aug_reward}) + + if out.get("actions", None) is not None: + actions_ = ( + out["best_multistart_actions"] if n_start > 1 else out["actions"] + ) + out.update({"best_aug_actions": gather_by_index(actions_, max_idxs)}) + + metrics = self.log_metrics(out, phase, dataloader_idx=dataloader_idx) + return {"loss": out.get("loss", None), **metrics} diff --git a/rl4co/models/zoo/ptrnet/__init__.py b/rl4co/models/zoo/ptrnet/__init__.py new file mode 100644 index 00000000..631b3154 --- /dev/null +++ b/rl4co/models/zoo/ptrnet/__init__.py @@ -0,0 +1,2 @@ +from .model import PointerNetwork +from .policy import PointerNetworkPolicy diff --git a/rl4co/models/zoo/ptrnet/critic.py b/rl4co/models/zoo/ptrnet/critic.py new file mode 100644 index 00000000..efbda9ed --- /dev/null +++ b/rl4co/models/zoo/ptrnet/critic.py @@ -0,0 +1,58 
@@ +import torch +import torch.nn as nn + +from .decoder import SimpleAttention +from .encoder import Encoder + + +class CriticNetworkLSTM(nn.Module): + """Useful as a baseline in REINFORCE updates""" + + def __init__( + self, + embed_dim, + hidden_dim, + n_process_block_iters, + tanh_exploration, + use_tanh, + ): + super(CriticNetworkLSTM, self).__init__() + + self.hidden_dim = hidden_dim + self.n_process_block_iters = n_process_block_iters + + self.encoder = Encoder(embed_dim, hidden_dim) + + self.process_block = SimpleAttention( + hidden_dim, use_tanh=use_tanh, C=tanh_exploration + ) + self.sm = nn.Softmax(dim=1) + self.decoder = nn.Sequential( + nn.Linear(hidden_dim, hidden_dim), nn.ReLU(), nn.Linear(hidden_dim, 1) + ) + + def forward(self, inputs): + """ + Args: + inputs: [embed_dim x batch_size x sourceL] of embedded inputs + """ + inputs = inputs.transpose(0, 1).contiguous() + + encoder_hx = ( + self.encoder.init_hx.unsqueeze(0).repeat(inputs.size(1), 1).unsqueeze(0) + ) + encoder_cx = ( + self.encoder.init_cx.unsqueeze(0).repeat(inputs.size(1), 1).unsqueeze(0) + ) + + # encoder forward pass + enc_outputs, (enc_h_t, enc_c_t) = self.encoder(inputs, (encoder_hx, encoder_cx)) + + # grab the hidden state and process it via the process block + process_block_state = enc_h_t[-1] + for i in range(self.n_process_block_iters): + ref, logits = self.process_block(process_block_state, enc_outputs) + process_block_state = torch.bmm(ref, self.sm(logits).unsqueeze(2)).squeeze(2) + # produce the final scalar output + out = self.decoder(process_block_state) + return out diff --git a/rl4co/models/zoo/ptrnet/decoder.py b/rl4co/models/zoo/ptrnet/decoder.py new file mode 100644 index 00000000..710f03c0 --- /dev/null +++ b/rl4co/models/zoo/ptrnet/decoder.py @@ -0,0 +1,182 @@ +import math + +import torch +import torch.nn as nn +import torch.nn.functional as F + +from rl4co.utils.decoding import decode_logprobs +from rl4co.utils.ops import gather_by_index + + +class 
SimpleAttention(nn.Module): + """A generic attention module for a decoder in seq2seq""" + + def __init__(self, dim, use_tanh=False, C=10): + super(SimpleAttention, self).__init__() + self.use_tanh = use_tanh + self.project_query = nn.Linear(dim, dim) + self.project_ref = nn.Conv1d(dim, dim, 1, 1) + self.C = C # tanh exploration + + self.v = nn.Parameter(torch.FloatTensor(dim)) + self.v.data.uniform_(-(1.0 / math.sqrt(dim)), 1.0 / math.sqrt(dim)) + + def forward(self, query, ref): + """ + Args: + query: is the hidden state of the decoder at the current + time step. batch x dim + ref: the set of hidden states from the encoder. + sourceL x batch x hidden_dim + """ + # ref is now [batch_size x hidden_dim x sourceL] + ref = ref.permute(1, 2, 0) + q = self.project_query(query).unsqueeze(2) # batch x dim x 1 + e = self.project_ref(ref) # batch_size x hidden_dim x sourceL + # expand the query by sourceL + # batch x dim x sourceL + expanded_q = q.repeat(1, 1, e.size(2)) + # batch x 1 x hidden_dim + v_view = self.v.unsqueeze(0).expand(expanded_q.size(0), len(self.v)).unsqueeze(1) + # [batch_size x 1 x hidden_dim] * [batch_size x hidden_dim x sourceL] + u = torch.bmm(v_view, F.tanh(expanded_q + e)).squeeze(1) + if self.use_tanh: + logits = self.C * F.tanh(u) + else: + logits = u + return e, logits + + +class Decoder(nn.Module): + def __init__( + self, + embed_dim: int = 128, + hidden_dim: int = 128, + tanh_exploration: float = 10.0, + use_tanh: bool = True, + num_glimpses=1, + mask_glimpses=True, + mask_logits=True, + ): + super(Decoder, self).__init__() + + self.embed_dim = embed_dim + self.hidden_dim = hidden_dim + self.num_glimpses = num_glimpses + self.mask_glimpses = mask_glimpses + self.mask_logits = mask_logits + self.use_tanh = use_tanh + self.tanh_exploration = tanh_exploration + + self.lstm = nn.LSTMCell(embed_dim, hidden_dim) + self.pointer = SimpleAttention(hidden_dim, use_tanh=use_tanh, C=tanh_exploration) + self.glimpse = SimpleAttention(hidden_dim, 
use_tanh=False) + + def update_mask(self, mask, selected): + return mask.clone().scatter_(1, selected.unsqueeze(-1), False) + + def recurrence(self, x, h_in, prev_mask, prev_idxs, step, context): + logit_mask = ( + self.update_mask(prev_mask, prev_idxs) if prev_idxs is not None else prev_mask + ) + + logits, h_out = self.calc_logits( + x, h_in, logit_mask, context, self.mask_glimpses, self.mask_logits + ) + + # Calculate log_softmax for better numerical stability + log_p = torch.log_softmax(logits, dim=1) + + if not self.mask_logits: + log_p[~logit_mask] = float("-inf") + + return h_out, log_p, logit_mask + + def calc_logits( + self, x, h_in, logit_mask, context, mask_glimpses=None, mask_logits=None + ): + if mask_glimpses is None: + mask_glimpses = self.mask_glimpses + + if mask_logits is None: + mask_logits = self.mask_logits + + hy, cy = self.lstm(x, h_in) + g_l, h_out = hy, (hy, cy) + + for i in range(self.num_glimpses): + ref, logits = self.glimpse(g_l, context) + # For the glimpses, only mask before softmax so we have always an L1 norm 1 readout vector + if mask_glimpses: + logits[~logit_mask] = float("-inf") + # [batch_size x h_dim x sourceL] * [batch_size x sourceL x 1] = + # [batch_size x h_dim x 1] + g_l = torch.bmm(ref, F.softmax(logits, dim=1).unsqueeze(2)).squeeze(2) + _, logits = self.pointer(g_l, context) + + # Masking before softmax makes probs sum to one + if mask_logits: + logits[~logit_mask] = float("-inf") + + return logits, h_out + + def forward( + self, + decoder_input, + embedded_inputs, + hidden, + context, + decode_type="sampling", + eval_tours=None, + ): + """ + Args: + decoder_input: The initial input to the decoder + size is [batch_size x embed_dim]. Trainable parameter. + embedded_inputs: [sourceL x batch_size x embed_dim] + hidden: the prev hidden state, size is [batch_size x hidden_dim]. 
+ Initially this is set to (enc_h[-1], enc_c[-1]) + context: encoder outputs, [sourceL x batch_size x hidden_dim] + """ + + batch_size = context.size(1) + outputs = [] + selections = [] + steps = range(embedded_inputs.size(0)) + idxs = None + mask = torch.ones( + embedded_inputs.size(1), + embedded_inputs.size(0), + dtype=torch.bool, + device=embedded_inputs.device, + ) + + for i in steps: + hidden, log_p, mask = self.recurrence( + decoder_input, hidden, mask, idxs, i, context + ) + # select the next inputs for the decoder [batch_size x hidden_dim] + idxs = ( + decode_logprobs(log_p, mask, decode_type=decode_type) + if eval_tours is None + else eval_tours[:, i] + ) + # select logp of chosen action + log_p = gather_by_index(log_p, idxs, dim=1) + + idxs = ( + idxs.detach() + ) # Otherwise pytorch complains it want's a reward, todo implement this more properly? + # Gather input embedding of selected + decoder_input = torch.gather( + embedded_inputs, + 0, + idxs.contiguous() + .view(1, batch_size, 1) + .expand(1, batch_size, *embedded_inputs.size()[2:]), + ).squeeze(0) + + # use outs to point to next object + outputs.append(log_p) + selections.append(idxs) + return (torch.stack(outputs, 1), torch.stack(selections, 1)), hidden diff --git a/rl4co/models/zoo/ptrnet/encoder.py b/rl4co/models/zoo/ptrnet/encoder.py new file mode 100644 index 00000000..575c7430 --- /dev/null +++ b/rl4co/models/zoo/ptrnet/encoder.py @@ -0,0 +1,29 @@ +import math + +import torch +import torch.nn as nn + + +class Encoder(nn.Module): + """Maps a graph represented as an input sequence + to a hidden vector""" + + def __init__(self, input_dim, hidden_dim): + super(Encoder, self).__init__() + self.hidden_dim = hidden_dim + self.lstm = nn.LSTM(input_dim, hidden_dim) + self.init_hx, self.init_cx = self.init_hidden(hidden_dim) + + def forward(self, x, hidden): + output, hidden = self.lstm(x, hidden) + return output, hidden + + def init_hidden(self, hidden_dim): + """Trainable initial hidden state""" + 
std = 1.0 / math.sqrt(hidden_dim) + enc_init_hx = nn.Parameter(torch.FloatTensor(hidden_dim)) + enc_init_hx.data.uniform_(-std, std) + + enc_init_cx = nn.Parameter(torch.FloatTensor(hidden_dim)) + enc_init_cx.data.uniform_(-std, std) + return enc_init_hx, enc_init_cx diff --git a/rl4co/models/zoo/ptrnet/model.py b/rl4co/models/zoo/ptrnet/model.py new file mode 100644 index 00000000..66381255 --- /dev/null +++ b/rl4co/models/zoo/ptrnet/model.py @@ -0,0 +1,35 @@ +from typing import Union + +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl import REINFORCE +from rl4co.models.rl.reinforce.baselines import REINFORCEBaseline +from rl4co.models.zoo.ptrnet.policy import PointerNetworkPolicy + + +class PointerNetwork(REINFORCE): + """Pointer Network for neural combinatorial optimization based on REINFORCE + Based on Vinyals et al. (2015) https://arxiv.org/abs/1506.03134 + Refactored from reference implementation: https://github.com/wouterkool/attention-learn-to-route + + Args: + env: Environment to use for the algorithm + policy: Policy to use for the algorithm + baseline: REINFORCE baseline. 
Defaults to rollout (1 epoch of exponential, then greedy rollout baseline) + policy_kwargs: Keyword arguments for policy + baseline_kwargs: Keyword arguments for baseline + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: PointerNetworkPolicy = None, + baseline: Union[REINFORCEBaseline, str] = "rollout", + policy_kwargs={}, + baseline_kwargs={}, + **kwargs, + ): + policy = ( + PointerNetworkPolicy(env=env, **policy_kwargs) if policy is None else policy + ) + super().__init__(env, policy, baseline, baseline_kwargs, **kwargs) diff --git a/rl4co/models/zoo/ptrnet/policy.py b/rl4co/models/zoo/ptrnet/policy.py new file mode 100644 index 00000000..dc0373a3 --- /dev/null +++ b/rl4co/models/zoo/ptrnet/policy.py @@ -0,0 +1,107 @@ +import math + +import torch +import torch.nn as nn + +from rl4co.models.zoo.ptrnet.decoder import Decoder +from rl4co.models.zoo.ptrnet.encoder import Encoder +from rl4co.utils.decoding import get_log_likelihood +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class PointerNetworkPolicy(nn.Module): + def __init__( + self, + env_name: str = "tsp", + embed_dim: int = 128, + hidden_dim: int = 128, + tanh_clipping=10.0, + mask_inner=True, + mask_logits=True, + **kwargs, + ): + super(PointerNetworkPolicy, self).__init__() + + assert env_name == "tsp", "Only the Euclidean TSP env is implemented" + self.env_name = env_name + self.input_dim = 2 + + self.encoder = Encoder(embed_dim, hidden_dim) + + self.decoder = Decoder( + embed_dim, + hidden_dim, + tanh_exploration=tanh_clipping, + use_tanh=tanh_clipping > 0, + num_glimpses=1, + mask_glimpses=mask_inner, + mask_logits=mask_logits, + ) + + # Trainable initial hidden states + std = 1.0 / math.sqrt(embed_dim) + self.decoder_in_0 = nn.Parameter(torch.FloatTensor(embed_dim)) + self.decoder_in_0.data.uniform_(-std, std) + + self.embedding = nn.Parameter(torch.FloatTensor(self.input_dim, embed_dim)) + 
self.embedding.data.uniform_(-std, std) + + def forward( + self, + td, + env, + phase: str = "train", + decode_type="sampling", + eval_tours=None, + **unused_kwargs, + ): + if len(unused_kwargs) > 0: + log.info(f"Unused kwargs for {self.__class__.__name__}: {unused_kwargs}") + + # Set train or eval mode. Although this is already done by PyTorch Lightning, + # there still is an exception raised otherwise https://github.com/pytorch/captum/issues/564 + if phase == "train": + self.train() + else: + self.eval() + + batch_size, graph_size, input_dim = td["locs"].size() + + embedded_inputs = torch.mm( + td["locs"].transpose(0, 1).contiguous().view(-1, input_dim), + self.embedding, + ).view(graph_size, batch_size, -1) + + # query the actor net for the input indices + # making up the output, and the pointer attn + _logprobs, actions = self._inner(embedded_inputs, decode_type, eval_tours) + + reward = env.get_reward(td, actions) + + # Log likelyhood is calculated within the model since returning it per action does not work well with + # DataParallel since sequences can be of different lengths + ll = get_log_likelihood(_logprobs, actions, td.get("mask", None)) + + out = {"reward": reward, "log_likelihood": ll, "actions": actions} + return out + + def _inner(self, inputs, decode_type="sampling", eval_tours=None): + encoder_hx = encoder_cx = torch.zeros( + 1, *inputs.shape[1:], device=inputs.device + ) # (1, inputs.size(1), self.encoder.hidden_dim, device=inputs.device, out=inputs.data.new(), requires_grad=False) + + # encoder forward pass + enc_h, (enc_h_t, enc_c_t) = self.encoder(inputs, (encoder_hx, encoder_cx)) + + dec_init_state = (enc_h_t[-1], enc_c_t[-1]) + + # repeat decoder_in_0 across batch + decoder_input = self.decoder_in_0.unsqueeze(0).repeat(inputs.size(1), 1) + + (pointer_probs, input_idxs), dec_hidden_t = self.decoder( + decoder_input, inputs, dec_init_state, enc_h, decode_type, eval_tours + ) + + return pointer_probs, input_idxs diff --git 
a/rl4co/models/zoo/symnco/__init__.py b/rl4co/models/zoo/symnco/__init__.py new file mode 100644 index 00000000..80a9ca2e --- /dev/null +++ b/rl4co/models/zoo/symnco/__init__.py @@ -0,0 +1,2 @@ +from .model import SymNCO +from .policy import SymNCOPolicy diff --git a/rl4co/models/zoo/symnco/losses.py b/rl4co/models/zoo/symnco/losses.py new file mode 100644 index 00000000..38f9265e --- /dev/null +++ b/rl4co/models/zoo/symnco/losses.py @@ -0,0 +1,39 @@ +from einops import rearrange +from torch.nn.functional import cosine_similarity + + +def problem_symmetricity_loss(reward, log_likelihood, dim=1): + """REINFORCE loss for problem symmetricity + Baseline is the average reward for all augmented problems + Corresponds to `L_ps` in the SymNCO paper + """ + num_augment = reward.shape[dim] + if num_augment < 2: + return 0 + advantage = reward - reward.mean(dim=dim, keepdim=True) + loss = -advantage * log_likelihood + return loss.mean() + + +def solution_symmetricity_loss(reward, log_likelihood, dim=-1): + """REINFORCE loss for solution symmetricity + Baseline is the average reward for all start nodes + Corresponds to `L_ss` in the SymNCO paper + """ + num_starts = reward.shape[dim] + if num_starts < 2: + return 0 + advantage = reward - reward.mean(dim=dim, keepdim=True) + loss = -advantage * log_likelihood + return loss.mean() + + +def invariance_loss(proj_embed, num_augment): + """Loss for invariant representation on projected nodes + Corresponds to `L_inv` in the SymNCO paper + """ + pe = rearrange(proj_embed, "(b a) ... 
-> b a ...", a=num_augment) + similarity = sum( + [cosine_similarity(pe[:, 0], pe[:, i], dim=-1) for i in range(1, num_augment)] + ) + return similarity.mean() diff --git a/rl4co/models/zoo/symnco/model.py b/rl4co/models/zoo/symnco/model.py new file mode 100644 index 00000000..93d73d1a --- /dev/null +++ b/rl4co/models/zoo/symnco/model.py @@ -0,0 +1,142 @@ +from typing import Any, Union + +import torch.nn as nn + +from rl4co.data.transforms import StateAugmentation +from rl4co.envs.common.base import RL4COEnvBase +from rl4co.models.rl.reinforce.reinforce import REINFORCE +from rl4co.models.zoo.symnco.losses import ( + invariance_loss, + problem_symmetricity_loss, + solution_symmetricity_loss, +) +from rl4co.models.zoo.symnco.policy import SymNCOPolicy +from rl4co.utils.ops import gather_by_index, get_num_starts, unbatchify +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class SymNCO(REINFORCE): + """SymNCO Model based on REINFORCE with shared baselines. + Based on Kim et al. (2022) https://arxiv.org/abs/2205.13209. + + Args: + env: TorchRL environment to use for the algorithm + policy: Policy to use for the algorithm + policy_kwargs: Keyword arguments for policy + num_augment: Number of augmentations + augment_fn: Function to use for augmentation, defaulting to dihedral_8_augmentation + feats: List of features to augment + alpha: weight for invariance loss + beta: weight for solution symmetricity loss + num_starts: Number of starts for multi-start. 
If None, use the number of available actions + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + env: RL4COEnvBase, + policy: Union[nn.Module, SymNCOPolicy] = None, + policy_kwargs: dict = {}, + baseline: str = "symnco", + num_augment: int = 4, + augment_fn: Union[str, callable] = "symmetric", + feats: list = None, + alpha: float = 0.2, + beta: float = 1, + num_starts: int = 0, + **kwargs, + ): + self.save_hyperparameters(logger=False) + + if policy is None: + policy = SymNCOPolicy(env_name=env.name, **policy_kwargs) + + assert baseline == "symnco", "SymNCO only supports custom-symnco baseline" + baseline = "no" # Pass no baseline to superclass since there are multiple custom baselines + + # Pass no baseline to superclass since there are multiple custom baselines + super().__init__(env, policy, baseline, **kwargs) + + self.num_starts = num_starts + self.num_augment = num_augment + self.augment = StateAugmentation( + num_augment=self.num_augment, augment_fn=augment_fn, feats=feats + ) + self.alpha = alpha # weight for invariance loss + self.beta = beta # weight for solution symmetricity loss + + # Add `_multistart` to decode type for train, val and test in policy if num_starts > 1 + if self.num_starts > 1: + for phase in ["train", "val", "test"]: + self.set_decode_type_multistart(phase) + + def shared_step( + self, batch: Any, batch_idx: int, phase: str, dataloader_idx: int = None + ): + td = self.env.reset(batch) + n_aug, n_start = self.num_augment, self.num_starts + n_start = get_num_starts(td, self.env.name) if n_start is None else n_start + + # Symmetric augmentation + if n_aug > 1: + td = self.augment(td) + + # Evaluate policy + out = self.policy(td, self.env, phase=phase, num_starts=n_start) + + # Unbatchify reward to [batch_size, n_start, n_aug]. 
+ reward = unbatchify(out["reward"], (n_start, n_aug)) + + # Main training loss + if phase == "train": + # [batch_size, n_start, n_aug] + ll = unbatchify(out["log_likelihood"], (n_start, n_aug)) + + # Calculate losses: problem symmetricity, solution symmetricity, invariance + loss_ps = problem_symmetricity_loss(reward, ll) if n_start > 1 else 0 + loss_ss = solution_symmetricity_loss(reward, ll) if n_aug > 1 else 0 + loss_inv = invariance_loss(out["proj_embeddings"], n_aug) if n_aug > 1 else 0 + loss = loss_ps + self.beta * loss_ss + self.alpha * loss_inv + out.update( + { + "loss": loss, + "loss_ss": loss_ss, + "loss_ps": loss_ps, + "loss_inv": loss_inv, + } + ) + + # Log only during validation and test + else: + if n_start > 1: + # max multi-start reward + max_reward, max_idxs = reward.max(dim=1) + out.update({"max_reward": max_reward}) + + # Reshape batch to [batch, n_start, n_aug] + if out.get("actions", None) is not None: + actions = unbatchify(out["actions"], (n_start, n_aug)) + out.update( + {"best_multistart_actions": gather_by_index(actions, max_idxs)} + ) + out["actions"] = actions + + # Get augmentation score only during inference + if n_aug > 1: + # If multistart is enabled, we use the best multistart rewards + reward_ = max_reward if n_start > 1 else reward + max_aug_reward, max_idxs = reward_.max(dim=1) + out.update({"max_aug_reward": max_aug_reward}) + if out.get("best_multistart_actions", None) is not None: + out.update( + { + "best_aug_actions": gather_by_index( + out["best_multistart_actions"], max_idxs + ) + } + ) + + metrics = self.log_metrics(out, phase, dataloader_idx=dataloader_idx) + return {"loss": out.get("loss", None), **metrics} diff --git a/rl4co/models/zoo/symnco/policy.py b/rl4co/models/zoo/symnco/policy.py new file mode 100644 index 00000000..92c69e03 --- /dev/null +++ b/rl4co/models/zoo/symnco/policy.py @@ -0,0 +1,91 @@ +from typing import Union + +import torch.nn as nn + +from tensordict.tensordict import TensorDict +from 
torchrl.modules.models import MLP + +from rl4co.envs import RL4COEnvBase +from rl4co.models.zoo.am import AttentionModelPolicy +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +class SymNCOPolicy(AttentionModelPolicy): + """SymNCO Policy based on AutoregressivePolicy. + This differs from the default :class:`AutoregressivePolicy` in that it + projects the initial embeddings to a lower dimension using a projection head and + returns it. This is used in the SymNCO algorithm to compute the invariance loss. + Based on Kim et al. (2022) https://arxiv.org/abs/2205.13209. + + Args: + embed_dim: Dimension of the embedding + env_name: Name of the environment + num_encoder_layers: Number of layers in the encoder + num_heads: Number of heads in the encoder + normalization: Normalization to use in the encoder + projection_head: Projection head to use + use_projection_head: Whether to use projection head + **kwargs: Keyword arguments passed to the superclass + """ + + def __init__( + self, + embed_dim: int = 128, + env_name: str = "tsp", + num_encoder_layers: int = 3, + num_heads: int = 8, + normalization: str = "batch", + projection_head: nn.Module = None, + use_projection_head: bool = True, + **kwargs, + ): + super(SymNCOPolicy, self).__init__( + env_name=env_name, + embed_dim=embed_dim, + num_encoder_layers=num_encoder_layers, + num_heads=num_heads, + normalization=normalization, + **kwargs, + ) + + self.use_projection_head = use_projection_head + + if self.use_projection_head: + self.projection_head = ( + MLP(embed_dim, embed_dim, 1, embed_dim, nn.ReLU) + if projection_head is None + else projection_head + ) + + def forward( + self, + td: TensorDict, + env: Union[str, RL4COEnvBase] = None, + phase: str = "train", + return_actions: bool = True, + return_init_embeds: bool = True, + **kwargs, + ) -> dict: + super().forward.__doc__ # trick to get docs from parent class + + # Ensure that if use_projection_head is True, then return_init_embeds is 
True + assert not ( + self.use_projection_head and not return_init_embeds + ), "If `use_projection_head` is True, then we must `return_init_embeds`" + + out = super().forward( + td, + env, + phase, + return_actions=return_actions, + return_init_embeds=return_init_embeds, + **kwargs, + ) + + # Project initial embeddings + if self.use_projection_head: + out["proj_embeddings"] = self.projection_head(out["init_embeds"]) + + return out diff --git a/rl4co/tasks/__init__.py b/rl4co/tasks/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/tasks/eval.py b/rl4co/tasks/eval.py new file mode 100644 index 00000000..3f32eacb --- /dev/null +++ b/rl4co/tasks/eval.py @@ -0,0 +1,591 @@ +import time + +import numpy as np +import torch + +from torch.utils.data import DataLoader +from tqdm.auto import tqdm + +from rl4co.data.transforms import StateAugmentation +from rl4co.utils.ops import batchify, gather_by_index, sample_n_random_actions, unbatchify + + +def check_unused_kwargs(class_, kwargs): + if len(kwargs) > 0 and not (len(kwargs) == 1 and "progress" in kwargs): + print(f"Warning: {class_.__class__.__name__} does not use kwargs {kwargs}") + + +class EvalBase: + """Base class for evaluation + + Args: + env: Environment + progress: Whether to show progress bar + **kwargs: Additional arguments (to be implemented in subclasses) + """ + + name = "base" + + def __init__(self, env, progress=True, **kwargs): + check_unused_kwargs(self, kwargs) + self.env = env + self.progress = progress + + def __call__(self, policy, dataloader, **kwargs): + """Evaluate the policy on the given dataloader with **kwargs parameter + self._inner is implemented in subclasses and returns actions and rewards + """ + start = time.time() + + with torch.inference_mode(): + rewards_list = [] + actions_list = [] + + for batch in tqdm( + dataloader, disable=not self.progress, desc=f"Running {self.name}" + ): + td = batch.to(next(policy.parameters()).device) + td = self.env.reset(td) + 
actions, rewards = self._inner(policy, td, **kwargs) + rewards_list.append(rewards) + actions_list.append(actions) + + rewards = torch.cat(rewards_list) + + # Padding: pad actions to the same length with zeros + max_length = max(action.size(-1) for action in actions_list) + actions = torch.cat( + [ + torch.nn.functional.pad(action, (0, max_length - action.size(-1))) + for action in actions_list + ], + 0, + ) + + inference_time = time.time() - start + + tqdm.write(f"Mean reward for {self.name}: {rewards.mean():.4f}") + tqdm.write(f"Time: {inference_time:.4f}s") + + # Empty cache + if torch.cuda.is_available(): + torch.cuda.empty_cache() + + return { + "actions": actions.cpu(), + "rewards": rewards.cpu(), + "inference_time": inference_time, + "avg_reward": rewards.cpu().mean(), + } + + def _inner(self, policy, td): + """Inner function to be implemented in subclasses. + This function returns actions and rewards for the given policy + """ + raise NotImplementedError("Implement in subclass") + + +class GreedyEval(EvalBase): + """Evaluates the policy using greedy decoding and single trajectory""" + + name = "greedy" + + def __init__(self, env, **kwargs): + check_unused_kwargs(self, kwargs) + super().__init__(env, kwargs.get("progress", True)) + + def _inner(self, policy, td): + out = policy( + td.clone(), + decode_type="greedy", + num_starts=0, + ) + rewards = self.env.get_reward(td, out["actions"]) + return out["actions"], rewards + + +class AugmentationEval(EvalBase): + """Evaluates the policy via N state augmentations + `force_dihedral_8` forces the use of 8 augmentations (rotations and flips) as in POMO + https://en.wikipedia.org/wiki/Examples_of_groups#dihedral_group_of_order_8 + + Args: + num_augment (int): Number of state augmentations + force_dihedral_8 (bool): Whether to force the use of 8 augmentations + """ + + name = "augmentation" + + def __init__(self, env, num_augment=8, force_dihedral_8=False, feats=None, **kwargs): + check_unused_kwargs(self, kwargs) + 
super().__init__(env, kwargs.get("progress", True)) + self.augmentation = StateAugmentation( + num_augment=num_augment, + augment_fn="dihedral8" if force_dihedral_8 else "symmetric", + feats=feats, + ) + + def _inner(self, policy, td, num_augment=None): + if num_augment is None: + num_augment = self.augmentation.num_augment + td_init = td.clone() + td = self.augmentation(td) + out = policy(td.clone(), decode_type="greedy", num_starts=0) + + # Move into batches and compute rewards + rewards = self.env.get_reward(batchify(td_init, num_augment), out["actions"]) + rewards = unbatchify(rewards, num_augment) + actions = unbatchify(out["actions"], num_augment) + + # Get best reward and corresponding action + rewards, max_idxs = rewards.max(dim=1) + actions = gather_by_index(actions, max_idxs, dim=1) + return actions, rewards + + @property + def num_augment(self): + return self.augmentation.num_augment + + +class SamplingEval(EvalBase): + """Evaluates the policy via N samples from the policy + + Args: + samples (int): Number of samples to take + softmax_temp (float): Temperature for softmax sampling. 
The higher the temperature, the more random the sampling + """ + + name = "sampling" + + def __init__( + self, + env, + samples, + softmax_temp=None, + select_best=True, + temperature=1.0, + top_p=0.0, + top_k=0, + **kwargs, + ): + check_unused_kwargs(self, kwargs) + super().__init__(env, kwargs.get("progress", True)) + + self.samples = samples + self.softmax_temp = softmax_temp + self.temperature = temperature + self.select_best = select_best + self.top_p = top_p + self.top_k = top_k + + def _inner(self, policy, td): + out = policy( + td.clone(), + decode_type="sampling", + num_starts=self.samples, + temperature=self.temperature, + top_p=self.top_p, + top_k=self.top_k, + multisample=True, + softmax_temp=self.softmax_temp, + select_best=self.select_best, + select_start_nodes_fn=lambda td, _, n: sample_n_random_actions(td, n), + ) + + # Move into batches and compute rewards + rewards = out["reward"] + actions = out["actions"] + + return actions, rewards + + +class GreedyMultiStartEval(EvalBase): + """Evaluates the policy via `num_starts` greedy multistarts samples from the policy + + Args: + num_starts (int): Number of greedy multistarts to use + """ + + name = "multistart_greedy" + + def __init__(self, env, num_starts=None, **kwargs): + check_unused_kwargs(self, kwargs) + super().__init__(env, kwargs.get("progress", True)) + + assert num_starts is not None, "Must specify num_starts" + self.num_starts = num_starts + + def _inner(self, policy, td): + td_init = td.clone() + out = policy( + td.clone(), + decode_type="multistart_greedy", + num_starts=self.num_starts, + ) + + # Move into batches and compute rewards + td = batchify(td_init, self.num_starts) + rewards = self.env.get_reward(td, out["actions"]) + rewards = unbatchify(rewards, self.num_starts) + actions = unbatchify(out["actions"], self.num_starts) + + # Get the best trajectories + rewards, max_idxs = rewards.max(dim=1) + actions = gather_by_index(actions, max_idxs, dim=1) + return actions, rewards + + +class 
GreedyMultiStartAugmentEval(EvalBase): + """Evaluates the policy via `num_starts` samples from the policy + and `num_augment` augmentations of each sample.` + `force_dihedral_8` forces the use of 8 augmentations (rotations and flips) as in POMO + https://en.wikipedia.org/wiki/Examples_of_groups#dihedral_group_of_order_8 + + Args: + num_starts: Number of greedy multistart samples + num_augment: Number of augmentations per sample + force_dihedral_8: If True, force the use of 8 augmentations (rotations and flips) as in POMO + """ + + name = "multistart_greedy_augment" + + def __init__( + self, + env, + num_starts=None, + num_augment=8, + force_dihedral_8=False, + feats=None, + **kwargs, + ): + check_unused_kwargs(self, kwargs) + super().__init__(env, kwargs.get("progress", True)) + + assert num_starts is not None, "Must specify num_starts" + self.num_starts = num_starts + assert not ( + num_augment != 8 and force_dihedral_8 + ), "Cannot force dihedral 8 when num_augment != 8" + self.augmentation = StateAugmentation( + num_augment=num_augment, + augment_fn="dihedral8" if force_dihedral_8 else "symmetric", + feats=feats, + ) + + def _inner(self, policy, td, num_augment=None): + if num_augment is None: + num_augment = self.augmentation.num_augment + + td_init = td.clone() + + td = self.augmentation(td) + out = policy( + td.clone(), + decode_type="multistart_greedy", + num_starts=self.num_starts, + ) + + # Move into batches and compute rewards + td = batchify(td_init, (num_augment, self.num_starts)) + rewards = self.env.get_reward(td, out["actions"]) + rewards = unbatchify(rewards, self.num_starts * num_augment) + actions = unbatchify(out["actions"], self.num_starts * num_augment) + + # Get the best trajectories + rewards, max_idxs = rewards.max(dim=1) + actions = gather_by_index(actions, max_idxs, dim=1) + return actions, rewards + + @property + def num_augment(self): + return self.augmentation.num_augment + + +def get_automatic_batch_size(eval_fn, start_batch_size=8192, 
max_batch_size=4096): + """Automatically reduces the batch size based on the eval function + + Args: + eval_fn: The eval function + start_batch_size: The starting batch size. This should be the theoretical maximum batch size + max_batch_size: The maximum batch size. This is the practical maximum batch size + """ + batch_size = start_batch_size + + effective_ratio = 1 + + if hasattr(eval_fn, "num_starts"): + batch_size = batch_size // (eval_fn.num_starts // 10) + effective_ratio *= eval_fn.num_starts // 10 + if hasattr(eval_fn, "num_augment"): + batch_size = batch_size // eval_fn.num_augment + effective_ratio *= eval_fn.num_augment + if hasattr(eval_fn, "samples"): + batch_size = batch_size // eval_fn.samples + effective_ratio *= eval_fn.samples + + batch_size = min(batch_size, max_batch_size) + # get closest integer power of 2 + batch_size = 2 ** int(np.log2(batch_size)) + + print(f"Effective batch size: {batch_size} (ratio: {effective_ratio})") + + return batch_size + + +def evaluate_policy( + env, + policy, + dataset, + method="greedy", + batch_size=None, + max_batch_size=4096, + start_batch_size=8192, + auto_batch_size=True, + samples=1280, + softmax_temp=1.0, + num_augment=8, + force_dihedral_8=True, + **kwargs, +): + num_loc = getattr(env.generator, "num_loc", None) + + methods_mapping = { + "greedy": {"func": GreedyEval, "kwargs": {}}, + "sampling": { + "func": SamplingEval, + "kwargs": {"samples": samples, "softmax_temp": softmax_temp}, + }, + "multistart_greedy": { + "func": GreedyMultiStartEval, + "kwargs": {"num_starts": num_loc}, + }, + "augment_dihedral_8": { + "func": AugmentationEval, + "kwargs": {"num_augment": num_augment, "force_dihedral_8": force_dihedral_8}, + }, + "augment": {"func": AugmentationEval, "kwargs": {"num_augment": num_augment}}, + "multistart_greedy_augment_dihedral_8": { + "func": GreedyMultiStartAugmentEval, + "kwargs": { + "num_augment": num_augment, + "force_dihedral_8": force_dihedral_8, + "num_starts": num_loc, + }, + }, + 
"multistart_greedy_augment": { + "func": GreedyMultiStartAugmentEval, + "kwargs": {"num_augment": num_augment, "num_starts": num_loc}, + }, + } + + assert method in methods_mapping, "Method {} not found".format(method) + + # Set up the evaluation function + eval_settings = methods_mapping[method] + func, kwargs_ = eval_settings["func"], eval_settings["kwargs"] + # subsitute kwargs with the ones passed in + kwargs_.update(kwargs) + kwargs = kwargs_ + eval_fn = func(env, **kwargs) + + if auto_batch_size: + assert ( + batch_size is None + ), "Cannot specify batch_size when auto_batch_size is True" + batch_size = get_automatic_batch_size( + eval_fn, max_batch_size=max_batch_size, start_batch_size=start_batch_size + ) + print("Using automatic batch size: {}".format(batch_size)) + + # Set up the dataloader + dataloader = DataLoader( + dataset, + batch_size=batch_size, + shuffle=False, + num_workers=0, + collate_fn=dataset.collate_fn, + ) + + # Run evaluation + retvals = eval_fn(policy, dataloader) + + return retvals + + +if __name__ == "__main__": + import argparse + import importlib + import os + import pickle + + import torch + + from rl4co.envs import get_env + + parser = argparse.ArgumentParser() + + # Environment + parser.add_argument("--problem", type=str, default="tsp", help="Problem to solve") + parser.add_argument( + "--generator-params", + type=dict, + default={"num_loc": 50}, + help="Generator parameters for the environment", + ) + parser.add_argument( + "--data-path", + type=str, + default="data/tsp/tsp50_test_seed1234.npz", + help="Path of the test data npz file", + ) + + # Model + parser.add_argument( + "--model", + type=str, + default="AttentionModel", + help="The class name of the valid model", + ) + parser.add_argument( + "--ckpt-path", + type=str, + default="checkpoints/am-tsp50.ckpt", + help="The path of the checkpoint file", + ) + parser.add_argument( + "--device", type=str, default="cuda:1", help="Device to run the evaluation" + ) + + # Evaluation + 
parser.add_argument( + "--method", + type=str, + default="greedy", + help="Evaluation method, support 'greedy', 'sampling',\ + 'multistart_greedy', 'augment_dihedral_8', 'augment', 'multistart_greedy_augment_dihedral_8',\ + 'multistart_greedy_augment'", + ) + parser.add_argument( + "--temperature", type=float, default=1.0, help="Temperature for sampling" + ) + parser.add_argument( + "--top-p", + type=float, + default=0.0, + help="Top-p for sampling, from 0.0 to 1.0, 0.0 means not activated", + ) + parser.add_argument("--top-k", type=int, default=0, help="Top-k for sampling") + parser.add_argument( + "--select-best", + default=True, + action=argparse.BooleanOptionalAction, + help="During sampling, whether to select the best action, use --no-select_best to disable", + ) + parser.add_argument( + "--save-results", + default=True, + action=argparse.BooleanOptionalAction, + help="Whether to save the evaluation results", + ) + parser.add_argument( + "--save-path", + type=str, + default="results", + help="The root path to save the results", + ) + parser.add_argument( + "--num-instances", + type=int, + default=1000, + help="Number of instances to test, maximum 10000", + ) + + parser.add_argument( + "--samples", type=int, default=1280, help="Number of samples for sampling method" + ) + parser.add_argument( + "--softmax-temp", + type=float, + default=1.0, + help="Temperature for softmax in the sampling method", + ) + parser.add_argument( + "--num-augment", + type=int, + default=8, + help="Number of augmentations for augmentation method", + ) + parser.add_argument( + "--force-dihedral-8", + default=True, + action=argparse.BooleanOptionalAction, + help="Force the use of 8 augmentations for augmentation method", + ) + + opts = parser.parse_args() + + # Log the evaluation setting information + print(f"Problem: {opts.problem}-{opts.generator_params['num_loc']}") + print(f"Model: {opts.model}") + print(f"Loading test instances from: {opts.data_path}") + print(f"Loading model 
checkpoint from: {opts.ckpt_path}") + print(f"Using the device: {opts.device}") + print(f"Evaluation method: {opts.method}") + print(f"Number of instances to test: {opts.num_instances}") + + if opts.method == "sampling": + print(f"[Sampling] Number of samples: {opts.samples}") + print(f"[Sampling] Temperature: {opts.temperature}") + print(f"[Sampling] Top-p: {opts.top_p}") + print(f"[Sampling] Top-k: {opts.top_k}") + print(f"[Sampling] Softmax temperature: {opts.softmax_temp}") + print(f"[Sampling] Select best: {opts.select_best}") + + if opts.method == "augment" or opts.method == "augment_dihedral_8": + print(f"[Augmentation] Number of augmentations: {opts.num_augment}") + print(f"[Augmentation] Force dihedral 8: {opts.force_dihedral_8}") + + if opts.save_results: + print(f"Saving the results to: {opts.save_path}") + else: + print("[Warning] The result will not be saved!") + + # Init the environment + env = get_env(opts.problem, generator_params=opts.generator_params) + + # Load the test data + dataset = env.dataset(filename=opts.data_path) + + # Restrict the instances of testing + dataset.data_len = min(opts.num_instances, len(dataset)) + + # Load the model from checkpoint + model_root = importlib.import_module("rl4co.models.zoo") + model_cls = getattr(model_root, opts.model) + model = model_cls.load_from_checkpoint(opts.ckpt_path, load_baseline=False) + model = model.to(opts.device) + + # Evaluate + result = evaluate_policy( + env=env, + policy=model.policy, + dataset=dataset, + method=opts.method, + temperature=opts.temperature, + top_p=opts.top_p, + top_k=opts.top_k, + samples=opts.samples, + softmax_temp=opts.softmax_temp, + num_augment=opts.num_augment, + select_best=True, + force_dihedral_8=True, + ) + + # Save the results + if opts.save_results: + if not os.path.exists(opts.save_path): + os.makedirs(opts.save_path) + save_fname = 
f"{env.name}{env.generator.num_loc}-{opts.model}-{opts.method}-temp-{opts.temperature}-top_p-{opts.top_p}-top_k-{opts.top_k}.pkl" + save_path = os.path.join(opts.save_path, save_fname) + with open(save_path, "wb") as f: + pickle.dump(result, f) diff --git a/rl4co/tasks/index.html b/rl4co/tasks/index.html new file mode 100644 index 00000000..8c8412a7 --- /dev/null +++ b/rl4co/tasks/index.html @@ -0,0 +1,2454 @@ + + + + + + + + + + + + + + + + + + + + + + + Evaluation - RL4CO + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + +
+ + +
+ +
+ + + + + + + + + +
+
+ + + +
+
+
+ + + + + + + +
+
+
+ + + +
+
+
+ + + + + +
+
+
+ + + +
+
+ + + + + + + + + +

Evaluation

+

To evaluate your trained model, here are some steps to follow:

+

Step 1. Prepare your pre-trained model checkpoint and the test-instance data file, and place them wherever you prefer. For example, to test the AttentionModel on TSP50, the layout could be:

+
.
+├── rl4co/
+│   └── ...
+├── checkpoints/
+│   └── am-tsp50.ckpt
+└── data/
+    └── tsp/
+        └── tsp50_test_seed1234.npz
+
+

You can generate the test instances data file by running the following command:

+
python -c "from rl4co.data.generate_data import generate_default_datasets; generate_default_datasets('data')"
+
+

Step 2. Run eval.py with your customized settings. For example, to use the sampling method with a top-p of 0.95:

+
python rl4co/tasks/eval.py --problem tsp --data-path data/tsp/tsp50_test_seed1234.npz --model AttentionModel --ckpt-path checkpoints/am-tsp50.ckpt --method sampling --top-p 0.95
+
+

Arguments guideline:

+
    +
  • --problem: the problem name, e.g., tsp, cvrp, pdp, etc. This should be consistent with the env.name. Default is tsp.
  • +
  • --generator-params: the generator parameters for the test instances. You could specify the num_loc etc. Default is {'num_loc': 50}.
  • +
  • --data-path: the path to the test instances data file. Default is data/tsp/tsp50_test_seed1234.npz.
  • +
  • --model: the model class name, e.g., AttentionModel, POMO, SymNCO, etc. It will be dynamically imported and instantiated. Default is AttentionModel.
  • +
  • --ckpt-path: the path to the pre-trained model checkpoint. Default is checkpoints/am-tsp50.ckpt.
  • +
  • --device: the device to run the evaluation, e.g., cuda:0, cpu, etc. Default is cuda:1.
  • +
  • --method: the evaluation method, e.g., greedy, sampling, multistart_greedy, augment_dihedral_8, augment, multistart_greedy_augment_dihedral_8, and multistart_greedy_augment. Default is greedy.
  • +
  • --save-results: whether to save the evaluation results as a .pkl file. Default is True. The results include actions, rewards, inference_time, and avg_reward.
  • +
  • --save-path: the path to save the evaluation results. Default is results/.
  • +
  • --num-instances: the number of test instances to evaluate. Default is 1000.
  • +
+

If you use the sampling method, you may need to specify the following parameters:

+
    +
  • --samples: the number of samples for the sampling method. Default is 1280.
  • +
  • --temperature: the temperature for the sampling method. Default is 1.0.
  • +
  • --top-p: the top-p for the sampling method. Default is 0.0, i.e. not activated.
  • +
  • --top-k: the top-k for the sampling method. Default is 0, i.e. not activated.
  • +
  • --select-best: whether to select the best action from the sampling results. If False, the results will include all sampled rewards, i.e., [num_instances * num_samples].
  • +
+

If you use the augment method, you may need to specify the following parameters:

+
    +
  • --num-augment: the number of augmented instances for the augment method. Default is 8.
  • +
  • --force-dihedral-8: whether to force the augmented instances to be dihedral 8. Default is True.
  • +
+

Step 3. If you want to launch several evaluations with various parameters, you may refer to the following examples:

+
    +
  • Evaluate POMO on TSP50 with sampling over different top-p values and temperatures:
        #!/bin/bash
    +
    +    top_p_list=(0.5 0.6 0.7 0.8 0.9 0.95 0.98 0.99 0.995 1.0)
    +    temp_list=(0.1 0.3 0.5 0.7 0.8 0.9 1.0 1.1 1.2 1.5 1.8 2.0 2.2 2.5 2.8 3.0)
    +
    +    device=cuda:0
    +
    +    problem=tsp
    +    model=POMO
    +    ckpt_path=checkpoints/pomo-tsp50.ckpt
    +    data_path=data/tsp/tsp50_test_seed1234.npz
    +
    +    num_instances=1000
    +    save_path=results/tsp50-pomo-topp-1k
    +
    +    for top_p in ${top_p_list[@]}; do
    +        for temp in ${temp_list[@]}; do
    +            python rl4co/tasks/eval.py --problem ${problem} --model ${model} --ckpt-path ${ckpt_path} --data-path ${data_path} --save-path ${save_path} --method sampling --temperature=${temp} --top-p=${top_p} --top-k=0 --device ${device}
    +        done
    +    done
    +
    +
  • +
+
    +
  • Evaluate POMO on CVRP50 with sampling over different top-k values and temperatures:
        #!/bin/bash
    +
    +    top_k_list=(5 10 15 20 25)
    +    temp_list=(0.1 0.3 0.5 0.7 0.8 0.9 1.0 1.1 1.2 1.5 1.8 2.0 2.2 2.5 2.8 3.0)
    +
    +    device=cuda:1
    +
    +    problem=cvrp
    +    model=POMO
    +    ckpt_path=checkpoints/pomo-cvrp50.ckpt
    +    data_path=data/vrp/vrp50_test_seed1234.npz
    +
    +    num_instances=1000
    +    save_path=results/cvrp50-pomo-topk-1k
    +
    +    for top_k in ${top_k_list[@]}; do
    +        for temp in ${temp_list[@]}; do
    +            python rl4co/tasks/eval.py --problem ${problem} --model ${model} --ckpt-path ${ckpt_path} --data-path ${data_path} --save-path ${save_path} --method sampling --temperature=${temp} --top-p=0.0 --top-k=${top_k} --device ${device}
    +        done
    +    done
    +
    +
  • +
+ + + + + + + + + + + + + + +
+
+ + + + + +
+ + + +
+ + + +
+
+
+
+ +
+ + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/rl4co/tasks/train.py b/rl4co/tasks/train.py new file mode 100644 index 00000000..b1d104b4 --- /dev/null +++ b/rl4co/tasks/train.py @@ -0,0 +1,117 @@ +from typing import List, Optional, Tuple + +import hydra +import lightning as L +import pyrootutils +import torch + +from lightning import Callback, LightningModule +from lightning.pytorch.loggers import Logger +from omegaconf import DictConfig + +from rl4co import utils +from rl4co.utils import RL4COTrainer + +pyrootutils.setup_root(__file__, indicator=".gitignore", pythonpath=True) + + +log = utils.get_pylogger(__name__) + + +@utils.task_wrapper +def run(cfg: DictConfig) -> Tuple[dict, dict]: + """Trains the model. Can additionally evaluate on a testset, using best weights obtained during + training. + This method is wrapped in optional @task_wrapper decorator, that controls the behavior during + failure. Useful for multiruns, saving info about the crash, etc. + + Args: + cfg (DictConfig): Configuration composed by Hydra. + Returns: + Tuple[dict, dict]: Dict with metrics and dict with all instantiated objects. 
+ """ + + # set seed for random number generators in pytorch, numpy and python.random + if cfg.get("seed"): + L.seed_everything(cfg.seed, workers=True) + + # We instantiate the environment separately and then pass it to the model + log.info(f"Instantiating environment <{cfg.env._target_}>") + env = hydra.utils.instantiate(cfg.env) + + # Note that the RL environment is instantiated inside the model + log.info(f"Instantiating model <{cfg.model._target_}>") + model: LightningModule = hydra.utils.instantiate(cfg.model, env) + + log.info("Instantiating callbacks...") + callbacks: List[Callback] = utils.instantiate_callbacks(cfg.get("callbacks")) + + log.info("Instantiating loggers...") + logger: List[Logger] = utils.instantiate_loggers(cfg.get("logger"), model) + + log.info("Instantiating trainer...") + trainer: RL4COTrainer = hydra.utils.instantiate( + cfg.trainer, + callbacks=callbacks, + logger=logger, + ) + + object_dict = { + "cfg": cfg, + "model": model, + "callbacks": callbacks, + "logger": logger, + "trainer": trainer, + } + + if logger: + log.info("Logging hyperparameters!") + utils.log_hyperparameters(object_dict) + + if cfg.get("compile", False): + log.info("Compiling model!") + model = torch.compile(model) + + if cfg.get("train"): + log.info("Starting training!") + trainer.fit(model=model, ckpt_path=cfg.get("ckpt_path")) + + train_metrics = trainer.callback_metrics + + if cfg.get("test"): + log.info("Starting testing!") + ckpt_path = trainer.checkpoint_callback.best_model_path + if ckpt_path == "": + log.warning("Best ckpt not found! 
Using current weights for testing...") + ckpt_path = None + trainer.test(model=model, ckpt_path=ckpt_path) + log.info(f"Best ckpt path: {ckpt_path}") + + test_metrics = trainer.callback_metrics + + # merge train and test metrics + metric_dict = {**train_metrics, **test_metrics} + + return metric_dict, object_dict + + +@hydra.main(version_base="1.3", config_path="../../configs", config_name="main.yaml") +def train(cfg: DictConfig) -> Optional[float]: + # apply extra utilities + # (e.g. ask for tags if none are provided in cfg, print cfg tree, etc.) + utils.extras(cfg) + + # train the model + metric_dict, _ = run(cfg) + + # safely retrieve metric value for hydra-based hyperparameter optimization + metric_value = utils.get_metric_value( + metric_dict=metric_dict, metric_name=cfg.get("optimized_metric") + ) + + # return optimized metric + return metric_value + + +if __name__ == "__main__": + train() diff --git a/rl4co/utils/__init__.py b/rl4co/utils/__init__.py new file mode 100644 index 00000000..4b0246aa --- /dev/null +++ b/rl4co/utils/__init__.py @@ -0,0 +1,11 @@ +from rl4co.utils.instantiators import instantiate_callbacks, instantiate_loggers +from rl4co.utils.pylogger import get_pylogger +from rl4co.utils.rich_utils import enforce_tags, print_config_tree +from rl4co.utils.trainer import RL4COTrainer +from rl4co.utils.utils import ( + extras, + get_metric_value, + log_hyperparameters, + show_versions, + task_wrapper, +) diff --git a/rl4co/utils/callbacks/__init__.py b/rl4co/utils/callbacks/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/rl4co/utils/callbacks/speed_monitor.py b/rl4co/utils/callbacks/speed_monitor.py new file mode 100644 index 00000000..3f1ab6ae --- /dev/null +++ b/rl4co/utils/callbacks/speed_monitor.py @@ -0,0 +1,123 @@ +# Adapted from https://pytorch-lightning.readthedocs.io/en/latest/_modules/pytorch_lightning/callbacks/gpu_stats_monitor.html#GPUStatsMonitor +# We only need the speed monitoring, not the GPU monitoring 
+import time + +import lightning as L + +from lightning.pytorch.callbacks import Callback +from lightning.pytorch.utilities.parsing import AttributeDict +from lightning.pytorch.utilities.rank_zero import rank_zero_only + + +class SpeedMonitor(Callback): + """Monitor the speed of each step and each epoch.""" + + def __init__( + self, + intra_step_time: bool = True, + inter_step_time: bool = True, + epoch_time: bool = True, + verbose=False, + ): + super().__init__() + self._log_stats = AttributeDict( + { + "intra_step_time": intra_step_time, + "inter_step_time": inter_step_time, + "epoch_time": epoch_time, + } + ) + self.verbose = verbose + + def on_train_start(self, trainer: "L.Trainer", L_module: "L.LightningModule") -> None: + self._snap_epoch_time = None + + def on_train_epoch_start( + self, trainer: "L.Trainer", L_module: "L.LightningModule" + ) -> None: + self._snap_intra_step_time = None + self._snap_inter_step_time = None + self._snap_epoch_time = time.time() + + def on_validation_epoch_start( + self, trainer: "L.Trainer", L_module: "L.LightningModule" + ) -> None: + self._snap_inter_step_time = None + + def on_test_epoch_start( + self, trainer: "L.Trainer", L_module: "L.LightningModule" + ) -> None: + self._snap_inter_step_time = None + + @rank_zero_only + def on_train_batch_start( + self, + trainer: "L.Trainer", + *unused_args, + **unused_kwargs, # easy fix for new pytorch lightning versions + ) -> None: + if self._log_stats.intra_step_time: + self._snap_intra_step_time = time.time() + + if not self._should_log(trainer): + return + + logs = {} + if self._log_stats.inter_step_time and self._snap_inter_step_time: + # First log at beginning of second step + logs["time/inter_step (ms)"] = ( + time.time() - self._snap_inter_step_time + ) * 1000 + + if trainer.logger is not None: + trainer.logger.log_metrics(logs, step=trainer.global_step) + + @rank_zero_only + def on_train_batch_end( + self, + trainer: "L.Trainer", + L_module: "L.LightningModule", + 
*unused_args, + **unused_kwargs, # easy fix for new pytorch lightning versions + ) -> None: + if self._log_stats.inter_step_time: + self._snap_inter_step_time = time.time() + + if ( + self.verbose + and self._log_stats.intra_step_time + and self._snap_intra_step_time + ): + L_module.print( + f"time/intra_step (ms): {(time.time() - self._snap_intra_step_time) * 1000}" + ) + + if not self._should_log(trainer): + return + + logs = {} + if self._log_stats.intra_step_time and self._snap_intra_step_time: + logs["time/intra_step (ms)"] = ( + time.time() - self._snap_intra_step_time + ) * 1000 + + if trainer.logger is not None: + trainer.logger.log_metrics(logs, step=trainer.global_step) + + @rank_zero_only + def on_train_epoch_end( + self, + trainer: "L.Trainer", + L_module: "L.LightningModule", + ) -> None: + logs = {} + if self._log_stats.epoch_time and self._snap_epoch_time: + logs["time/epoch (s)"] = time.time() - self._snap_epoch_time + if trainer.logger is not None: + trainer.logger.log_metrics(logs, step=trainer.global_step) + + @staticmethod + def _should_log(trainer) -> bool: + return ( + trainer.global_step + 1 + ) % trainer.log_every_n_steps == 0 or trainer.should_stop diff --git a/rl4co/utils/decoding.py b/rl4co/utils/decoding.py new file mode 100644 index 00000000..b16e5cf5 --- /dev/null +++ b/rl4co/utils/decoding.py @@ -0,0 +1,606 @@ +import abc + +from typing import Optional, Tuple + +import torch +import torch.nn.functional as F + +from tensordict.tensordict import TensorDict + +from rl4co.envs import RL4COEnvBase +from rl4co.utils.ops import batchify, gather_by_index, unbatchify, unbatchify_and_gather +from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def get_decoding_strategy(decoding_strategy, **config): + strategy_registry = { + "greedy": Greedy, + "sampling": Sampling, + "multistart_greedy": Greedy, + "multistart_sampling": Sampling, + "beam_search": BeamSearch, + "evaluate": Evaluate, + } + + if decoding_strategy not 
in strategy_registry: + log.warning( + f"Unknown decode type '{decoding_strategy}'. Available decode types: {strategy_registry.keys()}. Defaulting to Sampling." + ) + + if "multistart" in decoding_strategy: + config["multistart"] = True + + return strategy_registry.get(decoding_strategy, Sampling)(**config) + + +def get_log_likelihood(logprobs, actions=None, mask=None, return_sum: bool = True): + """Get log likelihood of selected actions. + Note that mask is a boolean tensor where True means the value should be kept. + + Args: + logprobs: Log probabilities of actions from the model (batch_size, seq_len, action_dim). + actions: Selected actions (batch_size, seq_len). + mask: Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch). + return_sum: Whether to return the sum of log probabilities or not. Defaults to True. + """ + # Optional: select logp when logp.shape = (bs, dec_steps, N) + if actions is not None and logprobs.dim() == 3: + logprobs = logprobs.gather(-1, actions.unsqueeze(-1)).squeeze(-1) + + # Optional: mask out actions irrelevant to objective so they do not get reinforced + if mask is not None: + logprobs[~mask] = 0 + + assert ( + logprobs > -1000 + ).data.all(), "Logprobs should not be -inf, check sampling procedure!" + + # Calculate log_likelihood + if return_sum: + return logprobs.sum(1) # [batch] + else: + return logprobs # [batch, decode_len] + + +def decode_logprobs(logprobs, mask, decode_type="sampling"): + """Decode log probabilities to select actions with mask. + Note that mask is a boolean tensor where True means the value should be kept. 
+ """ + if "greedy" in decode_type: + selected = DecodingStrategy.greedy(logprobs, mask) + elif "sampling" in decode_type: + selected = DecodingStrategy.sampling(logprobs, mask) + else: + assert False, "Unknown decode type: {}".format(decode_type) + return selected + + +def random_policy(td): + """Helper function to select a random action from available actions""" + action = torch.multinomial(td["action_mask"].float(), 1).squeeze(-1) + td.set("action", action) + return td + + +def rollout(env, td, policy, max_steps: int = None): + """Helper function to rollout a policy. Currently, TorchRL does not allow to step + over envs when done with `env.rollout()`. We need this because for environments that complete at different steps. + """ + + max_steps = float("inf") if max_steps is None else max_steps + actions = [] + steps = 0 + + while not td["done"].all(): + td = policy(td) + actions.append(td["action"]) + td = env.step(td)["next"] + steps += 1 + if steps > max_steps: + log.info("Max steps reached") + break + return ( + env.get_reward(td, torch.stack(actions, dim=1)), + td, + torch.stack(actions, dim=1), + ) + + +def modify_logits_for_top_k_filtering(logits, top_k): + """Set the logits for none top-k values to -inf. Done out-of-place. + Ref: https://github.com/togethercomputer/stripedhyena/blob/7e13f618027fea9625be1f2d2d94f9a361f6bd02/stripedhyena/sample.py#L6 + """ + indices_to_remove = logits < torch.topk(logits, top_k)[0][..., -1, None] + return logits.masked_fill(indices_to_remove, float("-inf")) + + +def modify_logits_for_top_p_filtering(logits, top_p): + """Set the logits for none top-p values to -inf. Done out-of-place. + Ref: https://github.com/togethercomputer/stripedhyena/blob/7e13f618027fea9625be1f2d2d94f9a361f6bd02/stripedhyena/sample.py#L14 + """ + if top_p <= 0.0 or top_p >= 1.0: + return logits + + # First sort and calculate cumulative sum of probabilities. 
+ sorted_logits, sorted_indices = torch.sort(logits, descending=False) + cumulative_probs = sorted_logits.softmax(dim=-1).cumsum(dim=-1) + + # Remove tokens with cumulative top_p above the threshold (token with 0 are kept) + sorted_indices_to_remove = cumulative_probs <= (1 - top_p) + + # Scatter sorted tensors to original indexing + indices_to_remove = sorted_indices_to_remove.scatter( + -1, sorted_indices, sorted_indices_to_remove + ) + return logits.masked_fill(indices_to_remove, float("-inf")) + + +def process_logits( + logits: torch.Tensor, + mask: torch.Tensor = None, + temperature: float = 1.0, + top_p: float = 0.0, + top_k: int = 0, + tanh_clipping: float = 0, + mask_logits: bool = True, +): + """Convert logits to log probabilities with additional features like temperature scaling, top-k and top-p sampling. + + Note: + We convert to log probabilities instead of probabilities to avoid numerical instability. + This is because, roughly, softmax = exp(logits) / sum(exp(logits)) and log(softmax) = logits - log(sum(exp(logits))), + and avoiding the division by the sum of exponentials can help with numerical stability. + You may check the [official PyTorch documentation](https://pytorch.org/docs/stable/generated/torch.nn.functional.log_softmax.html). + + Args: + logits: Logits from the model (batch_size, num_actions). + mask: Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch). + temperature: Temperature scaling. Higher values make the distribution more uniform (exploration), + lower values make it more peaky (exploitation). + top_p: Top-p sampling, a.k.a. Nucleus Sampling (https://arxiv.org/abs/1904.09751). Remove tokens that have a cumulative probability + less than the threshold 1 - top_p (lower tail of the distribution). If 0, do not perform. + top_k: Top-k sampling, i.e. restrict sampling to the top k logits. If 0, do not perform. Note that we only do filtering and + do not return all the top-k logits here. 
+ tanh_clipping: Tanh clipping (https://arxiv.org/abs/1611.09940). + mask_logits: Whether to mask logits of infeasible actions. + """ + + # Tanh clipping from Bello et al. 2016 + if tanh_clipping > 0: + logits = torch.tanh(logits) * tanh_clipping + + # In RL, we want to mask the logits to prevent the agent from selecting infeasible actions + if mask_logits: + assert mask is not None, "mask must be provided if mask_logits is True" + logits[~mask] = float("-inf") + + logits = logits / temperature # temperature scaling + + if top_k > 0: + top_k = min(top_k, logits.size(-1)) # safety check + logits = modify_logits_for_top_k_filtering(logits, top_k) + + if top_p > 0: + assert top_p <= 1.0, "top-p should be in (0, 1]." + logits = modify_logits_for_top_p_filtering(logits, top_p) + + # Compute log probabilities + return F.log_softmax(logits, dim=-1) + + +class DecodingStrategy(metaclass=abc.ABCMeta): + """Base class for decoding strategies. Subclasses should implement the :meth:`_step` method. + Includes hooks for pre and post main decoding operations. + + Args: + temperature: Temperature scaling. Higher values make the distribution more uniform (exploration), + lower values make it more peaky (exploitation). Defaults to 1.0. + top_p: Top-p sampling, a.k.a. Nucleus Sampling (https://arxiv.org/abs/1904.09751). Defaults to 0.0. + top_k: Top-k sampling, i.e. restrict sampling to the top k logits. If 0, do not perform. Defaults to 0. + mask_logits: Whether to mask logits of infeasible actions. Defaults to True. + tanh_clipping: Tanh clipping (https://arxiv.org/abs/1611.09940). Defaults to 0. + multisample: Whether to use sampling decoding. Defaults to False. + num_samples: Number of samples to evaluate during decoding. Defaults to None. + num_starts: Number of starts for multistart decoding. Defaults to None. + multistart: Whether to use multistart decoding. Defaults to False. + select_start_nodes_fn: Function to select start nodes for multistart decoding. Defaults to None. 
+ improvement_method_mode: Whether to use improvement method mode. Defaults to False. + select_best: Whether to select the best action or return all. Defaults to False. + store_all_logp: Whether to store all log probabilities. Defaults to False. If True, logprobs will be stored for all actions. + Note that this will increase memory usage. + """ + + name = "base" + + def __init__( + self, + temperature: float = 1.0, + top_p: float = 0.0, + top_k: int = 0, + mask_logits: bool = True, + tanh_clipping: float = 0, + num_samples: Optional[int] = None, + multisample: bool = False, + num_starts: Optional[int] = None, + multistart: bool = False, + select_start_nodes_fn: Optional[callable] = None, + improvement_method_mode: bool = False, + select_best: bool = False, + store_all_logp: bool = False, + **kwargs, + ) -> None: + self.temperature = temperature + self.top_p = top_p + self.top_k = top_k + self.mask_logits = mask_logits + self.tanh_clipping = tanh_clipping + # check if multistart (POMO) and multisample flags + assert not ( + multistart and multisample + ), "Using both multistart and multisample is not supported" + if num_samples and num_starts: + assert not ( + num_samples > 1 and num_starts > 1 + ), f"num_samples={num_samples} and num_starts={num_starts} are both > 1" + if num_samples is not None: + multisample = True if num_samples > 1 else False + if num_starts is not None: + multistart = True if num_starts > 1 else False + self.multistart = multistart + self.multisample = multisample + # num_starts is used for both multistart and multisample + # the function is to use start multiple rollouts for the same instance in parallel + self.num_starts = num_starts if multistart else num_samples + + self.select_start_nodes_fn = select_start_nodes_fn + self.improvement_method_mode = improvement_method_mode + self.select_best = select_best + self.store_all_logp = store_all_logp + # initialize buffers + self.actions = [] + self.logprobs = [] + + @abc.abstractmethod + def 
_step( + self, + logprobs: torch.Tensor, + mask: torch.Tensor, + td: TensorDict, + action: torch.Tensor = None, + **kwargs, + ) -> Tuple[torch.Tensor, torch.Tensor, TensorDict]: + """Main decoding operation. This method should be called in a loop until all sequences are done. + + Args: + logprobs: Log probabilities processed from logits of the model. + mask: Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch). + td: TensorDict containing the current state of the environment. + action: Optional action to use, e.g. for evaluating log probabilities. + """ + raise NotImplementedError("Must be implemented by subclass") + + def pre_decoder_hook( + self, td: TensorDict, env: RL4COEnvBase, action: torch.Tensor = None + ): + """Pre decoding hook. This method is called before the main decoding operation.""" + + # Multi-start decoding. If num_starts is None, we use the number of actions in the action mask + if self.multistart or self.multisample: + if self.num_starts is None: + self.num_starts = env.get_num_starts(td) + if self.multisample: + log.warn( + f"num_starts is not provided for sampling, using num_starts={self.num_starts}" + ) + else: + if self.num_starts is not None: + if self.num_starts >= 1: + log.warn( + f"num_starts={self.num_starts} is ignored for decode_type={self.name}" + ) + + self.num_starts = 0 + + # Multi-start decoding: first action is chosen by ad-hoc node selection + if self.num_starts >= 1: + if self.multistart: + if action is None: # if action is provided, we use it as the first action + if self.select_start_nodes_fn is not None: + action = self.select_start_nodes_fn(td, env, self.num_starts) + else: + action = env.select_start_nodes(td, num_starts=self.num_starts) + + # Expand td to batch_size * num_starts + td = batchify(td, self.num_starts) + + td.set("action", action) + td = env.step(td)["next"] + # first logprobs is 0, so p = logprobs.exp() = 1 + if self.store_all_logp: + logprobs = torch.zeros_like(td["action_mask"]) # 
[B, N] + else: + logprobs = torch.zeros_like(action, device=td.device) # [B] + + self.logprobs.append(logprobs) + self.actions.append(action) + else: + # Expand td to batch_size * num_samplestarts + td = batchify(td, self.num_starts) + + return td, env, self.num_starts + + def post_decoder_hook( + self, td: TensorDict, env: RL4COEnvBase + ) -> Tuple[torch.Tensor, torch.Tensor, TensorDict, RL4COEnvBase]: + assert ( + len(self.logprobs) > 0 + ), "No logprobs were collected because all environments were done. Check your initial state" + logprobs = torch.stack(self.logprobs, 1) + actions = torch.stack(self.actions, 1) + if self.num_starts > 0 and self.select_best: + logprobs, actions, td, env = self._select_best(logprobs, actions, td, env) + return logprobs, actions, td, env + + def step( + self, + logits: torch.Tensor, + mask: torch.Tensor, + td: TensorDict = None, + action: torch.Tensor = None, + **kwargs, + ) -> TensorDict: + """Main decoding operation. This method should be called in a loop until all sequences are done. + + Args: + logits: Logits from the model. + mask: Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch). + td: TensorDict containing the current state of the environment. + action: Optional action to use, e.g. for evaluating log probabilities. 
+ """ + if not self.mask_logits: # set mask_logit to None if mask_logits is False + mask = None + + logprobs = process_logits( + logits, + mask, + temperature=self.temperature, + top_p=self.top_p, + top_k=self.top_k, + tanh_clipping=self.tanh_clipping, + mask_logits=self.mask_logits, + ) + logprobs, selected_action, td = self._step( + logprobs, mask, td, action=action, **kwargs + ) + + # directly return for improvement methods, since the action for improvement methods is finalized in its own policy + if self.improvement_method_mode: + return logprobs, selected_action + # for others + if not self.store_all_logp: + logprobs = gather_by_index(logprobs, selected_action, dim=1) + td.set("action", selected_action) + self.actions.append(selected_action) + self.logprobs.append(logprobs) + return td + + @staticmethod + def greedy(logprobs, mask=None): + """Select the action with the highest probability.""" + # [BS], [BS] + selected = logprobs.argmax(dim=-1) + if mask is not None: + assert ( + not (~mask).gather(1, selected.unsqueeze(-1)).data.any() + ), "infeasible action selected" + + return selected + + @staticmethod + def sampling(logprobs, mask=None): + """Sample an action with a multinomial distribution given by the log probabilities.""" + probs = logprobs.exp() + selected = torch.multinomial(probs, 1).squeeze(1) + + if mask is not None: + while (~mask).gather(1, selected.unsqueeze(-1)).data.any(): + log.info("Sampled bad values, resampling!") + selected = probs.multinomial(1).squeeze(1) + assert ( + not (~mask).gather(1, selected.unsqueeze(-1)).data.any() + ), "infeasible action selected" + + return selected + + def _select_best(self, logprobs, actions, td: TensorDict, env: RL4COEnvBase): + rewards = env.get_reward(td, actions) + _, max_idxs = unbatchify(rewards, self.num_starts).max(dim=-1) + + actions = unbatchify_and_gather(actions, max_idxs, self.num_starts) + logprobs = unbatchify_and_gather(logprobs, max_idxs, self.num_starts) + td = unbatchify_and_gather(td, 
max_idxs, self.num_starts) + + return logprobs, actions, td, env + + +class Greedy(DecodingStrategy): + name = "greedy" + + def _step( + self, logprobs: torch.Tensor, mask: torch.Tensor, td: TensorDict, **kwargs + ) -> Tuple[torch.Tensor, torch.Tensor, TensorDict]: + """Select the action with the highest log probability""" + selected = self.greedy(logprobs, mask) + return logprobs, selected, td + + +class Sampling(DecodingStrategy): + name = "sampling" + + def _step( + self, logprobs: torch.Tensor, mask: torch.Tensor, td: TensorDict, **kwargs + ) -> Tuple[torch.Tensor, torch.Tensor, TensorDict]: + """Sample an action with a multinomial distribution given by the log probabilities.""" + selected = self.sampling(logprobs, mask) + return logprobs, selected, td + + +class Evaluate(DecodingStrategy): + name = "evaluate" + + def _step( + self, + logprobs: torch.Tensor, + mask: torch.Tensor, + td: TensorDict, + action: torch.Tensor, + **kwargs, + ) -> Tuple[torch.Tensor, torch.Tensor, TensorDict]: + """The action is provided externally, so we just return the action""" + selected = action + return logprobs, selected, td + + +class BeamSearch(DecodingStrategy): + name = "beam_search" + + def __init__(self, beam_width=None, select_best=True, **kwargs) -> None: + # TODO do we really need all logp in beam search? 
+ kwargs["store_all_logp"] = True + super().__init__(**kwargs) + self.beam_width = beam_width + self.select_best = select_best + self.parent_beam_logprobs = None + self.beam_path = [] + + def _step( + self, logprobs: torch.Tensor, mask: torch.Tensor, td: TensorDict, **kwargs + ) -> Tuple[torch.Tensor, torch.Tensor, TensorDict]: + selected, batch_beam_idx = self._make_beam_step(logprobs) + # select the correct state representation, logprobs and mask according to beam parent + td = td[batch_beam_idx] + logprobs = logprobs[batch_beam_idx] + mask = mask[batch_beam_idx] + + assert ( + not (~mask).gather(1, selected.unsqueeze(-1)).data.any() + ), "infeasible action selected" + + return logprobs, selected, td + + def pre_decoder_hook(self, td: TensorDict, env: RL4COEnvBase, **kwargs): + if self.beam_width is None: + self.beam_width = env.get_num_starts(td) + assert self.beam_width > 1, "beam width must be larger than 1" + + # select start nodes. TODO: include first step in beam search as well + if self.select_start_nodes_fn is not None: + action = self.select_start_nodes_fn(td, env, self.beam_width) + else: + action = env.select_start_nodes(td, num_starts=self.beam_width) + + # Expand td to batch_size * beam_width + td = batchify(td, self.beam_width) + + td.set("action", action) + td = env.step(td)["next"] + + logprobs = torch.zeros_like(td["action_mask"], device=td.device) + beam_parent = torch.zeros(logprobs.size(0), device=td.device, dtype=torch.int32) + + self.logprobs.append(logprobs) + self.actions.append(action) + self.parent_beam_logprobs = logprobs.gather(1, action[..., None]) + self.beam_path.append(beam_parent) + + return td, env, self.beam_width + + def post_decoder_hook(self, td, env): + # [BS*BW, seq_len] + aligned_sequences, aligned_logprobs = self._backtrack() + + if self.select_best: + return self._select_best_beam(aligned_logprobs, aligned_sequences, td, env) + else: + return aligned_logprobs, aligned_sequences, td, env + + def _backtrack(self): + # 
[BS*BW, seq_len] + actions = torch.stack(self.actions, 1) + # [BS*BW, seq_len] + logprobs = torch.stack(self.logprobs, 1) + assert actions.size(1) == len( + self.beam_path + ), "action idx shape and beam path shape dont match" + + # [BS*BW] + cur_parent = self.beam_path[-1] + # [BS*BW] + reversed_aligned_sequences = [actions[:, -1]] + reversed_aligned_logprobs = [logprobs[:, -1]] + + aug_batch_size = actions.size(0) + batch_size = aug_batch_size // self.beam_width + batch_beam_sequence = ( + torch.arange(0, batch_size).repeat(self.beam_width).to(actions.device) + ) + + for k in reversed(range(len(self.beam_path) - 1)): + batch_beam_idx = batch_beam_sequence + cur_parent * batch_size + + reversed_aligned_sequences.append(actions[batch_beam_idx, k]) + reversed_aligned_logprobs.append(logprobs[batch_beam_idx, k]) + cur_parent = self.beam_path[k][batch_beam_idx] + + # [BS*BW, seq_len*num_targets] + actions = torch.stack(list(reversed(reversed_aligned_sequences)), dim=1) + logprobs = torch.stack(list(reversed(reversed_aligned_logprobs)), dim=1) + + return actions, logprobs + + def _select_best_beam(self, logprobs, actions, td: TensorDict, env: RL4COEnvBase): + aug_batch_size = logprobs.size(0) # num nodes + batch_size = aug_batch_size // self.beam_width + rewards = env.get_reward(td, actions) + _, idx = torch.cat(rewards.unsqueeze(1).split(batch_size), 1).max(1) + flat_idx = torch.arange(batch_size, device=rewards.device) + idx * batch_size + return logprobs[flat_idx], actions[flat_idx], td[flat_idx], env + + def _make_beam_step(self, logprobs: torch.Tensor): + aug_batch_size, num_nodes = logprobs.shape # num nodes + batch_size = aug_batch_size // self.beam_width + batch_beam_sequence = ( + torch.arange(0, batch_size).repeat(self.beam_width).to(logprobs.device) + ) + + # [BS*BW, num_nodes] + [BS*BW, 1] -> [BS*BW, num_nodes] + log_beam_prob = logprobs + self.parent_beam_logprobs # + + # [BS, num_nodes * BW] + log_beam_prob_hstacked = 
torch.cat(log_beam_prob.split(batch_size), dim=1) + # [BS, BW] + topk_logprobs, topk_ind = torch.topk( + log_beam_prob_hstacked, self.beam_width, dim=1 + ) + + # [BS*BW, 1] + logprobs_selected = torch.hstack(torch.unbind(topk_logprobs, 1)).unsqueeze(1) + + # [BS*BW, 1] + topk_ind = torch.hstack(torch.unbind(topk_ind, 1)) + + # since we stack the logprobs from the distinct branches, the indices in + # topk dont correspond to node indices directly and need to be translated + selected = topk_ind % num_nodes # determine node index + + # calc parent this branch comes from + beam_parent = (topk_ind // num_nodes).int() + + batch_beam_idx = batch_beam_sequence + beam_parent * batch_size + + self.parent_beam_logprobs = logprobs_selected + self.beam_path.append(beam_parent) + + return selected, batch_beam_idx diff --git a/rl4co/utils/instantiators.py b/rl4co/utils/instantiators.py new file mode 100644 index 00000000..9f4cdaf4 --- /dev/null +++ b/rl4co/utils/instantiators.py @@ -0,0 +1,61 @@ +from typing import List + +import hydra + +from lightning import Callback +from lightning.pytorch.loggers import Logger +from omegaconf import DictConfig + +from rl4co.utils import pylogger + +log = pylogger.get_pylogger(__name__) + + +def instantiate_callbacks(callbacks_cfg: DictConfig) -> List[Callback]: + """Instantiates callbacks from config.""" + + callbacks: List[Callback] = [] + + if not callbacks_cfg: + log.warning("No callback configs found! 
Skipping..") + return callbacks + + if not isinstance(callbacks_cfg, DictConfig): + raise TypeError("Callbacks config must be a DictConfig!") + + for _, cb_conf in callbacks_cfg.items(): + if isinstance(cb_conf, DictConfig) and "_target_" in cb_conf: + log.info(f"Instantiating callback <{cb_conf._target_}>") + callbacks.append(hydra.utils.instantiate(cb_conf)) + + return callbacks + + +def instantiate_loggers(logger_cfg: DictConfig, model) -> List[Logger]: + """Instantiates loggers from config.""" + + logger_list: List[Logger] = [] + + if not logger_cfg: + log.warning("No logger configs found! Skipping...") + return logger_list + + if not isinstance(logger_cfg, DictConfig): + raise TypeError("Logger config must be a DictConfig!") + + for _, lg_conf in logger_cfg.items(): + if isinstance(lg_conf, DictConfig) and "_target_" in lg_conf: + log.info(f"Instantiating logger <{lg_conf._target_}>") + if hasattr(lg_conf, "log_gradients"): + log_gradients = lg_conf.get("log_gradients", False) + # manually remove parameter, since pop doesnt work on DictConfig + del lg_conf.log_gradients + else: + log_gradients = False + logger = hydra.utils.instantiate(lg_conf) + if hasattr(logger, "watch") and log_gradients: + # make use of wandb gradient statistics logger + logger.watch(model, log_graph=False) + logger_list.append(logger) + + return logger_list diff --git a/rl4co/utils/lightning.py b/rl4co/utils/lightning.py new file mode 100644 index 00000000..a3f29cb7 --- /dev/null +++ b/rl4co/utils/lightning.py @@ -0,0 +1,76 @@ +import os + +import lightning as L +import torch + +from omegaconf import DictConfig + +# from rl4co. 
+from rl4co.utils.pylogger import get_pylogger + +log = get_pylogger(__name__) + + +def get_lightning_device(lit_module: L.LightningModule) -> torch.device: + """Get the device of the Lightning module before setup is called + See device setting issue in setup https://github.com/Lightning-AI/lightning/issues/2638 + """ + try: + if lit_module.trainer.strategy.root_device != lit_module.device: + return lit_module.trainer.strategy.root_device + return lit_module.device + except Exception: + return lit_module.device + + +def remove_key(config, key="wandb"): + """Remove keys containing 'key`""" + new_config = {} + for k, v in config.items(): + if key in k: + continue + else: + new_config[k] = v + return new_config + + +def clean_hydra_config( + config, keep_value_only=True, remove_keys="wandb", clean_cfg_path=True +): + """Clean hydra config by nesting dictionary and cleaning values""" + # Remove keys containing `remove_keys` + if not isinstance(remove_keys, list): + remove_keys = [remove_keys] + for key in remove_keys: + config = remove_key(config, key=key) + + new_config = {} + # Iterate over config dictionary + for key, value in config.items(): + # If key contains slash, split it and create nested dictionary recursively + if "/" in key: + keys = key.split("/") + d = new_config + for k in keys[:-1]: + d = d.setdefault(k, {}) + d[keys[-1]] = value["value"] if keep_value_only else value + else: + new_config[key] = value["value"] if keep_value_only else value + + cfg = DictConfig(new_config) + + if clean_cfg_path: + # Clean cfg_path recursively substituting root_dir with cwd + root_dir = cfg.paths.root_dir + + def replace_dir_recursive(d, search, replace): + for k, v in d.items(): + if isinstance(v, dict) or isinstance(v, DictConfig): + replace_dir_recursive(v, search, replace) + elif isinstance(v, str): + if search in v: + d[k] = v.replace(search, replace) + + replace_dir_recursive(cfg, root_dir, os.getcwd()) + + return cfg diff --git a/rl4co/utils/meta_trainer.py 
b/rl4co/utils/meta_trainer.py new file mode 100644 index 00000000..ccd64352 --- /dev/null +++ b/rl4co/utils/meta_trainer.py @@ -0,0 +1,170 @@ +import lightning.pytorch as pl +import torch +import math +import copy +from torch.optim import Adam + +from lightning import Callback +from rl4co import utils +import random +log = utils.get_pylogger(__name__) + + +class ReptileCallback(Callback): + + """ Meta training framework for addressing the generalization issue (implement the Reptile algorithm only) + Based on Manchanda et al. 2022 (https://arxiv.org/abs/2206.00787) and Zhou et al. 2023 (https://arxiv.org/abs/2305.19587) + + Args: + - num_tasks: the number of tasks in a mini-batch, i.e. `B` in the original paper + - alpha: initial weight of the task model for the outer-loop optimization of reptile + - alpha_decay: weight decay of the task model for the outer-loop optimization of reptile + - min_size: minimum problem size of the task (only supported in cross-size generalization) + - max_size: maximum problem size of the task (only supported in cross-size generalization) + - sch_bar: for the task scheduler of size setting, where lr_decay_epoch = sch_bar * epochs, i.e. 
after this epoch, learning rate will decay with a weight 0.1 + - data_type: type of the tasks, chosen from ["size", "distribution", "size_distribution"] + - print_log: whether to print the specific task sampled in each inner-loop optimization + """ + def __init__(self, + num_tasks: int, + alpha: float, + alpha_decay: float, + min_size: int, + max_size: int, + sch_bar: float = 0.9, + data_type: str = "size", + print_log: bool =True): + + super().__init__() + + self.num_tasks = num_tasks + self.alpha = alpha + self.alpha_decay = alpha_decay + self.sch_bar = sch_bar + self.print_log = print_log + self.data_type = data_type + self.task_set = self._generate_task_set(data_type, min_size, max_size) + + def on_fit_start(self, trainer: pl.Trainer, pl_module: pl.LightningModule) -> None: + + # Sample a batch of tasks + self._sample_task() + + # Pre-set the distribution + if self.data_type == "size_distribution": + pl_module.env.generator.loc_distribution = "gaussian_mixture" + self.selected_tasks[0] = (pl_module.env.generator.num_loc, 0, 0) + elif self.data_type == "size": + pl_module.env.generator.loc_distribution = "uniform" + self.selected_tasks[0] = (pl_module.env.generator.num_loc, ) + elif self.data_type == "distribution": + pl_module.env.generator.loc_distribution = "gaussian_mixture" + self.selected_tasks[0] = (0, 0) + self.task_params = self.selected_tasks[0] + + def on_train_epoch_start(self, trainer: pl.Trainer, pl_module: pl.LightningModule) -> None: + + # Alpha scheduler (decay for the update of meta model) + self._alpha_scheduler() + + # Reinitialize the task model with the parameters of the meta model + if trainer.current_epoch % self.num_tasks == 0: # Save the meta model + self.meta_model_state_dict = copy.deepcopy(pl_module.state_dict()) + self.task_models = [] + # Print sampled tasks + if self.print_log: + print('\n>> Meta epoch: {} (Exact epoch: {}), Training task: {}'.format(trainer.current_epoch//self.num_tasks, trainer.current_epoch, 
self.selected_tasks)) + else: + pl_module.load_state_dict(self.meta_model_state_dict) + + # Reinitialize the optimizer every epoch + lr_decay = 0.1 if trainer.current_epoch+1 == int(self.sch_bar * trainer.max_epochs) else 1 + old_lr = trainer.optimizers[0].param_groups[0]['lr'] + new_optimizer = Adam(pl_module.parameters(), lr=old_lr * lr_decay) + trainer.optimizers = [new_optimizer] + + # Print + if self.print_log: + if hasattr(pl_module.env.generator, 'capacity'): + print('>> Training task: {}, capacity: {}'.format(self.task_params, pl_module.env.generator.capacity)) + else: + print('>> Training task: {}'.format(self.task_params)) + + def on_train_epoch_end(self, trainer: pl.Trainer, pl_module: pl.LightningModule): + + # Save the task model + self.task_models.append(copy.deepcopy(pl_module.state_dict())) + if (trainer.current_epoch+1) % self.num_tasks == 0: + # Outer-loop optimization (update the meta model with the parameters of the task model) + with torch.no_grad(): + state_dict = {params_key: (self.meta_model_state_dict[params_key] + + self.alpha * torch.mean(torch.stack([fast_weight[params_key] - self.meta_model_state_dict[params_key] + for fast_weight in self.task_models], dim=0).float(), dim=0)) + for params_key in self.meta_model_state_dict} + pl_module.load_state_dict(state_dict) + + # Get ready for the next meta-training iteration + if (trainer.current_epoch + 1) % self.num_tasks == 0: + # Sample a batch of tasks + self._sample_task() + + # Load new training task (Update the environment) for the next meta-training iteration + self._load_task(pl_module, task_idx = (trainer.current_epoch+1) % self.num_tasks) + + def _sample_task(self): + + # Sample a batch of tasks + self.selected_tasks = [] + for b in range(self.num_tasks): + task_params = random.sample(self.task_set, 1)[0] + self.selected_tasks.append(task_params) + + def _load_task(self, pl_module: pl.LightningModule, task_idx=0): + + # Load new training task (Update the environment) + self.task_params 
= self.selected_tasks[task_idx] + + if self.data_type == "size_distribution": + assert len(self.task_params) == 3 + pl_module.env.generator.num_loc = self.task_params[0] + pl_module.env.generator.num_modes = self.task_params[1] + pl_module.env.generator.cdist = self.task_params[2] + elif self.data_type == "distribution": # fixed size + assert len(self.task_params) == 2 + pl_module.env.generator.num_modes = self.task_params[0] + pl_module.env.generator.cdist = self.task_params[1] + elif self.data_type == "size": # fixed distribution + assert len(self.task_params) == 1 + pl_module.env.generator.num_loc = self.task_params[0] + + if hasattr(pl_module.env.generator, 'capacity') and self.data_type in ["size_distribution", "size"]: + task_capacity = math.ceil(30 + self.task_params[0] / 5) if self.task_params[0] >= 20 else 20 + pl_module.env.generator.capacity = task_capacity + + def _alpha_scheduler(self): + self.alpha = max(self.alpha * self.alpha_decay, 0.0001) + + def _generate_task_set(self, data_type, min_size, max_size): + """ + Following the setting in Zhou et al. 
2023 (https://arxiv.org/abs/2305.19587) + Current setting: + size: (n,) \in [20, 150] + distribution: (m, c) \in {(0, 0) + [1-9] * [1, 10, 20, 30, 40, 50]} + size_distribution: (n, m, c) \in [50, 200, 5] * {(0, 0) + (1, 1) + [3, 5, 7] * [10, 30, 50]} + """ + + if data_type == "distribution": # focus on TSP100 with gaussian mixture distributions + task_set = [(0, 0)] + [(m, c) for m in range(1, 10) for c in [1, 10, 20, 30, 40, 50]] + elif data_type == "size": # focus on uniform distribution with different sizes + task_set = [(n,) for n in range(min_size, max_size + 1)] + elif data_type == "size_distribution": + dist_set = [(0, 0), (1, 1)] + [(m, c) for m in [3, 5, 7] for c in [10, 30, 50]] + task_set = [(n, m, c) for n in range(50, 201, 5) for (m, c) in dist_set] + else: + raise NotImplementedError + + print(">> Generating training task set: {} tasks with type {}".format(len(task_set), data_type)) + print(">> Training task set: {}".format(task_set)) + + return task_set + diff --git a/rl4co/utils/ops.py b/rl4co/utils/ops.py new file mode 100644 index 00000000..b78821dc --- /dev/null +++ b/rl4co/utils/ops.py @@ -0,0 +1,262 @@ +from functools import lru_cache +from typing import Optional, Union + +import torch + +from einops import rearrange +from tensordict import TensorDict +from torch import Tensor + + +def _batchify_single( + x: Union[Tensor, TensorDict], repeats: int +) -> Union[Tensor, TensorDict]: + """Same as repeat on dim=0 for Tensordicts as well""" + s = x.shape + return x.expand(repeats, *s).contiguous().view(s[0] * repeats, *s[1:]) + + +def batchify( + x: Union[Tensor, TensorDict], shape: Union[tuple, int] +) -> Union[Tensor, TensorDict]: + """Same as `einops.repeat(x, 'b ... -> (b r) ...', r=repeats)` but ~1.5x faster and supports TensorDicts. + Repeats batchify operation `n` times as specified by each shape element. + If shape is a tuple, iterates over each element and repeats that many times to match the tuple shape. 
+ + Example: + >>> x.shape: [a, b, c, ...] + >>> shape: [a, b, c] + >>> out.shape: [a*b*c, ...] + """ + shape = [shape] if isinstance(shape, int) else shape + for s in reversed(shape): + x = _batchify_single(x, s) if s > 0 else x + return x + + +def _unbatchify_single( + x: Union[Tensor, TensorDict], repeats: int +) -> Union[Tensor, TensorDict]: + """Undoes batchify operation for Tensordicts as well""" + s = x.shape + return x.view(repeats, s[0] // repeats, *s[1:]).permute(1, 0, *range(2, len(s) + 1)) + + +def unbatchify( + x: Union[Tensor, TensorDict], shape: Union[tuple, int] +) -> Union[Tensor, TensorDict]: + """Same as `einops.rearrange(x, '(r b) ... -> b r ...', r=repeats)` but ~2x faster and supports TensorDicts + Repeats unbatchify operation `n` times as specified by each shape element + If shape is a tuple, iterates over each element and unbatchifies that many times to match the tuple shape. + + Example: + >>> x.shape: [a*b*c, ...] + >>> shape: [a, b, c] + >>> out.shape: [a, b, c, ...] 
+ """ + shape = [shape] if isinstance(shape, int) else shape + for s in reversed( + shape + ): # we need to reverse the shape to unbatchify in the right order + x = _unbatchify_single(x, s) if s > 0 else x + return x + + +def gather_by_index(src, idx, dim=1, squeeze=True): + """Gather elements from src by index idx along specified dim + + Example: + >>> src: shape [64, 20, 2] + >>> idx: shape [64, 3)] # 3 is the number of idxs on dim 1 + >>> Returns: [64, 3, 2] # get the 3 elements from src at idx + """ + expanded_shape = list(src.shape) + expanded_shape[dim] = -1 + idx = idx.view(idx.shape + (1,) * (src.dim() - idx.dim())).expand(expanded_shape) + squeeze = idx.size(dim) == 1 and squeeze + return src.gather(dim, idx).squeeze(dim) if squeeze else src.gather(dim, idx) + + +def unbatchify_and_gather(x: Tensor, idx: Tensor, n: int): + """first unbatchify a tensor by n and then gather (usually along the unbatchified dimension) + by the specified index + """ + x = unbatchify(x, n) + return gather_by_index(x, idx, dim=idx.dim()) + + +def get_distance(x: Tensor, y: Tensor): + """Euclidean distance between two tensors of shape `[..., n, dim]`""" + return (x - y).norm(p=2, dim=-1) + + +def get_tour_length(ordered_locs): + """Compute the total tour distance for a batch of ordered tours. + Computes the L2 norm between each pair of consecutive nodes in the tour and sums them up. + + Args: + ordered_locs: Tensor of shape [batch_size, num_nodes, 2] containing the ordered locations of the tour + """ + ordered_locs_next = torch.roll(ordered_locs, -1, dims=-2) + return get_distance(ordered_locs_next, ordered_locs).sum(-1) + + +def get_distance_matrix(locs: Tensor): + """Compute the euclidean distance matrix for the given coordinates. 
+ + Args: + locs: Tensor of shape [..., n, dim] + """ + distance = (locs[..., :, None, :] - locs[..., None, :, :]).norm(p=2, dim=-1) + return distance + + +def calculate_entropy(logprobs: Tensor): + """Calculate the entropy of the log probabilities distribution + logprobs: Tensor of shape [batch, decoder_steps, num_actions] + """ + logprobs = torch.nan_to_num(logprobs, nan=0.0) + entropy = -(logprobs.exp() * logprobs).sum(dim=-1) # [batch, decoder steps] + entropy = entropy.sum(dim=1) # [batch] -- sum over decoding steps + assert entropy.isfinite().all(), "Entropy is not finite" + return entropy + + +# TODO: modularize inside the envs +def get_num_starts(td, env_name=None): + """Returns the number of possible start nodes for the environment based on the action mask""" + num_starts = td["action_mask"].shape[-1] + if env_name == "pdp": + num_starts = ( + num_starts - 1 + ) // 2 # only half of the nodes (i.e. pickup nodes) can be start nodes + elif env_name in ["cvrp", "cvrptw", "sdvrp", "mtsp", "op", "pctsp", "spctsp"]: + num_starts = num_starts - 1 # depot cannot be a start node + + return num_starts + + +def select_start_nodes(td, env, num_starts): + """Node selection strategy as proposed in POMO (Kwon et al. 2020) + and extended in SymNCO (Kim et al. 2022). + Selects different start nodes for each batch element + + Args: + td: TensorDict containing the data. We may need to access the available actions to select the start nodes + env: Environment may determine the node selection strategy + num_starts: Number of nodes to select. This may be passed when calling the policy directly. 
See :class:`rl4co.models.AutoregressiveDecoder` + """ + num_loc = env.generator.num_loc if hasattr(env.generator, "num_loc") else 0xFFFFFFFF + if env.name in ["tsp", "atsp", "flp", "mcp"]: + selected = ( + torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0]) + % num_loc + ) + elif env.name in ["jssp", "fjsp"]: + raise NotImplementedError("Multistart not yet supported for FJSP/JSSP") + else: + # Environments with depot: we do not select the depot as a start node + selected = ( + torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0]) + % num_loc + + 1 + ) + if env.name == "op": + if (td["action_mask"][..., 1:].float().sum(-1) < num_starts).any(): + # for the orienteering problem, we may have some nodes that are not available + # so we need to resample from the distribution of available nodes + selected = ( + torch.multinomial( + td["action_mask"][..., 1:].float(), num_starts, replacement=True + ) + + 1 + ) # re-add depot index + selected = rearrange(selected, "b n -> (n b)") + return selected + + +def get_best_actions(actions, max_idxs): + actions = unbatchify(actions, max_idxs.shape[0]) + return actions.gather(0, max_idxs[..., None, None]) + + +def sparsify_graph(cost_matrix: Tensor, k_sparse: Optional[int] = None, self_loop=False): + """Generate a sparsified graph for the cost_matrix by selecting k edges with the lowest cost for each node. + + Args: + cost_matrix: Tensor of shape [m, n] + k_sparse: Number of edges to keep for each node. Defaults to max(n//5, 10) if not provided. + self_loop: Include self-loop edges in the generated graph when m==n. Defaults to False. 
+ """ + m, n = cost_matrix.shape + k_sparse = max(n // 5, 10) if k_sparse is None else k_sparse + + # fill diagonal value with +inf to exclude them from topk results + if not self_loop and m == n: + # k_sparse should not exceed n-1 in this occasion + k_sparse = min(k_sparse, n - 1) + cost_matrix.fill_diagonal_(torch.inf) + + # select top-k edges with least cost + topk_values, topk_indices = torch.topk( + cost_matrix, k=k_sparse, dim=-1, largest=False, sorted=False + ) + + # generate PyG-compatiable edge_index + edge_index_u = torch.repeat_interleave( + torch.arange(m, device=cost_matrix.device), topk_indices.shape[1] + ) + edge_index_v = topk_indices.flatten() + edge_index = torch.stack([edge_index_u, edge_index_v]) + + edge_attr = topk_values.flatten().unsqueeze(-1) + return edge_index, edge_attr + + +@lru_cache(5) +def get_full_graph_edge_index(num_node: int, self_loop=False) -> Tensor: + adj_matrix = torch.ones(num_node, num_node) + if not self_loop: + adj_matrix.fill_diagonal_(0) + edge_index = torch.permute(torch.nonzero(adj_matrix), (1, 0)) + return edge_index + + +def adj_to_pyg_edge_index(adj: Tensor) -> Tensor: + """transforms an adjacency matrix (boolean) to a Tensor with the respective edge + indices (in the format required by the pytorch geometric module). + + :param Tensor adj: shape=(bs, num_nodes, num_nodes) + :return Tensor: shape=(2, num_edges) + """ + assert adj.size(1) == adj.size(2), "only symmetric adjacency matrices are supported" + num_nodes = adj.size(1) + # (num_edges, 3) + edge_idx = adj.nonzero() + batch_idx = edge_idx[:, 0] * num_nodes + # PyG expects a "single, flat graph", in which the graphs of the batch are not connected. 
+ # Therefore, add the batch_idx to edge_idx to have unique indices + flat_edge_idx = edge_idx[:, 1:] + batch_idx[:, None] + # (2, num_edges) + flat_edge_idx = torch.permute(flat_edge_idx, (1, 0)) + return flat_edge_idx + + +def sample_n_random_actions(td: TensorDict, n: int): + """Helper function to sample n random actions from available actions. If + number of valid actions is less then n, we sample with replacement from the + valid actions + """ + action_mask = td["action_mask"] + # check whether to use replacement or not + n_valid_actions = torch.sum(action_mask[:, 1:], 1).min() + if n_valid_actions < n: + replace = True + else: + replace = False + ps = torch.rand((action_mask.shape)) + ps[~action_mask] = -torch.inf + ps = torch.softmax(ps, dim=1) + selected = torch.multinomial(ps, n, replacement=replace).squeeze(1) + selected = rearrange(selected, "b n -> (n b)") + return selected.to(td.device) diff --git a/rl4co/utils/optim_helpers.py b/rl4co/utils/optim_helpers.py new file mode 100644 index 00000000..46367a37 --- /dev/null +++ b/rl4co/utils/optim_helpers.py @@ -0,0 +1,38 @@ +import inspect + +import torch +from torch.optim import Optimizer + + +def get_pytorch_lr_schedulers(): + """Get all learning rate schedulers from `torch.optim.lr_scheduler`""" + return torch.optim.lr_scheduler.__all__ + + +def get_pytorch_optimizers(): + """Get all optimizers from `torch.optim`""" + optimizers = [] + for name, obj in inspect.getmembers(torch.optim): + if inspect.isclass(obj) and issubclass(obj, Optimizer): + optimizers.append(name) + return optimizers + + +def create_optimizer(parameters, optimizer_name: str, **optimizer_kwargs) -> Optimizer: + """Create optimizer for model. 
If `optimizer_name` is not found, raise ValueError.""" + if optimizer_name in get_pytorch_optimizers(): + optimizer_cls = getattr(torch.optim, optimizer_name) + return optimizer_cls(parameters, **optimizer_kwargs) + else: + raise ValueError(f"Optimizer {optimizer_name} not found.") + + +def create_scheduler( + optimizer: Optimizer, scheduler_name: str, **scheduler_kwargs +) -> torch.optim.lr_scheduler.LRScheduler: + """Create scheduler for optimizer. If `scheduler_name` is not found, raise ValueError.""" + if scheduler_name in get_pytorch_lr_schedulers(): + scheduler_cls = getattr(torch.optim.lr_scheduler, scheduler_name) + return scheduler_cls(optimizer, **scheduler_kwargs) + else: + raise ValueError(f"Scheduler {scheduler_name} not found.") diff --git a/rl4co/utils/pylogger.py b/rl4co/utils/pylogger.py new file mode 100644 index 00000000..aa1b5f1a --- /dev/null +++ b/rl4co/utils/pylogger.py @@ -0,0 +1,25 @@ +import logging + +from lightning.pytorch.utilities.rank_zero import rank_zero_only + + +def get_pylogger(name=__name__) -> logging.Logger: + """Initializes multi-GPU-friendly python command line logger.""" + + logger = logging.getLogger(name) + + # this ensures all logging levels get marked with the rank zero decorator + # otherwise logs would get multiplied for each GPU process in multi-GPU setup + logging_levels = ( + "debug", + "info", + "warning", + "error", + "exception", + "fatal", + "critical", + ) + for level in logging_levels: + setattr(logger, level, rank_zero_only(getattr(logger, level))) + + return logger diff --git a/rl4co/utils/rich_utils.py b/rl4co/utils/rich_utils.py new file mode 100644 index 00000000..652ba568 --- /dev/null +++ b/rl4co/utils/rich_utils.py @@ -0,0 +1,97 @@ +from pathlib import Path +from typing import Sequence + +import rich +import rich.syntax +import rich.tree + +from hydra.core.hydra_config import HydraConfig +from lightning.pytorch.utilities.rank_zero import rank_zero_only +from omegaconf import DictConfig, OmegaConf, 
open_dict +from rich.prompt import Prompt + +from rl4co.utils.utils import pylogger + +log = pylogger.get_pylogger(__name__) + + +@rank_zero_only +def print_config_tree( + cfg: DictConfig, + print_order: Sequence[str] = ( + # "data", # note: data is dealt with in model + "model", + "callbacks", + "logger", + "trainer", + "paths", + "extras", + ), + resolve: bool = True, + save_to_file: bool = False, +) -> None: + """Prints content of DictConfig using Rich library and its tree structure. + Args: + cfg (DictConfig): Configuration composed by Hydra. + print_order (Sequence[str], optional): Determines in what order config components are printed. + resolve (bool, optional): Whether to resolve reference fields of DictConfig. + save_to_file (bool, optional): Whether to export config to the hydra output folder. + """ + + style = "dim" + tree = rich.tree.Tree("CONFIG", style=style, guide_style=style) + + queue = [] + + # add fields from `print_order` to queue + for field in print_order: + queue.append(field) if field in cfg else log.warning( + f"Field '{field}' not found in config. Skipping '{field}' config printing..." 
+ ) + + # add all the other fields to queue (not specified in `print_order`) + for field in cfg: + if field not in queue: + queue.append(field) + + # generate config tree from queue + for field in queue: + branch = tree.add(field, style=style, guide_style=style) + + config_group = cfg[field] + if isinstance(config_group, DictConfig): + branch_content = OmegaConf.to_yaml(config_group, resolve=resolve) + else: + branch_content = str(config_group) + + branch.add(rich.syntax.Syntax(branch_content, "yaml")) + + # print config tree + rich.print(tree) + + # save config tree to file + if save_to_file: + with open(Path(cfg.paths.output_dir, "config_tree.log"), "w") as file: + rich.print(tree, file=file) + + +@rank_zero_only +def enforce_tags(cfg: DictConfig, save_to_file: bool = False) -> None: + """Prompts user to input tags from command line if no tags are provided in config.""" + + if not cfg.get("tags"): + if "id" in HydraConfig().cfg.hydra.job: + raise ValueError("Specify tags before launching a multirun!") + + log.warning("No tags provided in config. 
Prompting user to input tags...") + tags = Prompt.ask("Enter a list of comma separated tags", default="dev") + tags = [t.strip() for t in tags.split(",") if t != ""] + + with open_dict(cfg): + cfg.tags = tags + + log.info(f"Tags: {cfg.tags}") + + if save_to_file: + with open(Path(cfg.paths.output_dir, "tags.log"), "w") as file: + rich.print(cfg.tags, file=file) diff --git a/rl4co/utils/test_utils.py b/rl4co/utils/test_utils.py new file mode 100644 index 00000000..60e2a327 --- /dev/null +++ b/rl4co/utils/test_utils.py @@ -0,0 +1,71 @@ +from torch.utils.data import DataLoader + +from rl4co.envs import ( + CVRPEnv, + CVRPTWEnv, + DPPEnv, + MDPPEnv, + MTSPEnv, + OPEnv, + PCTSPEnv, + PDPEnv, + PDPRuinRepairEnv, + SDVRPEnv, + SMTWTPEnv, + SPCTSPEnv, + TSPEnv, + FLPEnv, + MCPEnv, +) + + +def get_env(name, size): + if name == "tsp": + env = TSPEnv(generator_params=dict(num_loc=size)) + elif name == "cvrp": + env = CVRPEnv(generator_params=dict(num_loc=size)) + elif name == "cvrptw": + env = CVRPTWEnv(generator_params=dict(num_loc=size)) + elif name == "sdvrp": + env = SDVRPEnv(generator_params=dict(num_loc=size)) + elif name == "pdp": + env = PDPEnv(generator_params=dict(num_loc=size)) + elif name == "op": + env = OPEnv(generator_params=dict(num_loc=size)) + elif name == "mtsp": + env = MTSPEnv(generator_params=dict(num_loc=size)) + elif name == "pctsp": + env = PCTSPEnv(generator_params=dict(num_loc=size)) + elif name == "spctsp": + env = SPCTSPEnv(generator_params=dict(num_loc=size)) + elif name == "dpp": + env = DPPEnv() + elif name == "mdpp": + env = MDPPEnv() + elif name == "smtwtp": + env = SMTWTPEnv() + elif name == "pdp_ruin_repair": + env = PDPRuinRepairEnv() + elif name == "mcp": + env = MCPEnv() + elif name == "flp": + env = FLPEnv() + else: + raise ValueError(f"Unknown env_name: {name}") + + return env.transform() + + +def generate_env_data(env, size, batch_size): + env = get_env(env, size) + dataset = env.dataset([batch_size]) + + dataloader = DataLoader( + 
dataset, + batch_size=batch_size, + shuffle=False, + num_workers=0, + collate_fn=dataset.collate_fn, + ) + + return env, next(iter(dataloader)) diff --git a/rl4co/utils/trainer.py b/rl4co/utils/trainer.py new file mode 100644 index 00000000..0ad10fa1 --- /dev/null +++ b/rl4co/utils/trainer.py @@ -0,0 +1,152 @@ +from typing import Iterable, List, Optional, Union + +import lightning.pytorch as pl +import torch + +from lightning import Callback, Trainer +from lightning.fabric.accelerators.cuda import num_cuda_devices +from lightning.pytorch.accelerators import Accelerator +from lightning.pytorch.core.datamodule import LightningDataModule +from lightning.pytorch.loggers import Logger +from lightning.pytorch.strategies import DDPStrategy, Strategy +from lightning.pytorch.utilities.types import EVAL_DATALOADERS, TRAIN_DATALOADERS + +from rl4co import utils + +log = utils.get_pylogger(__name__) + + +class RL4COTrainer(Trainer): + """Wrapper around Lightning Trainer, with some RL4CO magic for efficient training. + + Note: + The most important hyperparameter to use is `reload_dataloaders_every_n_epochs`. + This allows for datasets to be re-created on the run and distributed by Lightning across + devices on each epoch. Setting to a value different than 1 may lead to overfitting to a + specific (such as the initial) data distribution. + + Args: + accelerator: hardware accelerator to use. + callbacks: list of callbacks. + logger: logger (or iterable collection of loggers) for experiment tracking. + min_epochs: minimum number of training epochs. + max_epochs: maximum number of training epochs. + strategy: training strategy to use (if any), such as Distributed Data Parallel (DDP). + devices: number of devices to train on (int) or which GPUs to train on (list or str) applied per node. + gradient_clip_val: 0 means don't clip. Defaults to 1.0 for stability. + precision: allows for mixed precision training. Can be specified as a string (e.g., '16'). 
+ This also allows to use `FlashAttention` by default. + disable_profiling_executor: Disable JIT profiling executor. This reduces memory and increases speed. + auto_configure_ddp: Automatically configure DDP strategy if multiple GPUs are available. + reload_dataloaders_every_n_epochs: Set to a value different than 1 to reload dataloaders every n epochs. + matmul_precision: Set matmul precision for faster inference https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision + **kwargs: Additional keyword arguments passed to the Lightning Trainer. See :class:`lightning.pytorch.trainer.Trainer` for details. + """ + + def __init__( + self, + accelerator: Union[str, Accelerator] = "auto", + callbacks: Optional[List[Callback]] = None, + logger: Optional[Union[Logger, Iterable[Logger]]] = None, + min_epochs: Optional[int] = None, + max_epochs: Optional[int] = None, + strategy: Union[str, Strategy] = "auto", + devices: Union[List[int], str, int] = "auto", + gradient_clip_val: Union[int, float] = 1.0, + precision: Union[str, int] = "16-mixed", + reload_dataloaders_every_n_epochs: int = 1, + disable_profiling_executor: bool = True, + auto_configure_ddp: bool = True, + matmul_precision: Union[str, int] = "medium", + **kwargs, + ): + # Disable JIT profiling executor. This reduces memory and increases speed. 
+ # Reference: https://github.com/HazyResearch/safari/blob/111d2726e7e2b8d57726b7a8b932ad8a4b2ad660/train.py#LL124-L129C17 + if disable_profiling_executor: + try: + torch._C._jit_set_profiling_executor(False) + torch._C._jit_set_profiling_mode(False) + except AttributeError: + pass + + # Configure DDP automatically if multiple GPUs are available + if auto_configure_ddp and strategy == "auto": + if devices == "auto": + n_devices = num_cuda_devices() + elif isinstance(devices, Iterable): + n_devices = len(devices) + else: + n_devices = devices + if n_devices > 1: + log.info( + "Configuring DDP strategy automatically with {} GPUs".format( + n_devices + ) + ) + strategy = DDPStrategy( + find_unused_parameters=True, # We set to True due to RL envs + gradient_as_bucket_view=True, # https://pytorch-lightning.readthedocs.io/en/stable/advanced/advanced_gpu.html#ddp-optimizations + ) + + # Set matmul precision for faster inference https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html#torch.set_float32_matmul_precision + if matmul_precision is not None: + torch.set_float32_matmul_precision(matmul_precision) + + # Check if gradient_clip_val is set to None + if gradient_clip_val is None: + log.warning( + "gradient_clip_val is set to None. This may lead to unstable training." + ) + + # We should reload dataloaders every epoch for RL training + if reload_dataloaders_every_n_epochs != 1: + log.warning( + "We reload dataloaders every epoch for RL training. Setting reload_dataloaders_every_n_epochs to a value different than 1 " + + "may lead to unexpected behavior since the initial conditions will be the same for `n_epochs` epochs." 
+ ) + + # Main call to `Trainer` superclass + super().__init__( + accelerator=accelerator, + callbacks=callbacks, + logger=logger, + min_epochs=min_epochs, + max_epochs=max_epochs, + strategy=strategy, + gradient_clip_val=gradient_clip_val, + devices=devices, + precision=precision, + reload_dataloaders_every_n_epochs=reload_dataloaders_every_n_epochs, + **kwargs, + ) + + def fit( + self, + model: "pl.LightningModule", + train_dataloaders: Optional[Union[TRAIN_DATALOADERS, LightningDataModule]] = None, + val_dataloaders: Optional[EVAL_DATALOADERS] = None, + datamodule: Optional[LightningDataModule] = None, + ckpt_path: Optional[str] = None, + ) -> None: + """ + We override the `fit` method to automatically apply and handle RL4CO magic + to 'self.automatic_optimization = False' models, such as PPO + + It behaves exactly like the original `fit` method, but with the following changes: + - if the given model is 'self.automatic_optimization = False', we override 'gradient_clip_val' as None + """ + + if not model.automatic_optimization: + if self.gradient_clip_val is not None: + log.warning( + "Overriding gradient_clip_val to None for 'automatic_optimization=False' models" + ) + self.gradient_clip_val = None + + super().fit( + model=model, + train_dataloaders=train_dataloaders, + val_dataloaders=val_dataloaders, + datamodule=datamodule, + ckpt_path=ckpt_path, + ) diff --git a/rl4co/utils/utils.py b/rl4co/utils/utils.py new file mode 100644 index 00000000..41ac59f4 --- /dev/null +++ b/rl4co/utils/utils.py @@ -0,0 +1,285 @@ +import importlib +import platform +import sys +import warnings + +from importlib.util import find_spec +from typing import Callable, List + +import hydra + +from lightning import Callback +from lightning.pytorch.loggers.logger import Logger + +# Import the necessary PyTorch Lightning component +from lightning.pytorch.trainer.connectors.accelerator_connector import ( + _AcceleratorConnector, +) +from lightning.pytorch.utilities.rank_zero import 
rank_zero_only +from omegaconf import DictConfig, OmegaConf + +from rl4co.utils import pylogger, rich_utils + +log = pylogger.get_pylogger(__name__) + + +def task_wrapper(task_func: Callable) -> Callable: + """Optional decorator that wraps the task function in extra utilities. + + Makes multirun more resistant to failure. + + Utilities: + - Calling the `utils.extras()` before the task is started + - Calling the `utils.close_loggers()` after the task is finished or failed + - Logging the exception if occurs + - Logging the output dir + """ + + def wrap(cfg: DictConfig): + # execute the task + try: + metric_dict, object_dict = task_func(cfg=cfg) + + # things to do if exception occurs + except Exception as ex: + # save exception to `.log` file + log.exception("") + + # some hyperparameter combinations might be invalid or cause out-of-memory errors + # so when using hparam search plugins like Optuna, you might want to disable + # raising the below exception to avoid multirun failure + raise ex + + # things to always do after either success or exception + finally: + # display output dir path in terminal + log.info(f"Output dir: {cfg.paths.output_dir}") + + # close loggers (even if exception occurs so multirun won't fail) + close_loggers() + + return metric_dict, object_dict + + return wrap + + +def extras(cfg: DictConfig) -> None: + """Applies optional utilities before the task is started. + + Utilities: + - Ignoring python warnings + - Setting tags from command line + - Rich config printing + """ + + # return if no `extras` config + if not cfg.get("extras"): + log.warning("Extras config not found! ") + return + + # disable python warnings + if cfg.extras.get("ignore_warnings"): + log.info("Disabling python warnings! ") + warnings.filterwarnings("ignore") + + # prompt user to input tags from command line if none are provided in the config + if cfg.extras.get("enforce_tags"): + log.info("Enforcing tags! 
") + rich_utils.enforce_tags(cfg, save_to_file=True) + + # pretty print config tree using Rich library + if cfg.extras.get("print_config"): + log.info("Printing config tree with Rich! ") + rich_utils.print_config_tree(cfg, resolve=True, save_to_file=True) + + +def instantiate_callbacks(callbacks_cfg: DictConfig) -> List[Callback]: + """Instantiates callbacks from config.""" + callbacks: List[Callback] = [] + + if not callbacks_cfg: + log.warning("No callback configs found! Skipping..") + return callbacks + + if not isinstance(callbacks_cfg, DictConfig): + raise TypeError("Callbacks config must be a DictConfig!") + + for _, cb_conf in callbacks_cfg.items(): + if isinstance(cb_conf, DictConfig) and "_target_" in cb_conf: + log.info(f"Instantiating callback <{cb_conf._target_}>") + callbacks.append(hydra.utils.instantiate(cb_conf)) + + return callbacks + + +def instantiate_loggers(logger_cfg: DictConfig) -> List[Logger]: + """Instantiates loggers from config.""" + logger: List[Logger] = [] + + if not logger_cfg: + log.warning("No logger configs found! Skipping...") + return logger + + if not isinstance(logger_cfg, DictConfig): + raise TypeError("Logger config must be a DictConfig!") + + for _, lg_conf in logger_cfg.items(): + if isinstance(lg_conf, DictConfig) and "_target_" in lg_conf: + log.info(f"Instantiating logger <{lg_conf._target_}>") + logger.append(hydra.utils.instantiate(lg_conf)) + + return logger + + +@rank_zero_only +def log_hyperparameters(object_dict: dict) -> None: + """Controls which config parts are saved by lightning loggers. + + Additionally saves: + - Number of model parameters + """ + + hparams = {} + + cfg = OmegaConf.to_container(object_dict["cfg"]) + model = object_dict["model"] + trainer = object_dict["trainer"] + + if not trainer.logger: + log.warning("Logger not found! 
Skipping hyperparameter logging...") + return + + hparams["model"] = cfg["model"] + + # save number of model parameters + hparams["model/params/total"] = sum(p.numel() for p in model.parameters()) + hparams["model/params/trainable"] = sum( + p.numel() for p in model.parameters() if p.requires_grad + ) + hparams["model/params/non_trainable"] = sum( + p.numel() for p in model.parameters() if not p.requires_grad + ) + + ## Note: we do not use the data config, since it is dealt with in the model + ## which is a `LightningModule` + # hparams["data"] = cfg["data"] + hparams["trainer"] = cfg["trainer"] + + hparams["callbacks"] = cfg.get("callbacks") + hparams["extras"] = cfg.get("extras") + + hparams["task_name"] = cfg.get("task_name") + hparams["tags"] = cfg.get("tags") + hparams["ckpt_path"] = cfg.get("ckpt_path") + hparams["seed"] = cfg.get("seed") + + # send hparams to all loggers + for logger in trainer.loggers: + logger.log_hyperparams(hparams) + + +def get_metric_value(metric_dict: dict, metric_name: str) -> float: + """Safely retrieves value of the metric logged in LightningModule.""" + + if not metric_name: + log.info("Metric name is None! Skipping metric value retrieval...") + return None + + if metric_name not in metric_dict: + raise Exception( + f"Metric value not found! \n" + "Make sure metric name logged in LightningModule is correct!\n" + "Make sure `optimized_metric` name in `hparams_search` config is correct!" + ) + + metric_value = metric_dict[metric_name].item() + log.info(f"Retrieved metric value! 
<{metric_name}={metric_value}>") + + return metric_value + + +def close_loggers() -> None: + """Makes sure all loggers closed properly (prevents logging failure during multirun).""" + + log.info("Closing loggers...") + + if find_spec("wandb"): # if wandb is installed + import wandb + + if wandb.run: + log.info("Closing wandb!") + wandb.finish() + + +@rank_zero_only +def save_file(path: str, content: str) -> None: + """Save file in rank zero mode (only on one process in multi-GPU setup).""" + with open(path, "w+") as file: + file.write(content) + + +def merge_with_defaults(_config=None, **defaults) -> dict: + """Merge configuration with default values. + + This function merges a provided configuration dictionary with default values. + If no configuration is provided (`_config` is None), it returns the default values. + If a dictionary is provided, it updates the defaults dictionary with the values from the provided dictionary. + Otherwise, it sets all keys in the defaults dictionary to `_config`. + + Args: + _config: Configuration to merge. Defaults to None. + **defaults: Default values to merge with the configuration. + + Returns: + dict: Merged configuration with default values. + """ + if _config is None: + return defaults + elif isinstance(_config, (DictConfig, dict)): + defaults.update(dict(**_config)) # type: ignore + return defaults + else: + return {key: _config for key in defaults.keys()} + + +def show_versions(): + """ + This function prints version information that is useful when filing bug + reports. 
Inspired by https://github.com/PyVRP/PyVRP + """ + + modules = { + "rl4co": "rl4co", + "torch": "torch", + "lightning": "pytorch_lightning", # Updated module name if necessary + "torchrl": "torchrl", + "tensordict": "tensordict", + "numpy": "numpy", + "pytorch_geometric": "torch_geometric", + "hydra-core": "hydra", + "omegaconf": "omegaconf", + "matplotlib": "matplotlib", + } + + # Find the longest module name for formatting + longest_name = max(len(name) for name in modules.keys()) + + print("INSTALLED VERSIONS") + print("-" * (longest_name + 20)) + # modules + for name, module in modules.items(): + try: + imported_module = importlib.import_module(module) + version = imported_module.__version__ + except ImportError: + version = "Not installed" + print(f"{name.rjust(longest_name)} : {version}") + # platform information + print(f'{"Python".rjust(longest_name)} : {sys.version.split()[0]}') + print(f'{"Platform".rjust(longest_name)} : {platform.platform()}') + try: + lightning_auto_device = _AcceleratorConnector()._choose_auto_accelerator(None) + except Exception: + lightning_auto_device = _AcceleratorConnector()._choose_auto_accelerator() + # lightning hardware accelerators + print(f'{"Lightning device".rjust(longest_name)} : {lightning_auto_device}') diff --git a/search/search_index.json b/search/search_index.json new file mode 100644 index 00000000..20ae95ff --- /dev/null +++ b/search/search_index.json @@ -0,0 +1 @@ +{"config":{"lang":["en"],"separator":"[\\s\\-]+","pipeline":["stopWordFilter"]},"docs":[{"location":"","title":"Home","text":"Loading...

An extensive Reinforcement Learning (RL) for Combinatorial Optimization (CO) benchmark. Our goal is to provide a unified framework for RL-based CO algorithms, and to facilitate reproducible research in this field, decoupling the science from the engineering.

RL4CO is built upon:

  • TorchRL: official PyTorch framework for RL algorithms and vectorized environments on GPUs
  • TensorDict: a library to easily handle heterogeneous data such as states, actions and rewards
  • PyTorch Lightning: a lightweight PyTorch wrapper for high-performance AI research
  • Hydra: a framework for elegantly configuring complex applications

We offer flexible and efficient implementations of the following policies:

  • Constructive: learn to construct a solution from scratch
    • Autoregressive (AR): construct solutions one step at a time via a decoder
    • NonAutoregressive (NAR): learn to predict a heuristic, such as a heatmap, to then construct a solution
  • Improvement: learn to improve a pre-existing solution

We provide several utilities and modularization. For example, we modularize reusable components such as environment embeddings that can easily be swapped to solve new problems.

"},{"location":"#getting-started","title":"Getting started","text":"

RL4CO is now available for installation on pip!

pip install rl4co\n

To get started, we recommend checking out our quickstart notebook or the minimalistic example below.

"},{"location":"#install-from-source","title":"Install from source","text":"

This command installs the bleeding edge main version, useful for staying up-to-date with the latest developments - for instance, if a bug has been fixed since the last official release but a new release hasn\u2019t been rolled out yet:

pip install -U git+https://github.com/ai4co/rl4co.git\n
"},{"location":"#local-install-and-development","title":"Local install and development","text":"

If you want to develop RL4CO, we recommend installing it locally with pip in editable mode:

git clone https://github.com/ai4co/rl4co && cd rl4co\npip install -e .\n

We recommend using a virtual environment such as conda to install rl4co locally.

"},{"location":"#usage","title":"Usage","text":"

Train model with default configuration (AM on TSP environment):

python run.py\n

Tip

You may check out this notebook to get started with Hydra!

Change experiment settings Train model with chosen experiment configuration from [configs/experiment/](configs/experiment/)
python run.py experiment=routing/am env=tsp env.num_loc=50 model.optimizer_kwargs.lr=2e-4\n
Here you may change the environment, e.g. with `env=cvrp` by command line or by modifying the corresponding experiment e.g. [configs/experiment/routing/am.yaml](configs/experiment/routing/am.yaml). Disable logging
python run.py experiment=routing/am logger=none '~callbacks.learning_rate_monitor'\n
Note that `~` is used to disable a callback that would need a logger. Create a sweep over hyperparameters (-m for multirun)
python run.py -m experiment=routing/am model.optimizer_kwargs.lr=1e-3,1e-4,1e-5\n
"},{"location":"#minimalistic-example","title":"Minimalistic Example","text":"

Here is a minimalistic example that trains an Attention Model policy with POMO on TSP in fewer than 30 lines of code:

from rl4co.envs.routing import TSPEnv, TSPGenerator\nfrom rl4co.models import AttentionModelPolicy, POMO\nfrom rl4co.utils import RL4COTrainer\n\n# Instantiate generator and environment\ngenerator = TSPGenerator(num_loc=50, loc_distribution=\"uniform\")\nenv = TSPEnv(generator)\n\n# Create policy and RL model\npolicy = AttentionModelPolicy(env_name=env.name, num_encoder_layers=6)\nmodel = POMO(env, policy, batch_size=64, optimizer_kwargs={\"lr\": 1e-4})\n\n# Instantiate Trainer and fit\ntrainer = RL4COTrainer(max_epochs=10, accelerator=\"gpu\", precision=\"16-mixed\")\ntrainer.fit(model)\n

Other examples can be found on our documentation!

"},{"location":"#testing","title":"Testing","text":"

Run tests with pytest from the root directory:

pytest tests\n
"},{"location":"#known-bugs","title":"Known Bugs","text":""},{"location":"#bugs-installing-pytorch-geometric-pyg","title":"Bugs installing PyTorch Geometric (PyG)","text":"

Installing PyG via Conda seems to update Torch itself. We have found that this update introduces some bugs with torchrl. At this moment, we recommend installing PyG with Pip:

pip install torch_geometric\n

"},{"location":"#contributing","title":"Contributing","text":"

Have a suggestion, request, or found a bug? Feel free to open an issue or submit a pull request. If you would like to contribute, please check out our contribution guidelines here. We welcome and look forward to all contributions to RL4CO!

We are also on Slack if you have any questions or would like to discuss RL4CO with us. We are open to collaborations and would love to hear from you \ud83d\ude80

"},{"location":"#contributors","title":"Contributors","text":""},{"location":"#citation","title":"Citation","text":"

If you find RL4CO valuable for your research or applied projects:

@article{berto2024rl4co,\n    title={{RL4CO: an Extensive Reinforcement Learning for Combinatorial Optimization Benchmark}},\n    author={Federico Berto and Chuanbo Hua and Junyoung Park and Laurin Luttmann and Yining Ma and Fanchen Bu and Jiarui Wang and Haoran Ye and Minsu Kim and Sanghyeok Choi and Nayeli Gast Zepeda and Andr\\'e Hottung and Jianan Zhou and Jieyi Bi and Yu Hu and Fei Liu and Hyeonah Kim and Jiwoo Son and Haeyeon Kim and Davide Angioni and Wouter Kool and Zhiguang Cao and Jie Zhang and Kijung Shin and Cathy Wu and Sungsoo Ahn and Guojie Song and Changhyun Kwon and Lin Xie and Jinkyoo Park},\n    year={2024},\n    journal={arXiv preprint arXiv:2306.17100},\n    note={\\url{https://github.com/ai4co/rl4co}}\n}\n

Note that a previous version of RL4CO has been accepted as an oral presentation at the NeurIPS 2023 GLFrontiers Workshop. Since then, the library has greatly evolved and improved!

"},{"location":"#join-us","title":"Join us","text":"

We invite you to join our AI4CO community, an open research group in Artificial Intelligence (AI) for Combinatorial Optimization (CO)!

"},{"location":"README_backup/","title":"README backup","text":"

Documentation | Getting Started | Usage | Contributing | Paper | Join Us

An extensive Reinforcement Learning (RL) for Combinatorial Optimization (CO) benchmark. Our goal is to provide a unified framework for RL-based CO algorithms, and to facilitate reproducible research in this field, decoupling the science from the engineering.

RL4CO is built upon:

  • TorchRL: official PyTorch framework for RL algorithms and vectorized environments on GPUs
  • TensorDict: a library to easily handle heterogeneous data such as states, actions and rewards
  • PyTorch Lightning: a lightweight PyTorch wrapper for high-performance AI research
  • Hydra: a framework for elegantly configuring complex applications

We offer flexible and efficient implementations of the following policies:

  • Constructive: learn to construct a solution from scratch
    • Autoregressive (AR): construct solutions one step at a time via a decoder
    • NonAutoregressive (NAR): learn to predict a heuristic, such as a heatmap, to then construct a solution
  • Improvement: learn to improve a pre-existing solution

We provide several utilities and modularization. For example, we modularize reusable components such as environment embeddings that can easily be swapped to solve new problems.

"},{"location":"README_backup/#getting-started","title":"Getting started","text":"

RL4CO is now available for installation on pip!

pip install rl4co\n

To get started, we recommend checking out our quickstart notebook or the minimalistic example below.

"},{"location":"README_backup/#install-from-source","title":"Install from source","text":"

This command installs the bleeding edge main version, useful for staying up-to-date with the latest developments - for instance, if a bug has been fixed since the last official release but a new release hasn\u2019t been rolled out yet:

pip install -U git+https://github.com/ai4co/rl4co.git\n
"},{"location":"README_backup/#local-install-and-development","title":"Local install and development","text":"

If you want to develop RL4CO, we recommend installing it locally with pip in editable mode:

git clone https://github.com/ai4co/rl4co && cd rl4co\npip install -e .\n

We recommend using a virtual environment such as conda to install rl4co locally.

"},{"location":"README_backup/#usage","title":"Usage","text":"

Train model with default configuration (AM on TSP environment):

python run.py\n

Tip

You may check out this notebook to get started with Hydra!

Change experiment settings Train model with chosen experiment configuration from [configs/experiment/](configs/experiment/)
python run.py experiment=routing/am env=tsp env.num_loc=50 model.optimizer_kwargs.lr=2e-4\n
Here you may change the environment, e.g. with `env=cvrp` by command line or by modifying the corresponding experiment e.g. [configs/experiment/routing/am.yaml](configs/experiment/routing/am.yaml). Disable logging
python run.py experiment=routing/am logger=none '~callbacks.learning_rate_monitor'\n
Note that `~` is used to disable a callback that would need a logger. Create a sweep over hyperparameters (-m for multirun)
python run.py -m experiment=routing/am model.optimizer_kwargs.lr=1e-3,1e-4,1e-5\n
"},{"location":"README_backup/#minimalistic-example","title":"Minimalistic Example","text":"

Here is a minimalistic example that trains an Attention Model policy with POMO on TSP in fewer than 30 lines of code:

from rl4co.envs.routing import TSPEnv, TSPGenerator\nfrom rl4co.models import AttentionModelPolicy, POMO\nfrom rl4co.utils import RL4COTrainer\n\n# Instantiate generator and environment\ngenerator = TSPGenerator(num_loc=50, loc_distribution=\"uniform\")\nenv = TSPEnv(generator)\n\n# Create policy and RL model\npolicy = AttentionModelPolicy(env_name=env.name, num_encoder_layers=6)\nmodel = POMO(env, policy, batch_size=64, optimizer_kwargs={\"lr\": 1e-4})\n\n# Instantiate Trainer and fit\ntrainer = RL4COTrainer(max_epochs=10, accelerator=\"gpu\", precision=\"16-mixed\")\ntrainer.fit(model)\n

Other examples can be found on our documentation!

"},{"location":"README_backup/#testing","title":"Testing","text":"

Run tests with pytest from the root directory:

pytest tests\n
"},{"location":"README_backup/#known-bugs","title":"Known Bugs","text":""},{"location":"README_backup/#bugs-installing-pytorch-geometric-pyg","title":"Bugs installing PyTorch Geometric (PyG)","text":"

Installing PyG via Conda seems to update Torch itself. We have found that this update introduces some bugs with torchrl. At this moment, we recommend installing PyG with Pip:

pip install torch_geometric\n

"},{"location":"README_backup/#contributing","title":"Contributing","text":"

Have a suggestion, request, or found a bug? Feel free to open an issue or submit a pull request. If you would like to contribute, please check out our contribution guidelines here. We welcome and look forward to all contributions to RL4CO!

We are also on Slack if you have any questions or would like to discuss RL4CO with us. We are open to collaborations and would love to hear from you \ud83d\ude80

"},{"location":"README_backup/#contributors","title":"Contributors","text":""},{"location":"README_backup/#citation","title":"Citation","text":"

If you find RL4CO valuable for your research or applied projects:

@article{berto2024rl4co,\n    title={{RL4CO: an Extensive Reinforcement Learning for Combinatorial Optimization Benchmark}},\n    author={Federico Berto and Chuanbo Hua and Junyoung Park and Laurin Luttmann and Yining Ma and Fanchen Bu and Jiarui Wang and Haoran Ye and Minsu Kim and Sanghyeok Choi and Nayeli Gast Zepeda and Andr\\'e Hottung and Jianan Zhou and Jieyi Bi and Yu Hu and Fei Liu and Hyeonah Kim and Jiwoo Son and Haeyeon Kim and Davide Angioni and Wouter Kool and Zhiguang Cao and Jie Zhang and Kijung Shin and Cathy Wu and Sungsoo Ahn and Guojie Song and Changhyun Kwon and Lin Xie and Jinkyoo Park},\n    year={2024},\n    journal={arXiv preprint arXiv:2306.17100},\n    note={\\url{https://github.com/ai4co/rl4co}}\n}\n

Note that a previous version of RL4CO has been accepted as an oral presentation at the NeurIPS 2023 GLFrontiers Workshop. Since then, the library has greatly evolved and improved!

"},{"location":"README_backup/#join-us","title":"Join us","text":"

We invite you to join our AI4CO community, an open research group in Artificial Intelligence (AI) for Combinatorial Optimization (CO)!

"},{"location":"docs/","title":"RL4CO Documentation","text":"

We use MkDocs to generate the documentation with the MkDocs Material theme.

"},{"location":"docs/#development","title":"Development","text":"

From the root directory:

  1. Install RL4CO locally
pip install -e \".[dev,graph,routing,docs]\"\n

Note that docs is the optional extra that installs the documentation requirements.

  2. To build and serve the documentation locally, run:
mkdocs serve\n
"},{"location":"docs/#hooks","title":"Hooks","text":"

We use hooks.py for additional modifications. For instance, MkDocs cannot detect files that are not in the same directory as an __init__.py (as described here), so our script automatically creates and deletes such files.

"},{"location":"docs/content/api/data/","title":"Data","text":""},{"location":"docs/content/api/data/#datasets","title":"Datasets","text":"

Classes:

  • FastTdDataset \u2013

    Note:

  • TensorDictDataset \u2013

    Dataset compatible with TensorDicts with low CPU usage.

  • ExtraKeyDataset \u2013

    Dataset that includes an extra key to add to the data dict.

  • TensorDictDatasetFastGeneration \u2013

    Dataset compatible with TensorDicts.

"},{"location":"docs/content/api/data/#data.dataset.FastTdDataset","title":"FastTdDataset","text":"
FastTdDataset(td: TensorDict)\n

Bases: Dataset

Note

Check out the issue on tensordict for more details: https://github.com/pytorch-labs/tensordict/issues/374.

Methods:

  • collate_fn \u2013

    Collate function compatible with TensorDicts that reassembles a list of dicts.

Source code in rl4co/data/dataset.py
def __init__(self, td: TensorDict):\n    self.data_len = td.batch_size[0]\n    self.data = td\n
"},{"location":"docs/content/api/data/#data.dataset.FastTdDataset.collate_fn","title":"collate_fn staticmethod","text":"
collate_fn(batch: Union[dict, TensorDict])\n

Collate function compatible with TensorDicts that reassembles a list of dicts.

Source code in rl4co/data/dataset.py
@staticmethod\ndef collate_fn(batch: Union[dict, TensorDict]):\n    \"\"\"Collate function compatible with TensorDicts that reassembles a list of dicts.\"\"\"\n    return batch\n
"},{"location":"docs/content/api/data/#data.dataset.TensorDictDataset","title":"TensorDictDataset","text":"
TensorDictDataset(td: TensorDict)\n

Bases: Dataset

Dataset compatible with TensorDicts with low CPU usage. Fast loading but somewhat slow instantiation due to list comprehension since we \"disassemble\" the TensorDict into a list of dicts.

Note

Check out the issue on tensordict for more details: https://github.com/pytorch-labs/tensordict/issues/374.

Methods:

  • collate_fn \u2013

    Collate function compatible with TensorDicts that reassembles a list of dicts.

Source code in rl4co/data/dataset.py
def __init__(self, td: TensorDict):\n    self.data_len = td.batch_size[0]\n    self.data = [\n        {key: value[i] for key, value in td.items()} for i in range(self.data_len)\n    ]\n
"},{"location":"docs/content/api/data/#data.dataset.TensorDictDataset.collate_fn","title":"collate_fn staticmethod","text":"
collate_fn(batch: Union[dict, TensorDict])\n

Collate function compatible with TensorDicts that reassembles a list of dicts.

Source code in rl4co/data/dataset.py
@staticmethod\ndef collate_fn(batch: Union[dict, TensorDict]):\n    \"\"\"Collate function compatible with TensorDicts that reassembles a list of dicts.\"\"\"\n    return TensorDict(\n        {key: torch.stack([b[key] for b in batch]) for key in batch[0].keys()},\n        batch_size=torch.Size([len(batch)]),\n        **td_kwargs,\n    )\n
"},{"location":"docs/content/api/data/#data.dataset.ExtraKeyDataset","title":"ExtraKeyDataset","text":"
ExtraKeyDataset(\n    dataset: TensorDictDataset,\n    extra: Tensor,\n    key_name=\"extra\",\n)\n

Bases: TensorDictDataset

Dataset that includes an extra key to add to the data dict. This is useful for adding a REINFORCE baseline reward to the data dict. Note that this is faster to instantiate than using list comprehension.

Source code in rl4co/data/dataset.py
def __init__(self, dataset: TensorDictDataset, extra: torch.Tensor, key_name=\"extra\"):\n    self.data_len = len(dataset)\n    assert self.data_len == len(extra), \"Data and extra must be same length\"\n    self.data = dataset.data\n    self.extra = extra\n    self.key_name = key_name\n
"},{"location":"docs/content/api/data/#data.dataset.TensorDictDatasetFastGeneration","title":"TensorDictDatasetFastGeneration","text":"
TensorDictDatasetFastGeneration(td: TensorDict)\n

Bases: Dataset

Dataset compatible with TensorDicts. Similar performance in loading to list comprehension, but is faster in instantiation than TensorDictDatasetList (more than 10x faster).

Warning

Note that directly indexing TensorDicts may be faster in creating the dataset but uses > 3x more CPU. We generally recommend using TensorDictDatasetList.

Note

Check out the issue on tensordict for more details: https://github.com/pytorch-labs/tensordict/issues/374.

Methods:

  • collate_fn \u2013

    Equivalent to collating with lambda x: x

Source code in rl4co/data/dataset.py
def __init__(self, td: TensorDict):\n    self.data = td\n
"},{"location":"docs/content/api/data/#data.dataset.TensorDictDatasetFastGeneration.collate_fn","title":"collate_fn staticmethod","text":"
collate_fn(batch: Union[dict, TensorDict])\n

Equivalent to collating with lambda x: x

Source code in rl4co/data/dataset.py
@staticmethod\ndef collate_fn(batch: Union[dict, TensorDict]):\n    \"\"\"Equivalent to collating with `lambda x: x`\"\"\"\n    return batch\n
"},{"location":"docs/content/api/data/#data-generation","title":"Data Generation","text":"

Functions:

  • generate_env_data \u2013

    Generate data for a given environment type in the form of a dictionary

  • generate_mdpp_data \u2013

    Generate data for the mDPP problem.

  • generate_dataset \u2013

    We keep a similar structure as in Kool et al. 2019 but save and load the data as npz

  • generate_default_datasets \u2013

    Generate the default datasets used in the paper and save them to data_dir/problem

"},{"location":"docs/content/api/data/#data.generate_data.generate_env_data","title":"generate_env_data","text":"
generate_env_data(env_type, *args, **kwargs)\n

Generate data for a given environment type in the form of a dictionary

Source code in rl4co/data/generate_data.py
def generate_env_data(env_type, *args, **kwargs):\n    \"\"\"Generate data for a given environment type in the form of a dictionary\"\"\"\n    try:\n        # breakpoint()\n        # remove all None values from args\n        args = [arg for arg in args if arg is not None]\n\n        return getattr(sys.modules[__name__], f\"generate_{env_type}_data\")(\n            *args, **kwargs\n        )\n    except AttributeError:\n        raise NotImplementedError(f\"Environment type {env_type} not implemented\")\n
"},{"location":"docs/content/api/data/#data.generate_data.generate_mdpp_data","title":"generate_mdpp_data","text":"
generate_mdpp_data(\n    dataset_size,\n    size=10,\n    num_probes_min=2,\n    num_probes_max=5,\n    num_keepout_min=1,\n    num_keepout_max=50,\n    lock_size=True,\n)\n

Generate data for the mDPP problem. If lock_size is True, then the size is fixed: when the size argument is not 10, generation is skipped and None is returned. This is because the RL environment is based on a real-world PCB (parametrized with data).

Source code in rl4co/data/generate_data.py
def generate_mdpp_data(\n    dataset_size,\n    size=10,\n    num_probes_min=2,\n    num_probes_max=5,\n    num_keepout_min=1,\n    num_keepout_max=50,\n    lock_size=True,\n):\n    \"\"\"Generate data for the nDPP problem.\n    If `lock_size` is True, then the size if fixed and we skip the `size` argument if it is not 10.\n    This is because the RL environment is based on a real-world PCB (parametrized with data)\n    \"\"\"\n    if lock_size and size != 10:\n        # log.info(\"Locking size to 10, skipping generate_mdpp_data with size {}\".format(size))\n        return None\n\n    bs = dataset_size  # bs = batch_size to generate data in batch\n    m = n = size\n    if isinstance(bs, int):\n        bs = [bs]\n\n    locs = np.stack(np.meshgrid(np.arange(m), np.arange(n)), axis=-1).reshape(-1, 2)\n    locs = locs / np.array([m, n], dtype=np.float32)\n    locs = np.expand_dims(locs, axis=0)\n    locs = np.repeat(locs, bs[0], axis=0)\n\n    available = np.ones((bs[0], m * n), dtype=bool)\n\n    probe = np.random.randint(0, high=m * n, size=(bs[0], 1))\n    np.put_along_axis(available, probe, False, axis=1)\n\n    num_probe = np.random.randint(num_probes_min, num_probes_max + 1, size=(bs[0], 1))\n    probes = np.zeros((bs[0], m * n), dtype=bool)\n    for i in range(bs[0]):\n        p = np.random.choice(m * n, num_probe[i], replace=False)\n        np.put_along_axis(available[i], p, False, axis=0)\n        np.put_along_axis(probes[i], p, True, axis=0)\n\n    num_keepout = np.random.randint(num_keepout_min, num_keepout_max + 1, size=(bs[0], 1))\n    for i in range(bs[0]):\n        k = np.random.choice(m * n, num_keepout[i], replace=False)\n        np.put_along_axis(available[i], k, False, axis=0)\n\n    return {\n        \"locs\": locs.astype(np.float32),\n        \"probe\": probes.astype(bool),\n        \"action_mask\": available.astype(bool),\n    }\n
"},{"location":"docs/content/api/data/#data.generate_data.generate_dataset","title":"generate_dataset","text":"
generate_dataset(\n    filename: Union[str, List[str]] = None,\n    data_dir: str = \"data\",\n    name: str = None,\n    problem: Union[str, List[str]] = \"all\",\n    data_distribution: str = \"all\",\n    dataset_size: int = 10000,\n    graph_sizes: Union[int, List[int]] = [20, 50, 100],\n    overwrite: bool = False,\n    seed: int = 1234,\n    disable_warning: bool = True,\n    distributions_per_problem: Union[int, dict] = None,\n)\n

We keep a similar structure as in Kool et al. 2019 but save and load the data as npz. This is way faster and more memory efficient than pickle and also allows for easy transfer to TensorDict.

Parameters:

  • filename (Union[str, List[str]], default: None ) \u2013

    Filename to save the data to. If None, the data is saved to data_dir/problem/problem_graph_size_seed.npz. Defaults to None.

  • data_dir (str, default: 'data' ) \u2013

    Directory to save the data to. Defaults to \"data\".

  • name (str, default: None ) \u2013

    Name of the dataset. Defaults to None.

  • problem (Union[str, List[str]], default: 'all' ) \u2013

    Problem to generate data for. Defaults to \"all\".

  • data_distribution (str, default: 'all' ) \u2013

    Data distribution to generate data for. Defaults to \"all\".

  • dataset_size (int, default: 10000 ) \u2013

    Number of datasets to generate. Defaults to 10000.

  • graph_sizes (Union[int, List[int]], default: [20, 50, 100] ) \u2013

    Graph size to generate data for. Defaults to [20, 50, 100].

  • overwrite (bool, default: False ) \u2013

    Whether to overwrite existing files. Defaults to False.

  • seed (int, default: 1234 ) \u2013

    Random seed. Defaults to 1234.

  • disable_warning (bool, default: True ) \u2013

    Whether to disable warnings. Defaults to True.

  • distributions_per_problem (Union[int, dict], default: None ) \u2013

    Number of distributions to generate per problem. Defaults to None.

Source code in rl4co/data/generate_data.py
def generate_dataset(\n    filename: Union[str, List[str]] = None,\n    data_dir: str = \"data\",\n    name: str = None,\n    problem: Union[str, List[str]] = \"all\",\n    data_distribution: str = \"all\",\n    dataset_size: int = 10000,\n    graph_sizes: Union[int, List[int]] = [20, 50, 100],\n    overwrite: bool = False,\n    seed: int = 1234,\n    disable_warning: bool = True,\n    distributions_per_problem: Union[int, dict] = None,\n):\n    \"\"\"We keep a similar structure as in Kool et al. 2019 but save and load the data as npz\n    This is way faster and more memory efficient than pickle and also allows for easy transfer to TensorDict\n\n    Args:\n        filename: Filename to save the data to. If None, the data is saved to data_dir/problem/problem_graph_size_seed.npz. Defaults to None.\n        data_dir: Directory to save the data to. Defaults to \"data\".\n        name: Name of the dataset. Defaults to None.\n        problem: Problem to generate data for. Defaults to \"all\".\n        data_distribution: Data distribution to generate data for. Defaults to \"all\".\n        dataset_size: Number of datasets to generate. Defaults to 10000.\n        graph_sizes: Graph size to generate data for. Defaults to [20, 50, 100].\n        overwrite: Whether to overwrite existing files. Defaults to False.\n        seed: Random seed. Defaults to 1234.\n        disable_warning: Whether to disable warnings. Defaults to True.\n        distributions_per_problem: Number of distributions to generate per problem. 
Defaults to None.\n    \"\"\"\n\n    if isinstance(problem, list) and len(problem) == 1:\n        problem = problem[0]\n\n    graph_sizes = [graph_sizes] if isinstance(graph_sizes, int) else graph_sizes\n\n    if distributions_per_problem is None:\n        distributions_per_problem = DISTRIBUTIONS_PER_PROBLEM\n\n    if problem == \"all\":\n        problems = distributions_per_problem\n    else:\n        problems = {\n            problem: distributions_per_problem[problem]\n            if data_distribution == \"all\"\n            else [data_distribution]\n        }\n\n    # Support multiple filenames if necessary\n    filenames = [filename] if isinstance(filename, str) else filename\n    iter = 0\n\n    # Main loop for data generation. We loop over all problems, distributions and sizes\n    for problem, distributions in problems.items():\n        for distribution in distributions or [None]:\n            for graph_size in graph_sizes:\n                if filename is None:\n                    datadir = os.path.join(data_dir, problem)\n                    os.makedirs(datadir, exist_ok=True)\n                    fname = os.path.join(\n                        datadir,\n                        \"{}{}{}_{}_seed{}.npz\".format(\n                            problem,\n                            \"_{}\".format(distribution)\n                            if distribution is not None\n                            else \"\",\n                            graph_size,\n                            name,\n                            seed,\n                        ),\n                    )\n                else:\n                    try:\n                        fname = filenames[iter]\n                        # make directory if necessary\n                        os.makedirs(os.path.dirname(fname), exist_ok=True)\n                        iter += 1\n                    except Exception:\n                        raise ValueError(\n                            \"Number of filenames does 
not match number of problems\"\n                        )\n                    fname = check_extension(filename, extension=\".npz\")\n\n                if not overwrite and os.path.isfile(\n                    check_extension(fname, extension=\".npz\")\n                ):\n                    if not disable_warning:\n                        log.info(\n                            \"File {} already exists! Run with -f option to overwrite. Skipping...\".format(\n                                fname\n                            )\n                        )\n                    continue\n\n                # Set seed\n                np.random.seed(seed)\n\n                # Automatically generate dataset\n                dataset = generate_env_data(\n                    problem, dataset_size, graph_size, distribution\n                )\n\n                # A function can return None in case of an error or a skip\n                if dataset is not None:\n                    # Save to disk as dict\n                    log.info(\"Saving {} dataset to {}\".format(problem, fname))\n                    np.savez(fname, **dataset)\n
"},{"location":"docs/content/api/data/#data.generate_data.generate_default_datasets","title":"generate_default_datasets","text":"
generate_default_datasets(data_dir, generate_eda=False)\n

Generate the default datasets used in the paper and save them to data_dir/problem

Source code in rl4co/data/generate_data.py
def generate_default_datasets(data_dir, generate_eda=False):\n    \"\"\"Generate the default datasets used in the paper and save them to data_dir/problem\"\"\"\n    generate_dataset(data_dir=data_dir, name=\"val\", problem=\"all\", seed=4321)\n    generate_dataset(data_dir=data_dir, name=\"test\", problem=\"all\", seed=1234)\n\n    # By default, we skip the EDA datasets since they can easily be generated on the fly when needed\n    if generate_eda:\n        generate_dataset(\n            data_dir=data_dir,\n            name=\"test\",\n            problem=\"mdpp\",\n            seed=1234,\n            graph_sizes=[10],\n            dataset_size=100,\n        )  # EDA (mDPP)\n
"},{"location":"docs/content/api/data/#transforms","title":"Transforms","text":"

Classes:

  • StateAugmentation \u2013

    Augment state by N times via symmetric rotation/reflection transform

Functions:

  • dihedral_8_augmentation \u2013

    Augmentation (x8) for grid-based data (x, y) as done in POMO.

  • dihedral_8_augmentation_wrapper \u2013

    Wrapper for dihedral_8_augmentation. If reduce, only return the first 1/8 of the augmented data

  • symmetric_transform \u2013

    SR group transform with rotation and reflection

  • symmetric_augmentation \u2013

    Augment xy data by num_augment times via symmetric rotation transform and concatenate to original data

"},{"location":"docs/content/api/data/#data.transforms.StateAugmentation","title":"StateAugmentation","text":"
StateAugmentation(\n    num_augment: int = 8,\n    augment_fn: Union[str, callable] = \"symmetric\",\n    first_aug_identity: bool = True,\n    normalize: bool = False,\n    feats: list = None,\n)\n

Bases: object

Augment state by N times via symmetric rotation/reflection transform

Parameters:

  • num_augment (int, default: 8 ) \u2013

    number of augmentations

  • augment_fn (Union[str, callable], default: 'symmetric' ) \u2013

    augmentation function to use, e.g. 'symmetric' (default) or 'dihedral8', if callable, then use the function directly. If 'dihedral8', then num_augment must be 8

  • first_aug_identity (bool, default: True ) \u2013

    whether to augment the first data point too

  • normalize (bool, default: False ) \u2013

    whether to normalize the augmented data

  • feats (list, default: None ) \u2013

    list of features to augment

Source code in rl4co/data/transforms.py
def __init__(\n    self,\n    num_augment: int = 8,\n    augment_fn: Union[str, callable] = 'symmetric', \n    first_aug_identity: bool = True,\n    normalize: bool = False,\n    feats: list = None,\n):\n    self.augmentation = get_augment_function(augment_fn)\n    assert not (\n        self.augmentation == dihedral_8_augmentation_wrapper and num_augment != 8\n    ), \"When using the `dihedral8` augmentation function, then num_augment must be 8\"\n\n    if feats is None:\n        log.info(\"Features not passed, defaulting to 'locs'\")\n        self.feats = [\"locs\"]\n    else:\n        self.feats = feats\n    self.num_augment = num_augment\n    self.normalize = normalize\n    self.first_aug_identity = first_aug_identity\n
"},{"location":"docs/content/api/data/#data.transforms.dihedral_8_augmentation","title":"dihedral_8_augmentation","text":"
dihedral_8_augmentation(xy: Tensor) -> Tensor\n

Augmentation (x8) for grid-based data (x, y) as done in POMO. This is a Dihedral group of order 8 (rotations and reflections); see https://en.wikipedia.org/wiki/Examples_of_groups#dihedral_group_of_order_8

Parameters:

  • xy (Tensor) \u2013

    [batch, graph, 2] tensor of x and y coordinates

Source code in rl4co/data/transforms.py
def dihedral_8_augmentation(xy: Tensor) -> Tensor:\n    \"\"\"\n    Augmentation (x8) for grid-based data (x, y) as done in POMO.\n    This is a Dihedral group of order 8 (rotations and reflections)\n    https://en.wikipedia.org/wiki/Examples_of_groups#dihedral_group_of_order_8\n\n    Args:\n        xy: [batch, graph, 2] tensor of x and y coordinates\n    \"\"\"\n    # [batch, graph, 2]\n    x, y = xy.split(1, dim=2)\n    # augmnetations [batch, graph, 2]\n    z0 = torch.cat((x, y), dim=2)\n    z1 = torch.cat((1 - x, y), dim=2)\n    z2 = torch.cat((x, 1 - y), dim=2)\n    z3 = torch.cat((1 - x, 1 - y), dim=2)\n    z4 = torch.cat((y, x), dim=2)\n    z5 = torch.cat((1 - y, x), dim=2)\n    z6 = torch.cat((y, 1 - x), dim=2)\n    z7 = torch.cat((1 - y, 1 - x), dim=2)\n    # [batch*8, graph, 2]\n    aug_xy = torch.cat((z0, z1, z2, z3, z4, z5, z6, z7), dim=0)\n    return aug_xy\n
"},{"location":"docs/content/api/data/#data.transforms.dihedral_8_augmentation_wrapper","title":"dihedral_8_augmentation_wrapper","text":"
dihedral_8_augmentation_wrapper(\n    xy: Tensor, reduce: bool = True, *args, **kw\n) -> Tensor\n

Wrapper for dihedral_8_augmentation. If reduce, only return the first 1/8 of the augmented data since the augmentation augments the data 8 times.

Source code in rl4co/data/transforms.py
def dihedral_8_augmentation_wrapper(\n    xy: Tensor, reduce: bool = True, *args, **kw\n) -> Tensor:\n    \"\"\"Wrapper for dihedral_8_augmentation. If reduce, only return the first 1/8 of the augmented data\n    since the augmentation augments the data 8 times.\n    \"\"\"\n    xy = xy[: xy.shape[0] // 8, ...] if reduce else xy\n    return dihedral_8_augmentation(xy)\n
"},{"location":"docs/content/api/data/#data.transforms.symmetric_transform","title":"symmetric_transform","text":"
symmetric_transform(\n    x: Tensor, y: Tensor, phi: Tensor, offset: float = 0.5\n)\n

SR group transform with rotation and reflection. Like the one in SymNCO, but a vectorized version.

Parameters:

  • x (Tensor) \u2013

    [batch, graph, 1] tensor of x coordinates

  • y (Tensor) \u2013

    [batch, graph, 1] tensor of y coordinates

  • phi (Tensor) \u2013

    [batch, 1] tensor of random rotation angles

  • offset (float, default: 0.5 ) \u2013

    offset for x and y coordinates

Source code in rl4co/data/transforms.py
def symmetric_transform(x: Tensor, y: Tensor, phi: Tensor, offset: float = 0.5):\n    \"\"\"SR group transform with rotation and reflection\n    Like the one in SymNCO, but a vectorized version\n\n    Args:\n        x: [batch, graph, 1] tensor of x coordinates\n        y: [batch, graph, 1] tensor of y coordinates\n        phi: [batch, 1] tensor of random rotation angles\n        offset: offset for x and y coordinates\n    \"\"\"\n    x, y = x - offset, y - offset\n    # random rotation\n    x_prime = torch.cos(phi) * x - torch.sin(phi) * y\n    y_prime = torch.sin(phi) * x + torch.cos(phi) * y\n    # make random reflection if phi > 2*pi (i.e. 50% of the time)\n    mask = phi > 2 * math.pi\n    # vectorized random reflection: swap axes x and y if mask\n    xy = torch.cat((x_prime, y_prime), dim=-1)\n    xy = torch.where(mask, xy.flip(-1), xy)\n    return xy + offset\n
"},{"location":"docs/content/api/data/#data.transforms.symmetric_augmentation","title":"symmetric_augmentation","text":"
symmetric_augmentation(\n    xy: Tensor,\n    num_augment: int = 8,\n    first_augment: bool = False,\n)\n

Augment xy data by num_augment times via symmetric rotation transform and concatenate to original data

Parameters:

  • xy (Tensor) \u2013

    [batch, graph, 2] tensor of x and y coordinates

  • num_augment (int, default: 8 ) \u2013

    number of augmentations

  • first_augment (bool, default: False ) \u2013

    whether to augment the first data point

Source code in rl4co/data/transforms.py
def symmetric_augmentation(xy: Tensor, num_augment: int = 8, first_augment: bool = False):\n    \"\"\"Augment xy data by `num_augment` times via symmetric rotation transform and concatenate to original data\n\n    Args:\n        xy: [batch, graph, 2] tensor of x and y coordinates\n        num_augment: number of augmentations\n        first_augment: whether to augment the first data point\n    \"\"\"\n    # create random rotation angles (4*pi for reflection, 2*pi for rotation)\n    phi = torch.rand(xy.shape[0], device=xy.device) * 4 * math.pi\n\n    # set phi to 0 for first , i.e. no augmentation as in SymNCO\n    if not first_augment:\n        phi[: xy.shape[0] // num_augment] = 0.0\n    x, y = xy[..., [0]], xy[..., [1]]\n    return symmetric_transform(x, y, phi[:, None, None])\n
"},{"location":"docs/content/api/data/#utils","title":"Utils","text":"

Functions:

  • load_npz_to_tensordict \u2013

    Load a npz file directly into a TensorDict

  • save_tensordict_to_npz \u2013

    Save a TensorDict to a npz file

  • check_extension \u2013

    Check that filename has extension, otherwise add it

  • load_solomon_instance \u2013

    Load solomon instance from a file

  • load_solomon_solution \u2013

    Load solomon solution from a file

"},{"location":"docs/content/api/data/#data.utils.load_npz_to_tensordict","title":"load_npz_to_tensordict","text":"
load_npz_to_tensordict(filename)\n

Load a npz file directly into a TensorDict. We assume that the npz file contains a dictionary of numpy arrays. This is at least an order of magnitude faster than pickle.

Source code in rl4co/data/utils.py
def load_npz_to_tensordict(filename):\n    \"\"\"Load a npz file directly into a TensorDict\n    We assume that the npz file contains a dictionary of numpy arrays\n    This is at least an order of magnitude faster than pickle\n    \"\"\"\n    x = np.load(filename)\n    x_dict = dict(x)\n    batch_size = x_dict[list(x_dict.keys())[0]].shape[0]\n    return TensorDict(x_dict, batch_size=batch_size)\n
"},{"location":"docs/content/api/data/#data.utils.save_tensordict_to_npz","title":"save_tensordict_to_npz","text":"
save_tensordict_to_npz(\n    tensordict, filename, compress: bool = False\n)\n

Save a TensorDict to a npz file. We assume that the TensorDict contains a dictionary of tensors.

Source code in rl4co/data/utils.py
def save_tensordict_to_npz(tensordict, filename, compress: bool = False):\n    \"\"\"Save a TensorDict to a npz file\n    We assume that the TensorDict contains a dictionary of tensors\n    \"\"\"\n    x_dict = {k: v.numpy() for k, v in tensordict.items()}\n    if compress:\n        np.savez_compressed(filename, **x_dict)\n    else:\n        np.savez(filename, **x_dict)\n
"},{"location":"docs/content/api/data/#data.utils.check_extension","title":"check_extension","text":"
check_extension(filename, extension='.npz')\n

Check that filename has extension, otherwise add it

Source code in rl4co/data/utils.py
def check_extension(filename, extension=\".npz\"):\n    \"\"\"Check that filename has extension, otherwise add it\"\"\"\n    if os.path.splitext(filename)[1] != extension:\n        return filename + extension\n    return filename\n
"},{"location":"docs/content/api/data/#data.utils.load_solomon_instance","title":"load_solomon_instance","text":"
load_solomon_instance(name, path=None, edge_weights=False)\n

Load solomon instance from a file

Source code in rl4co/data/utils.py
def load_solomon_instance(name, path=None, edge_weights=False):\n    \"\"\"Load solomon instance from a file\"\"\"\n    import vrplib\n\n    if not path:\n        path = \"data/solomon/instances/\"\n        path = os.path.join(ROOT_PATH, path)\n    if not os.path.isdir(path):\n        os.makedirs(path)\n    file_path = f\"{path}{name}.txt\"\n    if not os.path.isfile(file_path):\n        vrplib.download_instance(name=name, path=path)\n    return vrplib.read_instance(\n        path=file_path,\n        instance_format=\"solomon\",\n        compute_edge_weights=edge_weights,\n    )\n
"},{"location":"docs/content/api/data/#data.utils.load_solomon_solution","title":"load_solomon_solution","text":"
load_solomon_solution(name, path=None)\n

Load solomon solution from a file

Source code in rl4co/data/utils.py
def load_solomon_solution(name, path=None):\n    \"\"\"Load solomon solution from a file\"\"\"\n    import vrplib\n\n    if not path:\n        path = \"data/solomon/solutions/\"\n        path = os.path.join(ROOT_PATH, path)\n    if not os.path.isdir(path):\n        os.makedirs(path)\n    file_path = f\"{path}{name}.sol\"\n    if not os.path.isfile(file_path):\n        vrplib.download_solution(name=name, path=path)\n    return vrplib.read_solution(path=file_path)\n
"},{"location":"docs/content/api/decoding/","title":"Decoding Strategies","text":"

Classes:

  • DecodingStrategy \u2013

    Base class for decoding strategies. Subclasses should implement the _step method.

  • Greedy \u2013
  • Sampling \u2013
  • Evaluate \u2013
  • BeamSearch \u2013

Functions:

  • get_log_likelihood \u2013

    Get log likelihood of selected actions.

  • decode_logprobs \u2013

    Decode log probabilities to select actions with mask.

  • random_policy \u2013

    Helper function to select a random action from available actions

  • rollout \u2013

    Helper function to rollout a policy. Currently, TorchRL does not allow to step

  • modify_logits_for_top_k_filtering \u2013

    Set the logits for non-top-k values to -inf. Done out-of-place.

  • modify_logits_for_top_p_filtering \u2013

    Set the logits for non-top-p values to -inf. Done out-of-place.

  • process_logits \u2013

    Convert logits to log probabilities with additional features like temperature scaling, top-k and top-p sampling.

"},{"location":"docs/content/api/decoding/#utils.decoding.DecodingStrategy","title":"DecodingStrategy","text":"
DecodingStrategy(\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs\n)\n

Base class for decoding strategies. Subclasses should implement the _step method. Includes hooks for pre and post main decoding operations.

Parameters:

  • temperature (float, default: 1.0 ) \u2013

    Temperature scaling. Higher values make the distribution more uniform (exploration), lower values make it more peaky (exploitation). Defaults to 1.0.

  • top_p (float, default: 0.0 ) \u2013

    Top-p sampling, a.k.a. Nucleus Sampling (https://arxiv.org/abs/1904.09751). Defaults to 0.0.

  • top_k (int, default: 0 ) \u2013

    Top-k sampling, i.e. restrict sampling to the top k logits. If 0, do not perform. Defaults to 0.

  • mask_logits (bool, default: True ) \u2013

    Whether to mask logits of infeasible actions. Defaults to True.

  • tanh_clipping (float, default: 0 ) \u2013

    Tanh clipping (https://arxiv.org/abs/1611.09940). Defaults to 0.

  • multisample (bool, default: False ) \u2013

    Whether to use sampling decoding. Defaults to False.

  • num_samples (Optional[int], default: None ) \u2013

    Number of samples to evaluate during decoding. Defaults to None.

  • num_starts (Optional[int], default: None ) \u2013

    Number of starts for multistart decoding. Defaults to None.

  • multistart (bool, default: False ) \u2013

    Whether to use multistart decoding. Defaults to False.

  • select_start_nodes_fn (Optional[callable], default: None ) \u2013

    Function to select start nodes for multistart decoding. Defaults to None.

  • improvement_method_mode (bool, default: False ) \u2013

    Whether to use improvement method mode. Defaults to False.

  • select_best (bool, default: False ) \u2013

    Whether to select the best action or return all. Defaults to False.

  • store_all_logp (bool, default: False ) \u2013

    Whether to store all log probabilities. Defaults to False. If True, logprobs will be stored for all actions. Note that this will increase memory usage.

Methods:

  • pre_decoder_hook \u2013

    Pre decoding hook. This method is called before the main decoding operation.

  • step \u2013

    Main decoding operation. This method should be called in a loop until all sequences are done.

  • greedy \u2013

    Select the action with the highest probability.

  • sampling \u2013

    Sample an action with a multinomial distribution given by the log probabilities.

Source code in rl4co/utils/decoding.py
def __init__(\n    self,\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs,\n) -> None:\n    self.temperature = temperature\n    self.top_p = top_p\n    self.top_k = top_k\n    self.mask_logits = mask_logits\n    self.tanh_clipping = tanh_clipping\n    # check if multistart (POMO) and multisample flags\n    assert not (\n        multistart and multisample\n    ), \"Using both multistart and multisample is not supported\"\n    if num_samples and num_starts:\n        assert not (\n            num_samples > 1 and num_starts > 1\n        ), f\"num_samples={num_samples} and num_starts={num_starts} are both > 1\"\n    if num_samples is not None:\n        multisample = True if num_samples > 1 else False\n    if num_starts is not None:\n        multistart = True if num_starts > 1 else False\n    self.multistart = multistart\n    self.multisample = multisample\n    # num_starts is used for both multistart and multisample\n    # the function is to use start multiple rollouts for the same instance in parallel\n    self.num_starts = num_starts if multistart else num_samples\n\n    self.select_start_nodes_fn = select_start_nodes_fn\n    self.improvement_method_mode = improvement_method_mode\n    self.select_best = select_best\n    self.store_all_logp = store_all_logp\n    # initialize buffers\n    self.actions = []\n    self.logprobs = []\n
"},{"location":"docs/content/api/decoding/#utils.decoding.DecodingStrategy.pre_decoder_hook","title":"pre_decoder_hook","text":"
pre_decoder_hook(\n    td: TensorDict, env: RL4COEnvBase, action: Tensor = None\n)\n

Pre decoding hook. This method is called before the main decoding operation.

Source code in rl4co/utils/decoding.py
def pre_decoder_hook(\n    self, td: TensorDict, env: RL4COEnvBase, action: torch.Tensor = None\n):\n    \"\"\"Pre decoding hook. This method is called before the main decoding operation.\"\"\"\n\n    # Multi-start decoding. If num_starts is None, we use the number of actions in the action mask\n    if self.multistart or self.multisample:\n        if self.num_starts is None:\n            self.num_starts = env.get_num_starts(td)\n            if self.multisample:\n                log.warn(\n                    f\"num_starts is not provided for sampling, using num_starts={self.num_starts}\"\n                )\n    else:\n        if self.num_starts is not None:\n            if self.num_starts >= 1:\n                log.warn(\n                    f\"num_starts={self.num_starts} is ignored for decode_type={self.name}\"\n                )\n\n        self.num_starts = 0\n\n    # Multi-start decoding: first action is chosen by ad-hoc node selection\n    if self.num_starts >= 1:\n        if self.multistart:\n            if action is None:  # if action is provided, we use it as the first action\n                if self.select_start_nodes_fn is not None:\n                    action = self.select_start_nodes_fn(td, env, self.num_starts)\n                else:\n                    action = env.select_start_nodes(td, num_starts=self.num_starts)\n\n            # Expand td to batch_size * num_starts\n            td = batchify(td, self.num_starts)\n\n            td.set(\"action\", action)\n            td = env.step(td)[\"next\"]\n            # first logprobs is 0, so p = logprobs.exp() = 1\n            if self.store_all_logp:\n                logprobs = torch.zeros_like(td[\"action_mask\"])  # [B, N]\n            else:\n                logprobs = torch.zeros_like(action, device=td.device)  # [B]\n\n            self.logprobs.append(logprobs)\n            self.actions.append(action)\n        else:\n            # Expand td to batch_size * num_samplestarts\n            td = batchify(td, 
self.num_starts)\n\n    return td, env, self.num_starts\n
"},{"location":"docs/content/api/decoding/#utils.decoding.DecodingStrategy.step","title":"step","text":"
step(\n    logits: Tensor,\n    mask: Tensor,\n    td: TensorDict = None,\n    action: Tensor = None,\n    **kwargs\n) -> TensorDict\n

Main decoding operation. This method should be called in a loop until all sequences are done.

Parameters:

  • logits (Tensor) \u2013

    Logits from the model.

  • mask (Tensor) \u2013

    Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch).

  • td (TensorDict, default: None ) \u2013

    TensorDict containing the current state of the environment.

  • action (Tensor, default: None ) \u2013

    Optional action to use, e.g. for evaluating log probabilities.

Source code in rl4co/utils/decoding.py
def step(\n    self,\n    logits: torch.Tensor,\n    mask: torch.Tensor,\n    td: TensorDict = None,\n    action: torch.Tensor = None,\n    **kwargs,\n) -> TensorDict:\n    \"\"\"Main decoding operation. This method should be called in a loop until all sequences are done.\n\n    Args:\n        logits: Logits from the model.\n        mask: Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch).\n        td: TensorDict containing the current state of the environment.\n        action: Optional action to use, e.g. for evaluating log probabilities.\n    \"\"\"\n    if not self.mask_logits:  # set mask_logit to None if mask_logits is False\n        mask = None\n\n    logprobs = process_logits(\n        logits,\n        mask,\n        temperature=self.temperature,\n        top_p=self.top_p,\n        top_k=self.top_k,\n        tanh_clipping=self.tanh_clipping,\n        mask_logits=self.mask_logits,\n    )\n    logprobs, selected_action, td = self._step(\n        logprobs, mask, td, action=action, **kwargs\n    )\n\n    # directly return for improvement methods, since the action for improvement methods is finalized in its own policy\n    if self.improvement_method_mode:\n        return logprobs, selected_action\n    # for others\n    if not self.store_all_logp:\n        logprobs = gather_by_index(logprobs, selected_action, dim=1)\n    td.set(\"action\", selected_action)\n    self.actions.append(selected_action)\n    self.logprobs.append(logprobs)\n    return td\n
"},{"location":"docs/content/api/decoding/#utils.decoding.DecodingStrategy.greedy","title":"greedy staticmethod","text":"
greedy(logprobs, mask=None)\n

Select the action with the highest probability.

Source code in rl4co/utils/decoding.py
@staticmethod\ndef greedy(logprobs, mask=None):\n    \"\"\"Select the action with the highest probability.\"\"\"\n    # [BS], [BS]\n    selected = logprobs.argmax(dim=-1)\n    if mask is not None:\n        assert (\n            not (~mask).gather(1, selected.unsqueeze(-1)).data.any()\n        ), \"infeasible action selected\"\n\n    return selected\n
"},{"location":"docs/content/api/decoding/#utils.decoding.DecodingStrategy.sampling","title":"sampling staticmethod","text":"
sampling(logprobs, mask=None)\n

Sample an action with a multinomial distribution given by the log probabilities.

Source code in rl4co/utils/decoding.py
@staticmethod\ndef sampling(logprobs, mask=None):\n    \"\"\"Sample an action with a multinomial distribution given by the log probabilities.\"\"\"\n    probs = logprobs.exp()\n    selected = torch.multinomial(probs, 1).squeeze(1)\n\n    if mask is not None:\n        while (~mask).gather(1, selected.unsqueeze(-1)).data.any():\n            log.info(\"Sampled bad values, resampling!\")\n            selected = probs.multinomial(1).squeeze(1)\n        assert (\n            not (~mask).gather(1, selected.unsqueeze(-1)).data.any()\n        ), \"infeasible action selected\"\n\n    return selected\n
"},{"location":"docs/content/api/decoding/#utils.decoding.Greedy","title":"Greedy","text":"
Greedy(\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs\n)\n

Bases: DecodingStrategy

Source code in rl4co/utils/decoding.py
def __init__(\n    self,\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs,\n) -> None:\n    self.temperature = temperature\n    self.top_p = top_p\n    self.top_k = top_k\n    self.mask_logits = mask_logits\n    self.tanh_clipping = tanh_clipping\n    # check if multistart (POMO) and multisample flags\n    assert not (\n        multistart and multisample\n    ), \"Using both multistart and multisample is not supported\"\n    if num_samples and num_starts:\n        assert not (\n            num_samples > 1 and num_starts > 1\n        ), f\"num_samples={num_samples} and num_starts={num_starts} are both > 1\"\n    if num_samples is not None:\n        multisample = True if num_samples > 1 else False\n    if num_starts is not None:\n        multistart = True if num_starts > 1 else False\n    self.multistart = multistart\n    self.multisample = multisample\n    # num_starts is used for both multistart and multisample\n    # the function is to use start multiple rollouts for the same instance in parallel\n    self.num_starts = num_starts if multistart else num_samples\n\n    self.select_start_nodes_fn = select_start_nodes_fn\n    self.improvement_method_mode = improvement_method_mode\n    self.select_best = select_best\n    self.store_all_logp = store_all_logp\n    # initialize buffers\n    self.actions = []\n    self.logprobs = []\n
"},{"location":"docs/content/api/decoding/#utils.decoding.Sampling","title":"Sampling","text":"
Sampling(\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs\n)\n

Bases: DecodingStrategy

Source code in rl4co/utils/decoding.py
def __init__(\n    self,\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs,\n) -> None:\n    self.temperature = temperature\n    self.top_p = top_p\n    self.top_k = top_k\n    self.mask_logits = mask_logits\n    self.tanh_clipping = tanh_clipping\n    # check if multistart (POMO) and multisample flags\n    assert not (\n        multistart and multisample\n    ), \"Using both multistart and multisample is not supported\"\n    if num_samples and num_starts:\n        assert not (\n            num_samples > 1 and num_starts > 1\n        ), f\"num_samples={num_samples} and num_starts={num_starts} are both > 1\"\n    if num_samples is not None:\n        multisample = True if num_samples > 1 else False\n    if num_starts is not None:\n        multistart = True if num_starts > 1 else False\n    self.multistart = multistart\n    self.multisample = multisample\n    # num_starts is used for both multistart and multisample\n    # the function is to use start multiple rollouts for the same instance in parallel\n    self.num_starts = num_starts if multistart else num_samples\n\n    self.select_start_nodes_fn = select_start_nodes_fn\n    self.improvement_method_mode = improvement_method_mode\n    self.select_best = select_best\n    self.store_all_logp = store_all_logp\n    # initialize buffers\n    self.actions = []\n    self.logprobs = []\n
"},{"location":"docs/content/api/decoding/#utils.decoding.Evaluate","title":"Evaluate","text":"
Evaluate(\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs\n)\n

Bases: DecodingStrategy

Source code in rl4co/utils/decoding.py
def __init__(\n    self,\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    mask_logits: bool = True,\n    tanh_clipping: float = 0,\n    num_samples: Optional[int] = None,\n    multisample: bool = False,\n    num_starts: Optional[int] = None,\n    multistart: bool = False,\n    select_start_nodes_fn: Optional[callable] = None,\n    improvement_method_mode: bool = False,\n    select_best: bool = False,\n    store_all_logp: bool = False,\n    **kwargs,\n) -> None:\n    self.temperature = temperature\n    self.top_p = top_p\n    self.top_k = top_k\n    self.mask_logits = mask_logits\n    self.tanh_clipping = tanh_clipping\n    # check if multistart (POMO) and multisample flags\n    assert not (\n        multistart and multisample\n    ), \"Using both multistart and multisample is not supported\"\n    if num_samples and num_starts:\n        assert not (\n            num_samples > 1 and num_starts > 1\n        ), f\"num_samples={num_samples} and num_starts={num_starts} are both > 1\"\n    if num_samples is not None:\n        multisample = True if num_samples > 1 else False\n    if num_starts is not None:\n        multistart = True if num_starts > 1 else False\n    self.multistart = multistart\n    self.multisample = multisample\n    # num_starts is used for both multistart and multisample\n    # the function is to use start multiple rollouts for the same instance in parallel\n    self.num_starts = num_starts if multistart else num_samples\n\n    self.select_start_nodes_fn = select_start_nodes_fn\n    self.improvement_method_mode = improvement_method_mode\n    self.select_best = select_best\n    self.store_all_logp = store_all_logp\n    # initialize buffers\n    self.actions = []\n    self.logprobs = []\n
"},{"location":"docs/content/api/decoding/#utils.decoding.BeamSearch","title":"BeamSearch","text":"
BeamSearch(beam_width=None, select_best=True, **kwargs)\n

Bases: DecodingStrategy

Methods:

  • pre_decoder_hook \u2013

    Pre decoding hook. This method is called before the main decoding operation.

Source code in rl4co/utils/decoding.py
def __init__(self, beam_width=None, select_best=True, **kwargs) -> None:\n    # TODO do we really need all logp in beam search?\n    kwargs[\"store_all_logp\"] = True\n    super().__init__(**kwargs)\n    self.beam_width = beam_width\n    self.select_best = select_best\n    self.parent_beam_logprobs = None\n    self.beam_path = []\n
"},{"location":"docs/content/api/decoding/#utils.decoding.BeamSearch.pre_decoder_hook","title":"pre_decoder_hook","text":"
pre_decoder_hook(\n    td: TensorDict, env: RL4COEnvBase, **kwargs\n)\n

Pre decoding hook. This method is called before the main decoding operation.

Source code in rl4co/utils/decoding.py
def pre_decoder_hook(self, td: TensorDict, env: RL4COEnvBase, **kwargs):\n    if self.beam_width is None:\n        self.beam_width = env.get_num_starts(td)\n    assert self.beam_width > 1, \"beam width must be larger than 1\"\n\n    # select start nodes. TODO: include first step in beam search as well\n    if self.select_start_nodes_fn is not None:\n        action = self.select_start_nodes_fn(td, env, self.beam_width)\n    else:\n        action = env.select_start_nodes(td, num_starts=self.beam_width)\n\n    # Expand td to batch_size * beam_width\n    td = batchify(td, self.beam_width)\n\n    td.set(\"action\", action)\n    td = env.step(td)[\"next\"]\n\n    logprobs = torch.zeros_like(td[\"action_mask\"], device=td.device)\n    beam_parent = torch.zeros(logprobs.size(0), device=td.device, dtype=torch.int32)\n\n    self.logprobs.append(logprobs)\n    self.actions.append(action)\n    self.parent_beam_logprobs = logprobs.gather(1, action[..., None])\n    self.beam_path.append(beam_parent)\n\n    return td, env, self.beam_width\n
"},{"location":"docs/content/api/decoding/#utils.decoding.get_log_likelihood","title":"get_log_likelihood","text":"
get_log_likelihood(\n    logprobs,\n    actions=None,\n    mask=None,\n    return_sum: bool = True,\n)\n

Get log likelihood of selected actions. Note that mask is a boolean tensor where True means the value should be kept.

Parameters:

  • logprobs \u2013

    Log probabilities of actions from the model (batch_size, seq_len, action_dim).

  • actions \u2013

    Selected actions (batch_size, seq_len).

  • mask \u2013

    Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch).

  • return_sum (bool, default: True ) \u2013

    Whether to return the sum of log probabilities or not. Defaults to True.

Source code in rl4co/utils/decoding.py
def get_log_likelihood(logprobs, actions=None, mask=None, return_sum: bool = True):\n    \"\"\"Get log likelihood of selected actions.\n    Note that mask is a boolean tensor where True means the value should be kept.\n\n    Args:\n        logprobs: Log probabilities of actions from the model (batch_size, seq_len, action_dim).\n        actions: Selected actions (batch_size, seq_len).\n        mask: Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch).\n        return_sum: Whether to return the sum of log probabilities or not. Defaults to True.\n    \"\"\"\n    # Optional: select logp when logp.shape = (bs, dec_steps, N)\n    if actions is not None and logprobs.dim() == 3:\n        logprobs = logprobs.gather(-1, actions.unsqueeze(-1)).squeeze(-1)\n\n    # Optional: mask out actions irrelevant to objective so they do not get reinforced\n    if mask is not None:\n        logprobs[~mask] = 0\n\n    assert (\n        logprobs > -1000\n    ).data.all(), \"Logprobs should not be -inf, check sampling procedure!\"\n\n    # Calculate log_likelihood\n    if return_sum:\n        return logprobs.sum(1)  # [batch]\n    else:\n        return logprobs  # [batch, decode_len]\n
"},{"location":"docs/content/api/decoding/#utils.decoding.decode_logprobs","title":"decode_logprobs","text":"
decode_logprobs(logprobs, mask, decode_type='sampling')\n

Decode log probabilities to select actions with mask. Note that mask is a boolean tensor where True means the value should be kept.

Source code in rl4co/utils/decoding.py
def decode_logprobs(logprobs, mask, decode_type=\"sampling\"):\n    \"\"\"Decode log probabilities to select actions with mask.\n    Note that mask is a boolean tensor where True means the value should be kept.\n    \"\"\"\n    if \"greedy\" in decode_type:\n        selected = DecodingStrategy.greedy(logprobs, mask)\n    elif \"sampling\" in decode_type:\n        selected = DecodingStrategy.sampling(logprobs, mask)\n    else:\n        assert False, \"Unknown decode type: {}\".format(decode_type)\n    return selected\n
"},{"location":"docs/content/api/decoding/#utils.decoding.random_policy","title":"random_policy","text":"
random_policy(td)\n

Helper function to select a random action from available actions

Source code in rl4co/utils/decoding.py
def random_policy(td):\n    \"\"\"Helper function to select a random action from available actions\"\"\"\n    action = torch.multinomial(td[\"action_mask\"].float(), 1).squeeze(-1)\n    td.set(\"action\", action)\n    return td\n
"},{"location":"docs/content/api/decoding/#utils.decoding.rollout","title":"rollout","text":"
rollout(env, td, policy, max_steps: int = None)\n

Helper function to roll out a policy. Currently, TorchRL does not allow stepping over envs when done with env.rollout(). We need this for environments that complete at different steps.

Source code in rl4co/utils/decoding.py
def rollout(env, td, policy, max_steps: int = None):\n    \"\"\"Helper function to rollout a policy. Currently, TorchRL does not allow to step\n    over envs when done with `env.rollout()`. We need this because for environments that complete at different steps.\n    \"\"\"\n\n    max_steps = float(\"inf\") if max_steps is None else max_steps\n    actions = []\n    steps = 0\n\n    while not td[\"done\"].all():\n        td = policy(td)\n        actions.append(td[\"action\"])\n        td = env.step(td)[\"next\"]\n        steps += 1\n        if steps > max_steps:\n            log.info(\"Max steps reached\")\n            break\n    return (\n        env.get_reward(td, torch.stack(actions, dim=1)),\n        td,\n        torch.stack(actions, dim=1),\n    )\n
"},{"location":"docs/content/api/decoding/#utils.decoding.modify_logits_for_top_k_filtering","title":"modify_logits_for_top_k_filtering","text":"
modify_logits_for_top_k_filtering(logits, top_k)\n

Set the logits for non-top-k values to -inf. Done out-of-place. Ref: https://github.com/togethercomputer/stripedhyena/blob/7e13f618027fea9625be1f2d2d94f9a361f6bd02/stripedhyena/sample.py#L6

Source code in rl4co/utils/decoding.py
def modify_logits_for_top_k_filtering(logits, top_k):\n    \"\"\"Set the logits for none top-k values to -inf. Done out-of-place.\n    Ref: https://github.com/togethercomputer/stripedhyena/blob/7e13f618027fea9625be1f2d2d94f9a361f6bd02/stripedhyena/sample.py#L6\n    \"\"\"\n    indices_to_remove = logits < torch.topk(logits, top_k)[0][..., -1, None]\n    return logits.masked_fill(indices_to_remove, float(\"-inf\"))\n
"},{"location":"docs/content/api/decoding/#utils.decoding.modify_logits_for_top_p_filtering","title":"modify_logits_for_top_p_filtering","text":"
modify_logits_for_top_p_filtering(logits, top_p)\n

Set the logits for non-top-p values to -inf. Done out-of-place. Ref: https://github.com/togethercomputer/stripedhyena/blob/7e13f618027fea9625be1f2d2d94f9a361f6bd02/stripedhyena/sample.py#L14

Source code in rl4co/utils/decoding.py
def modify_logits_for_top_p_filtering(logits, top_p):\n    \"\"\"Set the logits for none top-p values to -inf. Done out-of-place.\n    Ref: https://github.com/togethercomputer/stripedhyena/blob/7e13f618027fea9625be1f2d2d94f9a361f6bd02/stripedhyena/sample.py#L14\n    \"\"\"\n    if top_p <= 0.0 or top_p >= 1.0:\n        return logits\n\n    # First sort and calculate cumulative sum of probabilities.\n    sorted_logits, sorted_indices = torch.sort(logits, descending=False)\n    cumulative_probs = sorted_logits.softmax(dim=-1).cumsum(dim=-1)\n\n    # Remove tokens with cumulative top_p above the threshold (token with 0 are kept)\n    sorted_indices_to_remove = cumulative_probs <= (1 - top_p)\n\n    # Scatter sorted tensors to original indexing\n    indices_to_remove = sorted_indices_to_remove.scatter(\n        -1, sorted_indices, sorted_indices_to_remove\n    )\n    return logits.masked_fill(indices_to_remove, float(\"-inf\"))\n
"},{"location":"docs/content/api/decoding/#utils.decoding.process_logits","title":"process_logits","text":"
process_logits(\n    logits: Tensor,\n    mask: Tensor = None,\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n)\n

Convert logits to log probabilities with additional features like temperature scaling, top-k and top-p sampling.

Note

We convert to log probabilities instead of probabilities to avoid numerical instability. This is because, roughly, softmax = exp(logits) / sum(exp(logits)) and log(softmax) = logits - log(sum(exp(logits))), and avoiding the division by the sum of exponentials can help with numerical stability. You may check the official PyTorch documentation.

Parameters:

  • logits (Tensor) \u2013

    Logits from the model (batch_size, num_actions).

  • mask (Tensor, default: None ) \u2013

    Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch).

  • temperature (float, default: 1.0 ) \u2013

    Temperature scaling. Higher values make the distribution more uniform (exploration), lower values make it more peaky (exploitation).

  • top_p (float, default: 0.0 ) \u2013

    Top-p sampling, a.k.a. Nucleus Sampling (https://arxiv.org/abs/1904.09751). Remove tokens that have a cumulative probability less than the threshold 1 - top_p (lower tail of the distribution). If 0, do not perform.

  • top_k (int, default: 0 ) \u2013

    Top-k sampling, i.e. restrict sampling to the top k logits. If 0, do not perform. Note that we only do filtering and do not return all the top-k logits here.

  • tanh_clipping (float, default: 0 ) \u2013

    Tanh clipping (https://arxiv.org/abs/1611.09940).

  • mask_logits (bool, default: True ) \u2013

    Whether to mask logits of infeasible actions.

Source code in rl4co/utils/decoding.py
def process_logits(\n    logits: torch.Tensor,\n    mask: torch.Tensor = None,\n    temperature: float = 1.0,\n    top_p: float = 0.0,\n    top_k: int = 0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n):\n    \"\"\"Convert logits to log probabilities with additional features like temperature scaling, top-k and top-p sampling.\n\n    Note:\n        We convert to log probabilities instead of probabilities to avoid numerical instability.\n        This is because, roughly, softmax = exp(logits) / sum(exp(logits)) and log(softmax) = logits - log(sum(exp(logits))),\n        and avoiding the division by the sum of exponentials can help with numerical stability.\n        You may check the [official PyTorch documentation](https://pytorch.org/docs/stable/generated/torch.nn.functional.log_softmax.html).\n\n    Args:\n        logits: Logits from the model (batch_size, num_actions).\n        mask: Action mask. 1 if feasible, 0 otherwise (so we keep if 1 as done in PyTorch).\n        temperature: Temperature scaling. Higher values make the distribution more uniform (exploration),\n            lower values make it more peaky (exploitation).\n        top_p: Top-p sampling, a.k.a. Nucleus Sampling (https://arxiv.org/abs/1904.09751). Remove tokens that have a cumulative probability\n            less than the threshold 1 - top_p (lower tail of the distribution). If 0, do not perform.\n        top_k: Top-k sampling, i.e. restrict sampling to the top k logits. If 0, do not perform. Note that we only do filtering and\n            do not return all the top-k logits here.\n        tanh_clipping: Tanh clipping (https://arxiv.org/abs/1611.09940).\n        mask_logits: Whether to mask logits of infeasible actions.\n    \"\"\"\n\n    # Tanh clipping from Bello et al. 
2016\n    if tanh_clipping > 0:\n        logits = torch.tanh(logits) * tanh_clipping\n\n    # In RL, we want to mask the logits to prevent the agent from selecting infeasible actions\n    if mask_logits:\n        assert mask is not None, \"mask must be provided if mask_logits is True\"\n        logits[~mask] = float(\"-inf\")\n\n    logits = logits / temperature  # temperature scaling\n\n    if top_k > 0:\n        top_k = min(top_k, logits.size(-1))  # safety check\n        logits = modify_logits_for_top_k_filtering(logits, top_k)\n\n    if top_p > 0:\n        assert top_p <= 1.0, \"top-p should be in (0, 1].\"\n        logits = modify_logits_for_top_p_filtering(logits, top_p)\n\n    # Compute log probabilities\n    return F.log_softmax(logits, dim=-1)\n
"},{"location":"docs/content/api/tasks/","title":"Train and Evaluation","text":""},{"location":"docs/content/api/tasks/#train","title":"Train","text":"

Functions:

  • run \u2013

    Trains the model. Can additionally evaluate on a test set, using the best weights obtained during training.

"},{"location":"docs/content/api/tasks/#tasks.train.run","title":"run","text":"
run(cfg: DictConfig) -> Tuple[dict, dict]\n

Trains the model. Can additionally evaluate on a test set, using the best weights obtained during training. This method is wrapped in the optional @task_wrapper decorator, which controls the behavior during failure. Useful for multiruns, saving info about the crash, etc.

Parameters:

  • cfg (DictConfig) \u2013

    Configuration composed by Hydra.

Returns: Tuple[dict, dict]: Dict with metrics and dict with all instantiated objects.

Source code in rl4co/tasks/train.py
@utils.task_wrapper\ndef run(cfg: DictConfig) -> Tuple[dict, dict]:\n    \"\"\"Trains the model. Can additionally evaluate on a testset, using best weights obtained during\n    training.\n    This method is wrapped in optional @task_wrapper decorator, that controls the behavior during\n    failure. Useful for multiruns, saving info about the crash, etc.\n\n    Args:\n        cfg (DictConfig): Configuration composed by Hydra.\n    Returns:\n        Tuple[dict, dict]: Dict with metrics and dict with all instantiated objects.\n    \"\"\"\n\n    # set seed for random number generators in pytorch, numpy and python.random\n    if cfg.get(\"seed\"):\n        L.seed_everything(cfg.seed, workers=True)\n\n    # We instantiate the environment separately and then pass it to the model\n    log.info(f\"Instantiating environment <{cfg.env._target_}>\")\n    env = hydra.utils.instantiate(cfg.env)\n\n    # Note that the RL environment is instantiated inside the model\n    log.info(f\"Instantiating model <{cfg.model._target_}>\")\n    model: LightningModule = hydra.utils.instantiate(cfg.model, env)\n\n    log.info(\"Instantiating callbacks...\")\n    callbacks: List[Callback] = utils.instantiate_callbacks(cfg.get(\"callbacks\"))\n\n    log.info(\"Instantiating loggers...\")\n    logger: List[Logger] = utils.instantiate_loggers(cfg.get(\"logger\"), model)\n\n    log.info(\"Instantiating trainer...\")\n    trainer: RL4COTrainer = hydra.utils.instantiate(\n        cfg.trainer,\n        callbacks=callbacks,\n        logger=logger,\n    )\n\n    object_dict = {\n        \"cfg\": cfg,\n        \"model\": model,\n        \"callbacks\": callbacks,\n        \"logger\": logger,\n        \"trainer\": trainer,\n    }\n\n    if logger:\n        log.info(\"Logging hyperparameters!\")\n        utils.log_hyperparameters(object_dict)\n\n    if cfg.get(\"compile\", False):\n        log.info(\"Compiling model!\")\n        model = torch.compile(model)\n\n    if cfg.get(\"train\"):\n        
log.info(\"Starting training!\")\n        trainer.fit(model=model, ckpt_path=cfg.get(\"ckpt_path\"))\n\n        train_metrics = trainer.callback_metrics\n\n    if cfg.get(\"test\"):\n        log.info(\"Starting testing!\")\n        ckpt_path = trainer.checkpoint_callback.best_model_path\n        if ckpt_path == \"\":\n            log.warning(\"Best ckpt not found! Using current weights for testing...\")\n            ckpt_path = None\n        trainer.test(model=model, ckpt_path=ckpt_path)\n        log.info(f\"Best ckpt path: {ckpt_path}\")\n\n    test_metrics = trainer.callback_metrics\n\n    # merge train and test metrics\n    metric_dict = {**train_metrics, **test_metrics}\n\n    return metric_dict, object_dict\n
"},{"location":"docs/content/api/tasks/#evaluate","title":"Evaluate","text":"

Classes:

  • EvalBase \u2013

    Base class for evaluation

  • GreedyEval \u2013

    Evaluates the policy using greedy decoding and single trajectory

  • AugmentationEval \u2013

    Evaluates the policy via N state augmentations

  • SamplingEval \u2013

    Evaluates the policy via N samples from the policy

  • GreedyMultiStartEval \u2013

    Evaluates the policy via num_starts greedy multistart samples from the policy

  • GreedyMultiStartAugmentEval \u2013

    Evaluates the policy via num_starts samples from the policy and num_augment augmentations of each sample.

Functions:

  • get_automatic_batch_size \u2013

    Automatically reduces the batch size based on the eval function

"},{"location":"docs/content/api/tasks/#tasks.eval.EvalBase","title":"EvalBase","text":"
EvalBase(env, progress=True, **kwargs)\n

Base class for evaluation

Parameters:

  • env \u2013

    Environment

  • progress \u2013

    Whether to show progress bar

  • **kwargs \u2013

    Additional arguments (to be implemented in subclasses)

Source code in rl4co/tasks/eval.py
def __init__(self, env, progress=True, **kwargs):\n    check_unused_kwargs(self, kwargs)\n    self.env = env\n    self.progress = progress\n
"},{"location":"docs/content/api/tasks/#tasks.eval.GreedyEval","title":"GreedyEval","text":"
GreedyEval(env, **kwargs)\n

Bases: EvalBase

Evaluates the policy using greedy decoding and single trajectory

Source code in rl4co/tasks/eval.py
def __init__(self, env, **kwargs):\n    check_unused_kwargs(self, kwargs)\n    super().__init__(env, kwargs.get(\"progress\", True))\n
"},{"location":"docs/content/api/tasks/#tasks.eval.AugmentationEval","title":"AugmentationEval","text":"
AugmentationEval(\n    env,\n    num_augment=8,\n    force_dihedral_8=False,\n    feats=None,\n    **kwargs\n)\n

Bases: EvalBase

Evaluates the policy via N state augmentations. force_dihedral_8 forces the use of 8 augmentations (rotations and flips) as in POMO; see https://en.wikipedia.org/wiki/Examples_of_groups#dihedral_group_of_order_8

Parameters:

  • num_augment (int, default: 8 ) \u2013

    Number of state augmentations

  • force_dihedral_8 (bool, default: False ) \u2013

    Whether to force the use of 8 augmentations

Source code in rl4co/tasks/eval.py
def __init__(self, env, num_augment=8, force_dihedral_8=False, feats=None, **kwargs):\n    check_unused_kwargs(self, kwargs)\n    super().__init__(env, kwargs.get(\"progress\", True))\n    self.augmentation = StateAugmentation(\n        num_augment=num_augment,\n        augment_fn=\"dihedral8\" if force_dihedral_8 else \"symmetric\",\n        feats=feats,\n    )\n
"},{"location":"docs/content/api/tasks/#tasks.eval.SamplingEval","title":"SamplingEval","text":"
SamplingEval(\n    env,\n    samples,\n    softmax_temp=None,\n    select_best=True,\n    temperature=1.0,\n    top_p=0.0,\n    top_k=0,\n    **kwargs\n)\n

Bases: EvalBase

Evaluates the policy via N samples from the policy

Parameters:

  • samples (int) \u2013

    Number of samples to take

  • softmax_temp (float, default: None ) \u2013

    Temperature for softmax sampling. The higher the temperature, the more random the sampling

Source code in rl4co/tasks/eval.py
def __init__(\n    self,\n    env,\n    samples,\n    softmax_temp=None,\n    select_best=True,\n    temperature=1.0,\n    top_p=0.0,\n    top_k=0,\n    **kwargs,\n):\n    check_unused_kwargs(self, kwargs)\n    super().__init__(env, kwargs.get(\"progress\", True))\n\n    self.samples = samples\n    self.softmax_temp = softmax_temp\n    self.temperature = temperature\n    self.select_best = select_best\n    self.top_p = top_p\n    self.top_k = top_k\n
"},{"location":"docs/content/api/tasks/#tasks.eval.GreedyMultiStartEval","title":"GreedyMultiStartEval","text":"
GreedyMultiStartEval(env, num_starts=None, **kwargs)\n

Bases: EvalBase

Evaluates the policy via num_starts greedy multistart samples from the policy

Parameters:

  • num_starts (int, default: None ) \u2013

    Number of greedy multistarts to use

Source code in rl4co/tasks/eval.py
def __init__(self, env, num_starts=None, **kwargs):\n    check_unused_kwargs(self, kwargs)\n    super().__init__(env, kwargs.get(\"progress\", True))\n\n    assert num_starts is not None, \"Must specify num_starts\"\n    self.num_starts = num_starts\n
"},{"location":"docs/content/api/tasks/#tasks.eval.GreedyMultiStartAugmentEval","title":"GreedyMultiStartAugmentEval","text":"
GreedyMultiStartAugmentEval(\n    env,\n    num_starts=None,\n    num_augment=8,\n    force_dihedral_8=False,\n    feats=None,\n    **kwargs\n)\n

Bases: EvalBase

Evaluates the policy via num_starts samples from the policy and num_augment augmentations of each sample. force_dihedral_8 forces the use of 8 augmentations (rotations and flips) as in POMO; see https://en.wikipedia.org/wiki/Examples_of_groups#dihedral_group_of_order_8

Parameters:

  • num_starts \u2013

    Number of greedy multistart samples

  • num_augment \u2013

    Number of augmentations per sample

  • force_dihedral_8 \u2013

    If True, force the use of 8 augmentations (rotations and flips) as in POMO

Source code in rl4co/tasks/eval.py
def __init__(\n    self,\n    env,\n    num_starts=None,\n    num_augment=8,\n    force_dihedral_8=False,\n    feats=None,\n    **kwargs,\n):\n    check_unused_kwargs(self, kwargs)\n    super().__init__(env, kwargs.get(\"progress\", True))\n\n    assert num_starts is not None, \"Must specify num_starts\"\n    self.num_starts = num_starts\n    assert not (\n        num_augment != 8 and force_dihedral_8\n    ), \"Cannot force dihedral 8 when num_augment != 8\"\n    self.augmentation = StateAugmentation(\n        num_augment=num_augment,\n        augment_fn=\"dihedral8\" if force_dihedral_8 else \"symmetric\",\n        feats=feats,\n    )\n
"},{"location":"docs/content/api/tasks/#tasks.eval.get_automatic_batch_size","title":"get_automatic_batch_size","text":"
get_automatic_batch_size(\n    eval_fn, start_batch_size=8192, max_batch_size=4096\n)\n

Automatically reduces the batch size based on the eval function

Parameters:

  • eval_fn \u2013

    The eval function

  • start_batch_size \u2013

    The starting batch size. This should be the theoretical maximum batch size

  • max_batch_size \u2013

    The maximum batch size. This is the practical maximum batch size

Source code in rl4co/tasks/eval.py
def get_automatic_batch_size(eval_fn, start_batch_size=8192, max_batch_size=4096):\n    \"\"\"Automatically reduces the batch size based on the eval function\n\n    Args:\n        eval_fn: The eval function\n        start_batch_size: The starting batch size. This should be the theoretical maximum batch size\n        max_batch_size: The maximum batch size. This is the practical maximum batch size\n    \"\"\"\n    batch_size = start_batch_size\n\n    effective_ratio = 1\n\n    if hasattr(eval_fn, \"num_starts\"):\n        batch_size = batch_size // (eval_fn.num_starts // 10)\n        effective_ratio *= eval_fn.num_starts // 10\n    if hasattr(eval_fn, \"num_augment\"):\n        batch_size = batch_size // eval_fn.num_augment\n        effective_ratio *= eval_fn.num_augment\n    if hasattr(eval_fn, \"samples\"):\n        batch_size = batch_size // eval_fn.samples\n        effective_ratio *= eval_fn.samples\n\n    batch_size = min(batch_size, max_batch_size)\n    # get closest integer power of 2\n    batch_size = 2 ** int(np.log2(batch_size))\n\n    print(f\"Effective batch size: {batch_size} (ratio: {effective_ratio})\")\n\n    return batch_size\n
"},{"location":"docs/content/api/envs/base/","title":"Base Environment","text":"

This is the base wrapper around TorchRL's EnvBase, with additional functionality.

"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase","title":"RL4COEnvBase","text":"
RL4COEnvBase(\n    *,\n    data_dir: str = \"data/\",\n    train_file: str = None,\n    val_file: str = None,\n    test_file: str = None,\n    val_dataloader_names: list = None,\n    test_dataloader_names: list = None,\n    check_solution: bool = True,\n    dataset_cls: callable = TensorDictDataset,\n    seed: int = None,\n    device: str = \"cpu\",\n    batch_size: Size = None,\n    run_type_checks: bool = False,\n    allow_done_after_reset: bool = False,\n    _torchrl_mode: bool = False,\n    **kwargs\n)\n

Bases: EnvBase

Base class for RL4CO environments based on TorchRL EnvBase. The environment has the usual methods for stepping, resetting, and getting the specifications of the environment that should be implemented by the subclasses of this class. It also has methods for getting the reward, action mask, and checking the validity of the solution, and for generating and loading the datasets (supporting multiple dataloaders as well for validation and testing).

Parameters:

  • data_dir (str, default: 'data/' ) \u2013

    Root directory for the dataset

  • train_file (str, default: None ) \u2013

    Name of the training file

  • val_file (str, default: None ) \u2013

    Name of the validation file

  • test_file (str, default: None ) \u2013

    Name of the test file

  • val_dataloader_names (list, default: None ) \u2013

    Names of the dataloaders to use for validation

  • test_dataloader_names (list, default: None ) \u2013

    Names of the dataloaders to use for testing

  • check_solution (bool, default: True ) \u2013

    Whether to check the validity of the solution at the end of the episode

  • dataset_cls (callable, default: TensorDictDataset ) \u2013

    Dataset class to use for the environment (which can influence performance)

  • seed (int, default: None ) \u2013

    Seed for the environment

  • device (str, default: 'cpu' ) \u2013

    Device to use. Generally, no need to set as tensors are updated on the fly

  • batch_size (Size, default: None ) \u2013

    Batch size to use for the environment. Generally, no need to set as tensors are updated on the fly

  • run_type_checks (bool, default: False ) \u2013

    If True, run type checks on the TensorDicts at each step

  • allow_done_after_reset (bool, default: False ) \u2013

    If True, an environment can be done after a reset

  • _torchrl_mode (bool, default: False ) \u2013

    Whether to use the TorchRL mode (see :meth:step for more details)

Methods:

  • step \u2013

    Step function to call at each step of the episode containing an action.

  • reset \u2013

    Reset function to call at the beginning of each episode

  • get_reward \u2013

    Function to compute the reward. Can be called by the agent to compute the reward of the current state

  • get_action_mask \u2013

    Function to compute the action mask (feasible actions) for the current state

  • check_solution_validity \u2013

    Function to check whether the solution is valid. Can be called by the agent to check the validity of the current state

  • replace_selected_actions \u2013

    Replace selected current actions with updated actions based on selection_mask.

  • local_search \u2013

    Function to improve the solution. Can be called by the agent to improve the current state

  • dataset \u2013

    Return a dataset of observations

  • transform \u2013

    Used for converting TensorDict variables (such as with torch.cat) efficiently

  • render \u2013

    Render the environment

  • load_data \u2013

    Dataset loading from file

  • to \u2013

    Override to device method for safety against None device (may be found in TensorDict)

  • solve \u2013

    Classical solver for the environment. This is a wrapper for the baselines solver.

Source code in rl4co/envs/common/base.py
def __init__(\n    self,\n    *,\n    data_dir: str = \"data/\",\n    train_file: str = None,\n    val_file: str = None,\n    test_file: str = None,\n    val_dataloader_names: list = None,\n    test_dataloader_names: list = None,\n    check_solution: bool = True,\n    dataset_cls: callable = TensorDictDataset,\n    seed: int = None,\n    device: str = \"cpu\",\n    batch_size: torch.Size = None,\n    run_type_checks: bool = False,\n    allow_done_after_reset: bool = False,\n    _torchrl_mode: bool = False,\n    **kwargs,\n):\n    super().__init__(\n        device=device,\n        batch_size=batch_size,\n        run_type_checks=run_type_checks,\n        allow_done_after_reset=allow_done_after_reset,\n    )\n    # if any kwargs are left, we want to warn the user\n    kwargs.pop(\"name\", None)  # we remove the name for checking\n    if kwargs:\n        log.error(\n            f\"Unused keyword arguments: {', '.join(kwargs.keys())}. \"\n            \"Please check the base class documentation at https://rl4co.readthedocs.io/en/latest/_content/api/envs/base.html. 
\"\n            \"In case you would like to pass data generation arguments, please pass a `generator` method instead \"\n            \"or for example: `generator_kwargs=dict(num_loc=50)` to the constructor.\"\n        )\n    self.data_dir = data_dir\n    self.train_file = pjoin(data_dir, train_file) if train_file is not None else None\n    self._torchrl_mode = _torchrl_mode\n    self.dataset_cls = dataset_cls\n\n    def get_files(f):\n        if f is not None:\n            if isinstance(f, Iterable) and not isinstance(f, str):\n                return [pjoin(data_dir, _f) for _f in f]\n            else:\n                return pjoin(data_dir, f)\n        return None\n\n    def get_multiple_dataloader_names(f, names):\n        if f is not None:\n            if isinstance(f, Iterable) and not isinstance(f, str):\n                if names is None:\n                    names = [f\"{i}\" for i in range(len(f))]\n                else:\n                    assert len(names) == len(\n                        f\n                    ), \"Number of dataloader names must match number of files\"\n            else:\n                if names is not None:\n                    log.warning(\n                        \"Ignoring dataloader names since only one dataloader is provided\"\n                    )\n        return names\n\n    self.val_file = get_files(val_file)\n    self.test_file = get_files(test_file)\n    self.val_dataloader_names = get_multiple_dataloader_names(\n        self.val_file, val_dataloader_names\n    )\n    self.test_dataloader_names = get_multiple_dataloader_names(\n        self.test_file, test_dataloader_names\n    )\n    self.check_solution = check_solution\n    if seed is None:\n        seed = torch.empty((), dtype=torch.int64).random_().item()\n    self.set_seed(seed)\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.step","title":"step","text":"
step(td: TensorDict) -> TensorDict\n

Step function to call at each step of the episode containing an action. If _torchrl_mode is True, we call _torchrl_step instead, which sets the next key of the TensorDict to the next state - this is the usual way to do it in TorchRL, but inefficient in our case.

Source code in rl4co/envs/common/base.py
def step(self, td: TensorDict) -> TensorDict:\n    \"\"\"Step function to call at each step of the episode containing an action.\n    If `_torchrl_mode` is True, we call `_torchrl_step` instead which set the\n    `next` key of the TensorDict to the next state - this is the usual way to do it in TorchRL,\n    but inefficient in our case\n    \"\"\"\n    if not self._torchrl_mode:\n        # Default: just return the TensorDict without farther checks etc is faster\n        td = self._step(td)\n        return {\"next\": td}\n    else:\n        # Since we simplify the syntax\n        return self._torchrl_step(td)\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.reset","title":"reset","text":"
reset(\n    td: Optional[TensorDict] = None, batch_size=None\n) -> TensorDict\n

Reset function to call at the beginning of each episode

Source code in rl4co/envs/common/base.py
def reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict:\n    \"\"\"Reset function to call at the beginning of each episode\"\"\"\n    if batch_size is None:\n        batch_size = self.batch_size if td is None else td.batch_size\n    if td is None or td.is_empty():\n        td = self.generator(batch_size=batch_size)\n    batch_size = [batch_size] if isinstance(batch_size, int) else batch_size\n    self.to(td.device)\n    return super().reset(td, batch_size=batch_size)\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.get_reward","title":"get_reward","text":"
get_reward(td: TensorDict, actions: Tensor) -> Tensor\n

Function to compute the reward. Can be called by the agent to compute the reward of the current state. This is faster than calling step() and getting the reward from the returned TensorDict each time for CO tasks.

Source code in rl4co/envs/common/base.py
def get_reward(self, td: TensorDict, actions: torch.Tensor) -> torch.Tensor:\n    \"\"\"Function to compute the reward. Can be called by the agent to compute the reward of the current state\n    This is faster than calling step() and getting the reward from the returned TensorDict at each time for CO tasks\n    \"\"\"\n    if self.check_solution:\n        self.check_solution_validity(td, actions)\n    return self._get_reward(td, actions)\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.get_action_mask","title":"get_action_mask","text":"
get_action_mask(td: TensorDict) -> Tensor\n

Function to compute the action mask (feasible actions) for the current state. The action mask is 1 if the action is feasible, 0 otherwise.

Source code in rl4co/envs/common/base.py
def get_action_mask(self, td: TensorDict) -> torch.Tensor:\n    \"\"\"Function to compute the action mask (feasible actions) for the current state\n    Action mask is 1 if the action is feasible, 0 otherwise\n    \"\"\"\n    raise NotImplementedError\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.check_solution_validity","title":"check_solution_validity","text":"
check_solution_validity(\n    td: TensorDict, actions: Tensor\n) -> None\n

Function to check whether the solution is valid. Can be called by the agent to check the validity of the current state. This is called with the full solution (i.e. all actions) at the end of the episode.

Source code in rl4co/envs/common/base.py
def check_solution_validity(self, td: TensorDict, actions: torch.Tensor) -> None:\n    \"\"\"Function to check whether the solution is valid. Can be called by the agent to check the validity of the current state\n    This is called with the full solution (i.e. all actions) at the end of the episode\n    \"\"\"\n    raise NotImplementedError\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.replace_selected_actions","title":"replace_selected_actions","text":"
replace_selected_actions(\n    cur_actions: Tensor,\n    new_actions: Tensor,\n    selection_mask: Tensor,\n) -> Tensor\n

Replace selected current actions with updated actions based on selection_mask.

Source code in rl4co/envs/common/base.py
def replace_selected_actions(\n    self,\n    cur_actions: torch.Tensor,\n    new_actions: torch.Tensor,\n    selection_mask: torch.Tensor,\n) -> torch.Tensor:\n    \"\"\"\n    Replace selected current actions with updated actions based on `selection_mask`.\n    \"\"\"\n    raise NotImplementedError\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.local_search","title":"local_search","text":"
local_search(\n    td: TensorDict, actions: Tensor, **kwargs\n) -> Tensor\n

Function to improve the solution. Can be called by the agent to improve the current state. This is called with the full solution (i.e. all actions) at the end of the episode.

Source code in rl4co/envs/common/base.py
def local_search(\n    self, td: TensorDict, actions: torch.Tensor, **kwargs\n) -> torch.Tensor:\n    \"\"\"Function to improve the solution. Can be called by the agent to improve the current state\n    This is called with the full solution (i.e. all actions) at the end of the episode\n    \"\"\"\n    raise NotImplementedError(\n        f\"Local is not implemented yet for {self.name} environment\"\n    )\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.dataset","title":"dataset","text":"
dataset(batch_size=[], phase='train', filename=None)\n

Return a dataset of observations. Generates the dataset if it does not exist, otherwise loads it from file.

Source code in rl4co/envs/common/base.py
def dataset(self, batch_size=[], phase=\"train\", filename=None):\n    \"\"\"Return a dataset of observations\n    Generates the dataset if it does not exist, otherwise loads it from file\n    \"\"\"\n    if filename is not None:\n        log.info(f\"Overriding dataset filename from {filename}\")\n    f = getattr(self, f\"{phase}_file\") if filename is None else filename\n    if f is None:\n        if phase != \"train\":\n            log.warning(f\"{phase}_file not set. Generating dataset instead\")\n        td = self.generator(batch_size)\n    else:\n        log.info(f\"Loading {phase} dataset from {f}\")\n        if phase == \"train\":\n            log.warning(\n                \"Loading training dataset from file. This may not be desired in RL since \"\n                \"the dataset is fixed and the agent will not be able to explore new states\"\n            )\n        try:\n            if isinstance(f, Iterable) and not isinstance(f, str):\n                names = getattr(self, f\"{phase}_dataloader_names\")\n                return {\n                    name: self.dataset_cls(self.load_data(_f, batch_size))\n                    for name, _f in zip(names, f)\n                }\n            else:\n                td = self.load_data(f, batch_size)\n        except FileNotFoundError:\n            log.error(\n                f\"Provided file name {f} not found. Make sure to provide a file in the right path first or \"\n                f\"unset {phase}_file to generate data automatically instead\"\n            )\n            td = self.generator(batch_size)\n\n    return self.dataset_cls(td)\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.transform","title":"transform","text":"
transform()\n

Used for converting TensorDict variables (such as with torch.cat) efficiently; see https://pytorch.org/rl/reference/generated/torchrl.envs.transforms.Transform.html. By default, we do not need to transform the environment since we use specific embeddings.

Source code in rl4co/envs/common/base.py
def transform(self):\n    \"\"\"Used for converting TensorDict variables (such as with torch.cat) efficiently\n    https://pytorch.org/rl/reference/generated/torchrl.envs.transforms.Transform.html\n    By default, we do not need to transform the environment since we use specific embeddings\n    \"\"\"\n    return self\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.render","title":"render","text":"
render(*args, **kwargs)\n

Render the environment

Source code in rl4co/envs/common/base.py
def render(self, *args, **kwargs):\n    \"\"\"Render the environment\"\"\"\n    raise NotImplementedError\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.load_data","title":"load_data staticmethod","text":"
load_data(fpath, batch_size=[])\n

Dataset loading from file

Source code in rl4co/envs/common/base.py
@staticmethod\ndef load_data(fpath, batch_size=[]):\n    \"\"\"Dataset loading from file\"\"\"\n    return load_npz_to_tensordict(fpath)\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.to","title":"to","text":"
to(device)\n

Override to device method for safety against None device (may be found in TensorDict)

Source code in rl4co/envs/common/base.py
def to(self, device):\n    \"\"\"Override `to` device method for safety against `None` device (may be found in `TensorDict`)\"\"\"\n    if device is None:\n        return self\n    else:\n        return super().to(device)\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.RL4COEnvBase.solve","title":"solve staticmethod","text":"
solve(\n    instances: TensorDict,\n    max_runtime: float,\n    num_procs: int = 1,\n    **kwargs\n) -> tuple[Tensor, Tensor]\n

Classical solver for the environment. This is a wrapper for the baselines solver.

Parameters:

  • instances (TensorDict) \u2013

    The instances to solve

  • max_runtime (float) \u2013

    The maximum runtime for the solver

  • num_procs (int, default: 1 ) \u2013

    The number of processes to use

Returns:

  • tuple[Tensor, Tensor] \u2013

    A tuple containing the action and the cost, respectively

Source code in rl4co/envs/common/base.py
@staticmethod\ndef solve(\n    instances: TensorDict,\n    max_runtime: float,\n    num_procs: int = 1,\n    **kwargs,\n) -> tuple[torch.Tensor, torch.Tensor]:\n    \"\"\"Classical solver for the environment. This is a wrapper for the baselines solver.\n\n    Args:\n        instances: The instances to solve\n        max_runtime: The maximum runtime for the solver\n        num_procs: The number of processes to use\n\n    Returns:\n        A tuple containing the action and the cost, respectively\n    \"\"\"\n    raise NotImplementedError\n
"},{"location":"docs/content/api/envs/base/#envs.common.base.ImprovementEnvBase","title":"ImprovementEnvBase","text":"
ImprovementEnvBase(**kwargs)\n

Bases: RL4COEnvBase

Base class for Improvement environments based on RL4CO EnvBase. Note that this class assumes that the solution is stored in a linked list format. Here, if rec[i] = j, it means the node i is connected to node j, i.e., edge i-j is in the solution. For example, if edge 0-1, edge 1-5, edge 2-10 are in the solution, so we have rec[0]=1, rec[1]=5 and rec[2]=10. Kindly see https://github.com/yining043/VRP-DACT/blob/new_version/Play_with_DACT.ipynb for an example at the end for TSP.

Source code in rl4co/envs/common/base.py
def __init__(\n    self,\n    **kwargs,\n):\n    super().__init__(**kwargs)\n
"},{"location":"docs/content/api/envs/base/#utilities","title":"Utilities","text":"

These contain utilities such as the base Generator class and get_sampler.

"},{"location":"docs/content/api/envs/base/#envs.common.utils.Generator","title":"Generator","text":"
Generator(**kwargs)\n

Base data generator class, to be called with env.generator(batch_size)

Source code in rl4co/envs/common/utils.py
def __init__(self, **kwargs):\n    self.kwargs = kwargs\n
"},{"location":"docs/content/api/envs/base/#envs.common.utils.get_sampler","title":"get_sampler","text":"
get_sampler(\n    val_name: str,\n    distribution: Union[int, float, str, type, Callable],\n    low: float = 0,\n    high: float = 1.0,\n    **kwargs\n)\n

Get the sampler for the variable with the given distribution. If kwargs are passed, they will be parsed e.g. with val_name + _dist_arg (e.g. loc_std for Normal distribution).

Parameters:

  • val_name (str) \u2013

    Name of the variable

  • distribution (Union[int, float, str, type, Callable]) \u2013

    int/float value (as constant distribution), or string with the distribution name (supporting uniform, normal, exponential, and poisson) or PyTorch Distribution type or a callable function that returns a PyTorch Distribution

  • low (float, default: 0 ) \u2013

    Minimum value for the variable, used for Uniform distribution

  • high (float, default: 1.0 ) \u2013

    Maximum value for the variable, used for Uniform distribution

  • kwargs \u2013

    Additional arguments for the distribution

Example
sampler_uniform = get_sampler(\"loc\", \"uniform\", 0, 1)\nsampler_normal = get_sampler(\"loc\", \"normal\", loc_mean=0.5, loc_std=.2)\n
Source code in rl4co/envs/common/utils.py
def get_sampler(\n    val_name: str,\n    distribution: Union[int, float, str, type, Callable],\n    low: float = 0,\n    high: float = 1.0,\n    **kwargs,\n):\n    \"\"\"Get the sampler for the variable with the given distribution.\n    If kwargs are passed, they will be parsed e.g. with `val_name` + `_dist_arg` (e.g. `loc_std` for Normal distribution).\n\n    Args:\n        val_name: Name of the variable\n        distribution: int/float value (as constant distribution), or string with the distribution name (supporting\n            uniform, normal, exponential, and poisson) or PyTorch Distribution type or a callable function that\n            returns a PyTorch Distribution\n        low: Minimum value for the variable, used for Uniform distribution\n        high: Maximum value for the variable, used for Uniform distribution\n        kwargs: Additional arguments for the distribution\n\n    Example:\n        ```python\n        sampler_uniform = get_sampler(\"loc\", \"uniform\", 0, 1)\n        sampler_normal = get_sampler(\"loc\", \"normal\", loc_mean=0.5, loc_std=.2)\n        ```\n    \"\"\"\n    if isinstance(distribution, (int, float)):\n        return Uniform(low=distribution, high=distribution)\n    elif distribution == Uniform or distribution == \"uniform\":\n        return Uniform(low=low, high=high)\n    elif distribution == Normal or distribution == \"normal\" or distribution == \"gaussian\":\n        assert (\n            kwargs.get(val_name + \"_mean\", None) is not None\n        ), \"mean is required for Normal distribution\"\n        assert (\n            kwargs.get(val_name + \"_std\", None) is not None\n        ), \"std is required for Normal distribution\"\n        return Normal(loc=kwargs[val_name + \"_mean\"], scale=kwargs[val_name + \"_std\"])\n    elif distribution == Exponential or distribution == \"exponential\":\n        assert (\n            kwargs.get(val_name + \"_rate\", None) is not None\n        ), \"rate is required for 
Exponential/Poisson distribution\"\n        return Exponential(rate=kwargs[val_name + \"_rate\"])\n    elif distribution == Poisson or distribution == \"poisson\":\n        assert (\n            kwargs.get(val_name + \"_rate\", None) is not None\n        ), \"rate is required for Exponential/Poisson distribution\"\n        return Poisson(rate=kwargs[val_name + \"_rate\"])\n    elif distribution == \"center\":\n        return Uniform(low=(high - low) / 2, high=(high - low) / 2)\n    elif distribution == \"corner\":\n        return Uniform(\n            low=low, high=low\n        )  # todo: should be also `low, high` and any other corner\n    elif isinstance(distribution, Callable):\n        return distribution(**kwargs)\n    elif distribution == \"gaussian_mixture\":\n        return Gaussian_Mixture(num_modes=kwargs[\"num_modes\"], cdist=kwargs[\"cdist\"])\n    elif distribution == \"cluster\":\n        return Cluster(kwargs[\"n_cluster\"])\n    elif distribution == \"mixed\":\n        return Mixed(kwargs[\"n_cluster_mix\"])\n    elif distribution == \"mix_distribution\":\n        return Mix_Distribution(kwargs[\"n_cluster\"], kwargs[\"n_cluster_mix\"])\n    elif distribution == \"mix_multi_distributions\":\n        return Mix_Multi_Distributions()\n    else:\n        raise ValueError(f\"Invalid distribution type of {distribution}\")\n
"},{"location":"docs/content/api/envs/base/#envs.common.utils.batch_to_scalar","title":"batch_to_scalar","text":"
batch_to_scalar(param)\n

Return first element if in batch. Used for batched parameters that are the same for all elements in the batch.

Source code in rl4co/envs/common/utils.py
def batch_to_scalar(param):\n    \"\"\"Return first element if in batch. Used for batched parameters that are the same for all elements in the batch.\"\"\"\n    if len(param.shape) > 0:\n        return param[0].item()\n    if isinstance(param, torch.Tensor):\n        return param.item()\n    return param\n
"},{"location":"docs/content/api/envs/eda/","title":"EDA Problems","text":"

Environment for Electronic Design Automation (EDA) problems

"},{"location":"docs/content/api/envs/eda/#decap-placement-problem-dpp","title":"Decap Placement Problem (DPP)","text":""},{"location":"docs/content/api/envs/eda/#envs.eda.dpp.env.DPPEnv","title":"DPPEnv","text":"
DPPEnv(\n    generator: DPPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Decap Placement Problem (DPP) as done in DevFormer paper: https://arxiv.org/abs/2205.13225

The environment is a 10x10 grid with 100 locations containing either a probing port or a keepout region. The goal is to place decaps (decoupling capacitors) to maximize the impedance suppression at the probing port. Decaps cannot be placed in keepout regions or at the probing port and the number of decaps is limited.

Observations
  • locations of the probing port and keepout regions
  • current decap placement
  • remaining decaps
Constraints
  • decaps cannot be placed at the probing port or keepout regions
  • the number of decaps is limited
Finish Condition
  • the number of decaps exceeds the limit
Reward
  • the impedance suppression at the probing port

Parameters:

  • generator (DPPGenerator, default: None ) \u2013

    DPPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Source code in rl4co/envs/eda/dpp/env.py
def __init__(\n    self,\n    generator: DPPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = DPPGenerator(**generator_params)\n    self.generator = generator\n\n    self.max_decaps = self.generator.max_decaps\n    self.size = self.generator.size\n    self.raw_pdn = self.generator.raw_pdn\n    self.decap = self.generator.decap\n    self.freq = self.generator.freq\n    self.num_freq = self.generator.num_freq\n    self.data_dir = self.generator.data_dir\n\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/eda/#envs.eda.dpp.generator.DPPGenerator","title":"DPPGenerator","text":"
DPPGenerator(\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    num_keepout_min: int = 1,\n    num_keepout_max: int = 50,\n    max_decaps: int = 20,\n    data_dir: str = \"data/dpp/\",\n    chip_file: str = \"10x10_pkg_chip.npy\",\n    decap_file: str = \"01nF_decap.npy\",\n    freq_file: str = \"freq_201.npy\",\n    url: str = None,\n    **unused_kwargs\n)\n

Bases: Generator

Data generator for the Decap Placement Problem (DPP).

Parameters:

  • min_loc (float, default: 0.0 ) \u2013

    Minimum location value. Defaults to 0.

  • max_loc (float, default: 1.0 ) \u2013

    Maximum location value. Defaults to 1.

  • num_keepout_min (int, default: 1 ) \u2013

    Minimum number of keepout regions. Defaults to 1.

  • num_keepout_max (int, default: 50 ) \u2013

    Maximum number of keepout regions. Defaults to 50.

  • max_decaps (int, default: 20 ) \u2013

    Maximum number of decaps. Defaults to 20.

  • data_dir (str, default: 'data/dpp/' ) \u2013

    Directory to store data. Defaults to \"data/dpp/\". This can be downloaded from this url.

  • chip_file (str, default: '10x10_pkg_chip.npy' ) \u2013

    Name of the chip file. Defaults to \"10x10_pkg_chip.npy\".

  • decap_file (str, default: '01nF_decap.npy' ) \u2013

    Name of the decap file. Defaults to \"01nF_decap.npy\".

  • freq_file (str, default: 'freq_201.npy' ) \u2013

    Name of the frequency file. Defaults to \"freq_201.npy\".

  • url (str, default: None ) \u2013

    URL to download data from. Defaults to None.

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer depot [batch_size, 2]: location of the depot demand [batch_size, num_loc]: demand of each customer capacity [batch_size]: capacity of the vehicle

Source code in rl4co/envs/eda/dpp/generator.py
def __init__(\n    self,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    num_keepout_min: int = 1,\n    num_keepout_max: int = 50,\n    max_decaps: int = 20,\n    data_dir: str = \"data/dpp/\",\n    chip_file: str = \"10x10_pkg_chip.npy\",\n    decap_file: str = \"01nF_decap.npy\",\n    freq_file: str = \"freq_201.npy\",\n    url: str = None,\n    **unused_kwargs\n):\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.num_keepout_min = num_keepout_min\n    self.num_keepout_max = num_keepout_max\n    self.max_decaps = max_decaps\n    self.data_dir = data_dir\n\n    # DPP environment doen't have any other kwargs\n    if len(unused_kwargs) > 0:\n        log.error(f\"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}\")\n\n\n    # Download and load the data from online dataset\n    self.url = (\n        \"https://github.com/kaist-silab/devformer/raw/main/data/data.zip\"\n        if url is None\n        else url\n    )\n    self.backup_url = (\n        \"https://drive.google.com/uc?id=1IEuR2v8Le-mtHWHxwTAbTOPIkkQszI95\"\n    )\n    self._load_dpp_data(chip_file, decap_file, freq_file)\n\n    # Check the validity of the keepout parameters\n    assert (\n        num_keepout_min <= num_keepout_max\n    ), \"num_keepout_min must be <= num_keepout_max\"\n    assert (\n        num_keepout_max <= self.size**2\n    ), \"num_keepout_max must be <= size * size (total number of locations)\"\n
"},{"location":"docs/content/api/envs/eda/#multi-port-decap-placement-problem-mdpp","title":"Multi-port Decap Placement Problem (mDPP)","text":""},{"location":"docs/content/api/envs/eda/#envs.eda.mdpp.env.MDPPEnv","title":"MDPPEnv","text":"
MDPPEnv(\n    generator: MDPPGenerator = None,\n    generator_params: dict = {},\n    reward_type: str = \"minmax\",\n    **kwargs\n)\n

Bases: DPPEnv

Multiple decap placement problem (mDPP) environment. This is a modified version of the DPP environment where we allow multiple probing ports.

Observations
  • locations of the probing ports and keepout regions
  • current decap placement
  • remaining decaps
Constraints
  • decaps cannot be placed at the probing ports or keepout regions
  • the number of decaps is limited
Finish Condition
  • the number of decaps exceeds the limit
Reward
  • the impedance suppression at the probing ports

Parameters:

  • generator (MDPPGenerator, default: None ) \u2013

    MDPPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

  • reward_type (str, default: 'minmax' ) \u2013

    reward type, either minmax or meansum

    • minmax: min of the max of the decap scores
    • meansum: mean of the sum of the decap scores
Note

The minmax is more challenging as it requires finding the best decap location for the worst case.

Source code in rl4co/envs/eda/mdpp/env.py
def __init__(\n    self,\n    generator: MDPPGenerator = None,\n    generator_params: dict = {},\n    reward_type: str = \"minmax\",\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = MDPPGenerator(**generator_params)\n    self.generator = generator\n\n    assert reward_type in [\n        \"minmax\",\n        \"meansum\",\n    ], \"reward_type must be minmax or meansum\"\n    self.reward_type = reward_type\n\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/eda/#envs.eda.mdpp.generator.MDPPGenerator","title":"MDPPGenerator","text":"
MDPPGenerator(\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    num_keepout_min: int = 1,\n    num_keepout_max: int = 50,\n    num_probes_min: int = 2,\n    num_probes_max: int = 5,\n    max_decaps: int = 20,\n    data_dir: str = \"data/dpp/\",\n    chip_file: str = \"10x10_pkg_chip.npy\",\n    decap_file: str = \"01nF_decap.npy\",\n    freq_file: str = \"freq_201.npy\",\n    url: str = None,\n    **unused_kwargs\n)\n

Bases: Generator

Data generator for the Multi-port Decap Placement Problem (mDPP).

Parameters:

  • min_loc (float, default: 0.0 ) \u2013

    Minimum location value. Defaults to 0.

  • max_loc (float, default: 1.0 ) \u2013

    Maximum location value. Defaults to 1.

  • num_keepout_min (int, default: 1 ) \u2013

    Minimum number of keepout regions. Defaults to 1.

  • num_keepout_max (int, default: 50 ) \u2013

    Maximum number of keepout regions. Defaults to 50.

  • max_decaps (int, default: 20 ) \u2013

    Maximum number of decaps. Defaults to 20.

  • data_dir (str, default: 'data/dpp/' ) \u2013

    Directory to store data. Defaults to \"data/dpp/\". This can be downloaded from this url.

  • chip_file (str, default: '10x10_pkg_chip.npy' ) \u2013

    Name of the chip file. Defaults to \"10x10_pkg_chip.npy\".

  • decap_file (str, default: '01nF_decap.npy' ) \u2013

    Name of the decap file. Defaults to \"01nF_decap.npy\".

  • freq_file (str, default: 'freq_201.npy' ) \u2013

    Name of the frequency file. Defaults to \"freq_201.npy\".

  • url (str, default: None ) \u2013

    URL to download data from. Defaults to None.

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer depot [batch_size, 2]: location of the depot demand [batch_size, num_loc]: demand of each customer capacity [batch_size]: capacity of the vehicle

Source code in rl4co/envs/eda/mdpp/generator.py
def __init__(\n    self,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    num_keepout_min: int = 1,\n    num_keepout_max: int = 50,\n    num_probes_min: int = 2,\n    num_probes_max: int = 5,\n    max_decaps: int = 20,\n    data_dir: str = \"data/dpp/\",\n    chip_file: str = \"10x10_pkg_chip.npy\",\n    decap_file: str = \"01nF_decap.npy\",\n    freq_file: str = \"freq_201.npy\",\n    url: str = None,\n    **unused_kwargs\n):\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.num_keepout_min = num_keepout_min\n    self.num_keepout_max = num_keepout_max\n    self.num_probes_min = num_probes_min\n    self.num_probes_max = num_probes_max\n    self.max_decaps = max_decaps\n    self.data_dir = data_dir\n\n    # DPP environment doen't have any other kwargs\n    if len(unused_kwargs) > 0:\n        log.error(f\"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}\")\n\n\n    # Download and load the data from online dataset\n    self.url = (\n        \"https://github.com/kaist-silab/devformer/raw/main/data/data.zip\"\n        if url is None\n        else url\n    )\n    self.backup_url = (\n        \"https://drive.google.com/uc?id=1IEuR2v8Le-mtHWHxwTAbTOPIkkQszI95\"\n    )\n    self._load_dpp_data(chip_file, decap_file, freq_file)\n\n    # Check the validity of the keepout parameters\n    assert (\n        num_keepout_min <= num_keepout_max\n    ), \"num_keepout_min must be <= num_keepout_max\"\n    assert (\n        num_keepout_max <= self.size**2\n    ), \"num_keepout_max must be <= size * size (total number of locations)\"\n
"},{"location":"docs/content/api/envs/graph/","title":"Graph Problems","text":""},{"location":"docs/content/api/envs/graph/#facility-location-problem-flp","title":"Facility Location Problem (FLP)","text":""},{"location":"docs/content/api/envs/graph/#envs.graph.flp.env.FLPEnv","title":"FLPEnv","text":"
FLPEnv(\n    generator: FLPGenerator = None,\n    generator_params: dict = {},\n    check_solution=False,\n    **kwargs\n)\n

Bases: RL4COEnvBase

Facility Location Problem (FLP) environment. At each step, the agent chooses a location. The reward is 0 unless enough locations are chosen. The reward is (-) the total distance of each location to its closest chosen location.

Observations
  • the locations
  • the number of locations to choose
Constraints
  • the given number of locations must be chosen
Finish condition
  • the given number of locations are chosen
Reward
  • (minus) the total distance of each location to its closest chosen location

Parameters:

  • generator (FLPGenerator, default: None ) \u2013

    FLPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Source code in rl4co/envs/graph/flp/env.py
def __init__(\n    self,\n    generator: FLPGenerator = None,\n    generator_params: dict = {},\n    check_solution=False,\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = FLPGenerator(**generator_params)\n    self.generator = generator\n    self.check_solution = check_solution\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/graph/#envs.graph.flp.generator.FLPGenerator","title":"FLPGenerator","text":"
FLPGenerator(\n    num_loc: int = 100,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    to_choose: int = 10,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Facility Location Problem (FLP).

Parameters:

  • num_loc (int, default: 100 ) \u2013

    number of locations in the FLP

  • min_loc (float, default: 0.0 ) \u2013

    minimum value for the location coordinates

  • max_loc (float, default: 1.0 ) \u2013

    maximum value for the location coordinates

  • loc_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    distribution for the location coordinates

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations orig_distances [batch_size, num_loc, num_loc]: original distances between locations distances [batch_size, num_loc]: the current minimum distance from each location to the chosen locations chosen [batch_size, num_loc]: indicators of chosen locations to_choose [batch_size, 1]: number of locations to choose in the FLP

Source code in rl4co/envs/graph/flp/generator.py
def __init__(\n    self,\n    num_loc: int = 100,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    to_choose: int = 10,\n    **kwargs,\n):\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.to_choose = to_choose\n\n    # Location distribution\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n
"},{"location":"docs/content/api/envs/graph/#maximum-coverage-problem-mcp","title":"Maximum Coverage Problem (MCP)","text":""},{"location":"docs/content/api/envs/graph/#envs.graph.mcp.env.MCPEnv","title":"MCPEnv","text":"
MCPEnv(\n    generator: MCPGenerator = None,\n    generator_params: dict = {},\n    check_solution=False,\n    **kwargs\n)\n

Bases: RL4COEnvBase

Maximum Coverage Problem (MCP) environment. At each step, the agent chooses a set. The reward is 0 unless enough sets are chosen. The reward is the total weights of the covered items (i.e., items in any chosen set).

Observations
  • the weights of items
  • the membership of items in sets
  • the number of sets to choose
Constraints
  • the given number of sets must be chosen
Finish condition
  • the given number of sets are chosen
Reward
  • the total weights of the covered items (i.e., items in any chosen set)

Parameters:

  • generator (MCPGenerator, default: None ) \u2013

    MCPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Source code in rl4co/envs/graph/mcp/env.py
def __init__(\n    self,\n    generator: MCPGenerator = None,\n    generator_params: dict = {},\n    check_solution=False,\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = MCPGenerator(**generator_params)\n    self.generator = generator\n    self.check_solution = check_solution\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/graph/#envs.graph.mcp.generator.MCPGenerator","title":"MCPGenerator","text":"
MCPGenerator(\n    num_items: int = 200,\n    num_sets: int = 100,\n    min_weight: int = 1,\n    max_weight: int = 10,\n    min_size: int = 5,\n    max_size: int = 15,\n    n_sets_to_choose: int = 10,\n    size_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    weight_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Maximum Coverage Problem (MCP).

Parameters:

  • num_items (int, default: 200 ) \u2013

    number of items in the MCP

  • num_sets (int, default: 100 ) \u2013

    number of sets in the MCP

  • min_weight (int, default: 1 ) \u2013

    minimum value for the item weights

  • max_weight (int, default: 10 ) \u2013

    maximum value for the item weights

  • min_size (int, default: 5 ) \u2013

    minimum size for the sets

  • max_size (int, default: 15 ) \u2013

    maximum size for the sets

  • n_sets_to_choose (int, default: 10 ) \u2013

    number of sets to choose in the MCP

Returns:

  • \u2013

    A TensorDict with the following keys: membership [batch_size, num_sets, max_size]: membership of items in sets weights [batch_size, num_items]: weights of the items n_sets_to_choose [batch_size, 1]: number of sets to choose in the MCP

Source code in rl4co/envs/graph/mcp/generator.py
def __init__(\n    self,\n    num_items: int = 200,\n    num_sets: int = 100,\n    min_weight: int = 1,\n    max_weight: int = 10,\n    min_size: int = 5,\n    max_size: int = 15,\n    n_sets_to_choose: int = 10,\n    size_distribution: Union[int, float, str, type, Callable] = Uniform,\n    weight_distribution: Union[int, float, str, type, Callable] = Uniform,\n    **kwargs,\n):\n    self.num_items = num_items\n    self.num_sets = num_sets\n    self.min_weight = min_weight\n    self.max_weight = max_weight\n    self.min_size = min_size\n    self.max_size = max_size\n    self.n_sets_to_choose = n_sets_to_choose\n\n    # Set size distribution\n    if kwargs.get(\"size_sampler\", None) is not None:\n        self.size_sampler = kwargs[\"size_sampler\"]\n    else:\n        self.size_sampler = get_sampler(\n            \"size\", size_distribution, min_size, max_size + 1, **kwargs\n        )\n\n    # Item weight distribution\n    if kwargs.get(\"weight_sampler\", None) is not None:\n        self.weight_sampler = kwargs[\"weight_sampler\"]\n    else:\n        self.weight_sampler = get_sampler(\n            \"weight\", weight_distribution, min_weight, max_weight + 1, **kwargs\n        )\n
"},{"location":"docs/content/api/envs/routing/","title":"Routing Problems","text":"

See also the Multi-Task VRP at the bottom of this page, that includes 16 variants!

"},{"location":"docs/content/api/envs/routing/#asymmetric-traveling-salesman-problem-atsp","title":"Asymmetric Traveling Salesman Problem (ATSP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.atsp.env.ATSPEnv","title":"ATSPEnv","text":"
ATSPEnv(\n    generator: ATSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Asymmetric Traveling Salesman Problem (ATSP) environment. At each step, the agent chooses a customer to visit. The reward is 0 unless the agent visits all the customers. In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length. Unlike the TSP, the distance matrix is asymmetric, i.e., the distance from A to B is not necessarily the same as the distance from B to A.

Observations
  • distance matrix between customers
  • the current customer
  • the first customer (for calculating the reward)
  • the remaining unvisited customers
Constraints
  • the tour starts and ends at the same customer.
  • each customer must be visited exactly once.
Finish Condition
  • the agent has visited all customers.
Reward
  • (minus) the length of the path.

Parameters:

  • generator (ATSPGenerator, default: None ) \u2013

    ATSPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Source code in rl4co/envs/routing/atsp/env.py
def __init__(\n    self,\n    generator: ATSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = ATSPGenerator(**generator_params)\n    self.generator = generator\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.atsp.generator.ATSPGenerator","title":"ATSPGenerator","text":"
ATSPGenerator(\n    num_loc: int = 10,\n    min_dist: float = 0.0,\n    max_dist: float = 1.0,\n    dist_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    tmat_class: bool = True,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Asymmetric Travelling Salesman Problem (ATSP). Generate distance matrices inspired by the reference MatNet (Kwon et al., 2021). We satisfy the triangle inequality (TMAT class) in a batch.

Parameters:

  • num_loc (int, default: 10 ) \u2013

    number of locations (customers) in the TSP

  • min_dist (float, default: 0.0 ) \u2013

    minimum value for the distance between nodes

  • max_dist (float, default: 1.0 ) \u2013

    maximum value for the distance between nodes

  • dist_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    distribution for the distance between nodes

  • tmat_class (bool, default: True ) \u2013

    whether to generate a class of distance matrix

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer

Source code in rl4co/envs/routing/atsp/generator.py
def __init__(\n    self,\n    num_loc: int = 10,\n    min_dist: float = 0.0,\n    max_dist: float = 1.0,\n    dist_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    tmat_class: bool = True,\n    **kwargs\n):\n    self.num_loc = num_loc\n    self.min_dist = min_dist\n    self.max_dist = max_dist\n    self.tmat_class = tmat_class\n\n    # Distance distribution\n    if kwargs.get(\"dist_sampler\", None) is not None:\n        self.dist_sampler = kwargs[\"dist_sampler\"]\n    else:\n        self.dist_sampler = get_sampler(\"dist\", dist_distribution, 0.0, 1.0, **kwargs)\n
"},{"location":"docs/content/api/envs/routing/#capacitated-vehicle-routing-problem-cvrp","title":"Capacitated Vehicle Routing Problem (CVRP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.cvrp.env.CVRPEnv","title":"CVRPEnv","text":"
CVRPEnv(\n    generator: CVRPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Capacitated Vehicle Routing Problem (CVRP) environment. At each step, the agent chooses a customer to visit depending on the current location and the remaining capacity. When the agent visits a customer, the remaining capacity is updated. If the remaining capacity is not enough to visit any customer, the agent must go back to the depot. The reward is 0 unless the agent visits all the cities. In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length.

Observations
  • location of the depot.
  • locations and demand of each customer.
  • current location of the vehicle.
  • the remaining capacity of the vehicle.
Constraints
  • the tour starts and ends at the depot.
  • each customer must be visited exactly once.
  • the vehicle cannot visit customers whose demand exceeds the remaining capacity.
  • the vehicle can return to the depot to refill the capacity.
Finish Condition
  • the vehicle has visited all customers and returned to the depot.
Reward
  • (minus) the length of the path.

Parameters:

  • generator (CVRPGenerator, default: None ) \u2013

    CVRPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Methods:

  • check_solution_validity \u2013

    Check that solution is valid: nodes are not visited twice except depot and capacity is not exceeded

  • load_data \u2013

    Dataset loading from file

  • replace_selected_actions \u2013

    Replace selected current actions with updated actions based on selection_mask.

Source code in rl4co/envs/routing/cvrp/env.py
def __init__(\n    self,\n    generator: CVRPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = CVRPGenerator(**generator_params)\n    self.generator = generator\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.cvrp.env.CVRPEnv.check_solution_validity","title":"check_solution_validity staticmethod","text":"
check_solution_validity(td: TensorDict, actions: Tensor)\n

Check that solution is valid: nodes are not visited twice except depot and capacity is not exceeded

Source code in rl4co/envs/routing/cvrp/env.py
@staticmethod\ndef check_solution_validity(td: TensorDict, actions: torch.Tensor):\n    \"\"\"Check that solution is valid: nodes are not visited twice except depot and capacity is not exceeded\"\"\"\n    # Check if tour is valid, i.e. contain 0 to n-1\n    batch_size, graph_size = td[\"demand\"].size()\n    sorted_pi = actions.data.sort(1)[0]\n\n    # Sorting it should give all zeros at front and then 1...n\n    assert (\n        torch.arange(1, graph_size + 1, out=sorted_pi.data.new())\n        .view(1, -1)\n        .expand(batch_size, graph_size)\n        == sorted_pi[:, -graph_size:]\n    ).all() and (sorted_pi[:, :-graph_size] == 0).all(), \"Invalid tour\"\n\n    # Visiting depot resets capacity so we add demand = -capacity (we make sure it does not become negative)\n    demand_with_depot = torch.cat((-td[\"vehicle_capacity\"], td[\"demand\"]), 1)\n    d = demand_with_depot.gather(1, actions)\n\n    used_cap = torch.zeros_like(td[\"demand\"][:, 0])\n    for i in range(actions.size(1)):\n        used_cap += d[\n            :, i\n        ]  # This will reset/make capacity negative if i == 0, e.g. depot visited\n        # Cannot use less than 0\n        used_cap[used_cap < 0] = 0\n        assert (\n            used_cap <= td[\"vehicle_capacity\"] + 1e-5\n        ).all(), \"Used more than capacity\"\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.cvrp.env.CVRPEnv.load_data","title":"load_data staticmethod","text":"
load_data(fpath, batch_size=[])\n

Dataset loading from file. Normalize demand by capacity to be in [0, 1].

Source code in rl4co/envs/routing/cvrp/env.py
@staticmethod\ndef load_data(fpath, batch_size=[]):\n    \"\"\"Dataset loading from file\n    Normalize demand by capacity to be in [0, 1]\n    \"\"\"\n    td_load = load_npz_to_tensordict(fpath)\n    td_load.set(\"demand\", td_load[\"demand\"] / td_load[\"capacity\"][:, None])\n    return td_load\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.cvrp.env.CVRPEnv.replace_selected_actions","title":"replace_selected_actions","text":"
replace_selected_actions(\n    cur_actions: Tensor,\n    new_actions: Tensor,\n    selection_mask: Tensor,\n) -> Tensor\n

Replace selected current actions with updated actions based on selection_mask.

Source code in rl4co/envs/routing/cvrp/env.py
def replace_selected_actions(\n    self,\n    cur_actions: torch.Tensor,\n    new_actions: torch.Tensor,\n    selection_mask: torch.Tensor,\n) -> torch.Tensor:\n    \"\"\"\n    Replace selected current actions with updated actions based on `selection_mask`.\n\n    Args:\n        cur_actions [batch_size, num_loc]\n        new_actions [batch_size, num_loc]\n        selection_mask [batch_size,]\n    \"\"\"\n    diff_length = cur_actions.size(-1) - new_actions.size(-1)\n    if diff_length > 0:\n        new_actions = torch.nn.functional.pad(\n            new_actions, (0, diff_length, 0, 0), mode=\"constant\", value=0\n        )\n    elif diff_length < 0:\n        cur_actions = torch.nn.functional.pad(\n            cur_actions, (0, -diff_length, 0, 0), mode=\"constant\", value=0\n        )\n    cur_actions[selection_mask] = new_actions[selection_mask]\n    return cur_actions\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.cvrp.generator.CVRPGenerator","title":"CVRPGenerator","text":"
CVRPGenerator(\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    depot_distribution: Union[\n        int, float, str, type, Callable\n    ] = None,\n    min_demand: int = 1,\n    max_demand: int = 10,\n    demand_distribution: Union[\n        int, float, type, Callable\n    ] = Uniform,\n    vehicle_capacity: float = 1.0,\n    capacity: float = None,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Capacitated Vehicle Routing Problem (CVRP).

Parameters:

  • num_loc (int, default: 20 ) \u2013

    number of locations (cities) in the VRP, without the depot. (e.g. 10 means 10 locs + 1 depot)

  • min_loc (float, default: 0.0 ) \u2013

    minimum value for the location coordinates

  • max_loc (float, default: 1.0 ) \u2013

    maximum value for the location coordinates

  • loc_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    distribution for the location coordinates

  • depot_distribution (Union[int, float, str, type, Callable], default: None ) \u2013

    distribution for the depot location. If None, sample the depot from the locations

  • min_demand (int, default: 1 ) \u2013

    minimum value for the demand of each customer

  • max_demand (int, default: 10 ) \u2013

    maximum value for the demand of each customer

  • demand_distribution (Union[int, float, type, Callable], default: Uniform ) \u2013

    distribution for the demand of each customer

  • capacity (float, default: None ) \u2013

    capacity of the vehicle

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer depot [batch_size, 2]: location of the depot demand [batch_size, num_loc]: demand of each customer capacity [batch_size]: capacity of the vehicle

Source code in rl4co/envs/routing/cvrp/generator.py
def __init__(\n    self,\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    depot_distribution: Union[int, float, str, type, Callable] = None,\n    min_demand: int = 1,\n    max_demand: int = 10,\n    demand_distribution: Union[int, float, type, Callable] = Uniform,\n    vehicle_capacity: float = 1.0,\n    capacity: float = None,\n    **kwargs,\n):\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.min_demand = min_demand\n    self.max_demand = max_demand\n    self.vehicle_capacity = vehicle_capacity\n\n    # Location distribution\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n\n    # Depot distribution\n    if kwargs.get(\"depot_sampler\", None) is not None:\n        self.depot_sampler = kwargs[\"depot_sampler\"]\n    else:\n        self.depot_sampler = get_sampler(\n            \"depot\", depot_distribution, min_loc, max_loc, **kwargs\n        ) if depot_distribution is not None else None\n\n    # Demand distribution\n    if kwargs.get(\"demand_sampler\", None) is not None:\n        self.demand_sampler = kwargs[\"demand_sampler\"]\n    else:\n        self.demand_sampler = get_sampler(\n            \"demand\", demand_distribution, min_demand - 1, max_demand - 1, **kwargs\n        )\n\n    # Capacity\n    if (\n        capacity is None\n    ):  # If not provided, use the default capacity from Kool et al. 
2019\n        capacity = CAPACITIES.get(num_loc, None)\n    if (\n        capacity is None\n    ):  # If not in the table keys, find the closest number of nodes as the key\n        closest_num_loc = min(CAPACITIES.keys(), key=lambda x: abs(x - num_loc))\n        capacity = CAPACITIES[closest_num_loc]\n        log.warning(\n            f\"The capacity capacity for {num_loc} locations is not defined. Using the closest capacity: {capacity}\\\n                with {closest_num_loc} locations.\"\n        )\n    self.capacity = capacity\n
"},{"location":"docs/content/api/envs/routing/#multiple-traveling-salesman-problem-mtsp","title":"Multiple Traveling Salesman Problem (mTSP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.mtsp.env.MTSPEnv","title":"MTSPEnv","text":"
MTSPEnv(\n    generator: MTSPGenerator = None,\n    generator_params: dict = {},\n    cost_type: str = \"minmax\",\n    **kwargs\n)\n

Bases: RL4COEnvBase

Multiple Traveling Salesman Problem environment. At each step, an agent chooses to visit a city. A maximum of num_agents agents can be employed to visit the cities. The cost can be defined in two ways:

- `minmax`: (default) the cost is the maximum of the path lengths of all the agents\n- `sum`: the cost is the sum of the path lengths of all the agents\n

Reward is - cost, so the goal is to maximize the reward (minimize the cost).

Observations
  • locations of the depot and each customer.
  • number of agents.
  • the current agent index.
  • the current location of the vehicle.
Constraints
  • each agent's tour starts and ends at the depot.
  • each customer must be visited exactly once.
Finish condition
  • all customers are visited and all agents are back at the depot.
Reward

There are two ways to calculate the cost (-reward):

  • minmax: (default) the cost is the maximum of the path lengths of all the agents.
  • sum: the cost is the sum of the path lengths of all the agents.

Parameters:

  • cost_type (str, default: 'minmax' ) \u2013

    type of cost to use, either minmax or sum

  • generator (MTSPGenerator, default: None ) \u2013

    MTSPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Source code in rl4co/envs/routing/mtsp/env.py
def __init__(\n    self,\n    generator: MTSPGenerator = None,\n    generator_params: dict = {},\n    cost_type: str = \"minmax\",\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = MTSPGenerator(**generator_params)\n    self.generator = generator\n    self.cost_type = cost_type\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtsp.generator.MTSPGenerator","title":"MTSPGenerator","text":"
MTSPGenerator(\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    min_num_agents: int = 5,\n    max_num_agents: int = 5,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Multiple Travelling Salesman Problem (mTSP).

Parameters:

  • num_loc (int, default: 20 ) \u2013

    number of locations (customers) in the mTSP

  • min_loc (float, default: 0.0 ) \u2013

    minimum value for the location coordinates

  • max_loc (float, default: 1.0 ) \u2013

    maximum value for the location coordinates

  • loc_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    distribution for the location coordinates

  • min_num_agents (int, default: 5 ) \u2013

    minimum number of agents (vehicles), inclusive

  • max_num_agents (int, default: 5 ) \u2013

    maximum number of agents (vehicles), inclusive

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer num_agents [batch_size]: number of agents (vehicles)

Source code in rl4co/envs/routing/mtsp/generator.py
def __init__(\n    self,\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    min_num_agents: int = 5,\n    max_num_agents: int = 5,\n    **kwargs,\n):\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.min_num_agents = min_num_agents\n    self.max_num_agents = max_num_agents\n\n    # Location distribution\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n
"},{"location":"docs/content/api/envs/routing/#orienteering-problem-op","title":"Orienteering Problem (OP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.op.env.OPEnv","title":"OPEnv","text":"
OPEnv(\n    generator: OPGenerator = None,\n    generator_params: dict = {},\n    prize_type: str = \"dist\",\n    **kwargs\n)\n

Bases: RL4COEnvBase

Orienteering Problem (OP) environment. At each step, the agent chooses a location to visit in order to maximize the collected prize. The total length of the path must not exceed a given threshold.

Observations
  • location of the depot
  • locations and prize of each customer
  • current location of the vehicle
  • current tour length
  • current total prize
  • the remaining length of the path
Constraints
  • the tour starts and ends at the depot
  • not all customers need to be visited
  • the vehicle cannot visit customers that would make the tour exceed the remaining length of the path
Finish Condition
  • the vehicle is back at the depot
Reward
  • the sum of the prizes of visited nodes

Parameters:

  • generator (OPGenerator, default: None ) \u2013

    OPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Methods:

  • get_action_mask \u2013

    Get action mask with 1 = feasible action, 0 = infeasible action.

  • check_solution_validity \u2013

    Check that solution is valid: nodes are not visited twice except depot and the maximum tour length is not exceeded.

Source code in rl4co/envs/routing/op/env.py
def __init__(\n    self,\n    generator: OPGenerator = None,\n    generator_params: dict = {},\n    prize_type: str = \"dist\",\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = OPGenerator(**generator_params)\n    self.generator = generator\n    self.prize_type = prize_type\n    assert self.prize_type in [\n        \"dist\",\n        \"unif\",\n        \"const\",\n    ], f\"Invalid prize_type: {self.prize_type}\"\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.op.env.OPEnv.get_action_mask","title":"get_action_mask staticmethod","text":"
get_action_mask(td: TensorDict) -> Tensor\n

Get action mask with 1 = feasible action, 0 = infeasible action. Cannot visit if already visited, if depot has been visited, or if the length exceeds the maximum length.

Source code in rl4co/envs/routing/op/env.py
@staticmethod\ndef get_action_mask(td: TensorDict) -> torch.Tensor:\n    \"\"\"Get action mask with 1 = feasible action, 0 = infeasible action.\n    Cannot visit if already visited, if depot has been visited, or if the length exceeds the maximum length.\n    \"\"\"\n    current_loc = gather_by_index(td[\"locs\"], td[\"current_node\"])[..., None, :]\n    exceeds_length = (\n        td[\"tour_length\"][..., None] + (td[\"locs\"] - current_loc).norm(p=2, dim=-1)\n        > td[\"max_length\"]\n    )\n    mask = td[\"visited\"] | td[\"visited\"][..., 0:1] | exceeds_length\n\n    action_mask = ~mask  # 1 = feasible action, 0 = infeasible action\n\n    # Depot can always be visited: we do not hardcode knowledge that this is strictly suboptimal if other options are available\n    action_mask[..., 0] = 1\n    return action_mask\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.op.env.OPEnv.check_solution_validity","title":"check_solution_validity staticmethod","text":"
check_solution_validity(\n    td: TensorDict,\n    actions: Tensor,\n    add_distance_to_depot: bool = True,\n) -> None\n

Check that solution is valid: nodes are not visited twice except depot and the maximum tour length is not exceeded. If add_distance_to_depot is True, then the distance to the depot is added to max length since by default, the max length is modified in the reset function to account for the distance to the depot.

Source code in rl4co/envs/routing/op/env.py
@staticmethod\ndef check_solution_validity(\n    td: TensorDict, actions: torch.Tensor, add_distance_to_depot: bool = True\n) -> None:\n    \"\"\"Check that solution is valid: nodes are not visited twice except depot and capacity is not exceeded.\n    If `add_distance_to_depot` if True, then the distance to the depot is added to max length since by default, the max length is\n    modified in the reset function to account for the distance to the depot.\n    \"\"\"\n\n    # Check that tours are valid, i.e. contain 0 to n -1\n    sorted_actions = actions.data.sort(1)[0]\n    # Make sure each node visited once at most (except for depot)\n    assert (\n        (sorted_actions[:, 1:] == 0)\n        | (sorted_actions[:, 1:] > sorted_actions[:, :-1])\n    ).all(), \"Duplicates\"\n\n    # Gather locations in order of tour and get the length of tours\n    locs_ordered = gather_by_index(td[\"locs\"], actions)\n    length = get_tour_length(locs_ordered)\n\n    max_length = td[\"max_length\"]\n    if add_distance_to_depot:\n        max_length = (\n            max_length\n            + (td[\"locs\"][..., 0:1, :] - td[\"locs\"]).norm(p=2, dim=-1)\n            + 1e-6\n        )\n    assert (\n        length[..., None] <= max_length + 1e-5\n    ).all(), \"Max length exceeded by {}\".format(\n        (length[..., None] - max_length).max()\n    )\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.op.generator.OPGenerator","title":"OPGenerator","text":"
OPGenerator(\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    depot_distribution: Union[\n        int, float, str, type, Callable\n    ] = None,\n    min_prize: float = 1.0,\n    max_prize: float = 1.0,\n    prize_distribution: Union[\n        int, float, type, Callable\n    ] = Uniform,\n    prize_type: str = \"dist\",\n    max_length: Union[float, Tensor] = None,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Orienteering Problem (OP).

Parameters:

  • num_loc (int, default: 20 ) \u2013

    number of locations (customers) in the OP, without the depot. (e.g. 10 means 10 locs + 1 depot)

  • min_loc (float, default: 0.0 ) \u2013

    minimum value for the location coordinates

  • max_loc (float, default: 1.0 ) \u2013

    maximum value for the location coordinates

  • loc_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    distribution for the location coordinates

  • depot_distribution (Union[int, float, str, type, Callable], default: None ) \u2013

    distribution for the depot location. If None, sample the depot from the locations

  • min_prize (float, default: 1.0 ) \u2013

    minimum value for the prize of each customer

  • max_prize (float, default: 1.0 ) \u2013

    maximum value for the prize of each customer

  • prize_distribution (Union[int, float, type, Callable], default: Uniform ) \u2013

    distribution for the prize of each customer

  • max_length (Union[float, Tensor], default: None ) \u2013

    maximum length of the path

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer depot [batch_size, 2]: location of the depot prize [batch_size, num_loc]: prize of each customer max_length [batch_size, 1]: maximum length of the path for each customer

Source code in rl4co/envs/routing/op/generator.py
def __init__(\n    self,\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    depot_distribution: Union[int, float, str, type, Callable] = None,\n    min_prize: float = 1.0,\n    max_prize: float = 1.0,\n    prize_distribution: Union[int, float, type, Callable] = Uniform,\n    prize_type: str = \"dist\",\n    max_length: Union[float, torch.Tensor] = None,\n    **kwargs,\n):\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.min_prize = min_prize\n    self.max_prize = max_prize\n    self.prize_type = prize_type\n    self.max_length = max_length\n\n    # Location distribution\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n\n    # Depot distribution\n    if kwargs.get(\"depot_sampler\", None) is not None:\n        self.depot_sampler = kwargs[\"depot_sampler\"]\n    else:\n        self.depot_sampler = get_sampler(\n            \"depot\", depot_distribution, min_loc, max_loc, **kwargs\n        ) if depot_distribution is not None else None\n\n    # Prize distribution\n    if kwargs.get(\"prize_sampler\", None) is not None:\n        self.prize_sampler = kwargs[\"prize_sampler\"]\n    elif (\n        prize_distribution == \"dist\"\n    ):  # If prize_distribution is 'dist', then the prize is the distance from the depot\n        self.prize_sampler = None\n    else:\n        self.prize_sampler = get_sampler(\n            \"prize\", prize_distribution, min_prize, max_prize, **kwargs\n        )\n\n    # Max length\n    if max_length is not None:\n        self.max_length = max_length\n    else:\n        self.max_length = MAX_LENGTHS.get(num_loc, None)\n    if self.max_length is None:\n        closest_num_loc = min(MAX_LENGTHS.keys(), key=lambda x: 
abs(x - num_loc))\n        self.max_length = MAX_LENGTHS[closest_num_loc]\n        log.warning(\n            f\"The max length for {num_loc} locations is not defined. Using the closest max length: {self.max_length}\\\n                with {closest_num_loc} locations.\"\n        )\n
"},{"location":"docs/content/api/envs/routing/#pickup-and-delivery-problem-pdp","title":"Pickup and Delivery Problem (PDP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.pdp.env.PDPEnv","title":"PDPEnv","text":"
PDPEnv(\n    generator: PDPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Pickup and Delivery Problem (PDP) environment. The environment is made of num_loc + 1 locations (cities):

- 1 depot\n- `num_loc` / 2 pickup locations\n- `num_loc` / 2 delivery locations\n

The goal is to visit all the pickup and delivery locations in the shortest path possible, starting from the depot. The condition is that the agent must visit a pickup location before visiting its corresponding delivery location.

Observations
  • locations of the depot, pickup, and delivery locations
  • current location of the vehicle
  • the remaining locations to deliver
  • the visited locations
  • the current step
Constraints
  • the tour starts and ends at the depot
  • each pickup location must be visited before its corresponding delivery location
  • the vehicle cannot visit the same location twice
Finish Condition
  • the vehicle has visited all locations
Reward
  • the negative length of the path (i.e., minus the tour length)

Parameters:

  • generator (PDPGenerator, default: None ) \u2013

    PDPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Methods:

  • get_num_starts \u2013

    Only half of the nodes (i.e. pickup nodes) can be start nodes

  • select_start_nodes \u2013

    Only nodes from [1 : num_loc // 2 +1] (i.e. pickups) can be selected

Source code in rl4co/envs/routing/pdp/env.py
def __init__(\n    self,\n    generator: PDPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = PDPGenerator(**generator_params)\n    self.generator = generator\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.pdp.env.PDPEnv.get_num_starts","title":"get_num_starts","text":"
get_num_starts(td)\n

Only half of the nodes (i.e. pickup nodes) can be start nodes

Source code in rl4co/envs/routing/pdp/env.py
def get_num_starts(self, td):\n    \"\"\"Only half of the nodes (i.e. pickup nodes) can be start nodes\"\"\"\n    return (td[\"locs\"].shape[-2] - 1) // 2\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.pdp.env.PDPEnv.select_start_nodes","title":"select_start_nodes","text":"
select_start_nodes(td, num_starts)\n

Only nodes from [1 : num_loc // 2 +1] (i.e. pickups) can be selected

Source code in rl4co/envs/routing/pdp/env.py
def select_start_nodes(self, td, num_starts):\n    \"\"\"Only nodes from [1 : num_loc // 2 +1] (i.e. pickups) can be selected\"\"\"\n    num_possible_starts = (td[\"locs\"].shape[-2] - 1) // 2\n    selected = (\n        torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0])\n        % num_possible_starts\n        + 1\n    )\n    return selected\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.pdp.generator.PDPGenerator","title":"PDPGenerator","text":"
PDPGenerator(\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    init_sol_type: str = \"random\",\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    depot_distribution: Union[\n        int, float, str, type, Callable\n    ] = None,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Pickup and Delivery Problem (PDP). Args: num_loc: number of locations (customers) in the PDP, without the depot. (e.g. 10 means 10 locs + 1 depot)

    - 1 depot\n    - `num_loc` / 2 pickup locations\n    - `num_loc` / 2 delivery locations\nmin_loc: minimum value for the location coordinates\nmax_loc: maximum value for the location coordinates\ninit_sol_type: the method type used for generating initial solutions (random or greedy)\nloc_distribution: distribution for the location coordinates\ndepot_distribution: distribution for the depot location. If None, sample the depot from the locations\n

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer depot [batch_size, 2]: location of the depot

Source code in rl4co/envs/routing/pdp/generator.py
def __init__(\n    self,\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    init_sol_type: str = \"random\",\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    depot_distribution: Union[int, float, str, type, Callable] = None,\n    **kwargs,\n):\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.init_sol_type = init_sol_type\n\n    # Number of locations must be even\n    if num_loc % 2 != 0:\n        log.warn(\n            \"Number of locations must be even. Adding 1 to the number of locations.\"\n        )\n        self.num_loc += 1\n\n    # Location distribution\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n\n    # Depot distribution\n    if kwargs.get(\"depot_sampler\", None) is not None:\n        self.depot_sampler = kwargs[\"depot_sampler\"]\n    else:\n        self.depot_sampler = get_sampler(\n            \"depot\", depot_distribution, min_loc, max_loc, **kwargs\n        ) if depot_distribution is not None else None\n
"},{"location":"docs/content/api/envs/routing/#prize-collecting-traveling-salesman-problem-pctsp","title":"Prize Collecting Traveling Salesman Problem (PCTSP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.pctsp.env.PCTSPEnv","title":"PCTSPEnv","text":"
PCTSPEnv(\n    generator: PCTSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Prize-collecting TSP (PCTSP) environment. The goal is to collect as much prize as possible while minimizing the total travel cost. The environment is stochastic, the prize is only revealed when the node is visited.

Observations
  • locations of the nodes
  • prize and penalty of each node
  • current location of the vehicle
  • current total prize
  • current total penalty
  • visited nodes
  • prize required to visit a node
  • the current step
Constraints
  • the tour starts and ends at the depot
  • the vehicle cannot visit nodes exceed the remaining prize
Finish Condition
  • the vehicle is back at the depot
Reward
  • the sum of the saved penalties

Parameters:

  • generator (PCTSPGenerator, default: None ) \u2013

    PCTSPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Methods:

  • get_action_mask \u2013

    Cannot visit depot if not yet collected 1 total prize and there are unvisited nodes

  • check_solution_validity \u2013

    Check that the solution is valid, i.e. contains all nodes once at most, and either prize constraint is met or all nodes are visited

Source code in rl4co/envs/routing/pctsp/env.py
def __init__(\n    self,\n    generator: PCTSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = PCTSPGenerator(**generator_params)\n    self.generator = generator\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.pctsp.env.PCTSPEnv.get_action_mask","title":"get_action_mask staticmethod","text":"
get_action_mask(td: TensorDict) -> Tensor\n

Cannot visit depot if not yet collected 1 total prize and there are unvisited nodes

Source code in rl4co/envs/routing/pctsp/env.py
@staticmethod\ndef get_action_mask(td: TensorDict) -> torch.Tensor:\n    \"\"\"Cannot visit depot if not yet collected 1 total prize and there are unvisited nodes\"\"\"\n    mask = td[\"visited\"] | td[\"visited\"][..., 0:1]\n    mask[..., 0] = (td[\"cur_total_prize\"] < 1.0) & (\n        td[\"visited\"][..., 1:].int().sum(-1) < td[\"visited\"][..., 1:].size(-1)\n    )\n    return ~(mask > 0)  # Invert mask, since 1 means feasible action\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.pctsp.env.PCTSPEnv.check_solution_validity","title":"check_solution_validity staticmethod","text":"
check_solution_validity(\n    td: TensorDict, actions: Tensor\n) -> None\n

Check that the solution is valid, i.e. contains all nodes once at most, and either prize constraint is met or all nodes are visited

Source code in rl4co/envs/routing/pctsp/env.py
@staticmethod\ndef check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None:\n    \"\"\"Check that the solution is valid, i.e. contains all nodes once at most, and either prize constraint is met or all nodes are visited\"\"\"\n\n    # Check that tours are valid, i.e. contain 0 to n -1\n    sorted_actions = actions.data.sort(1)[0]\n\n    # Make sure each node visited once at most (except for depot)\n    assert (\n        (sorted_actions[..., 1:] == 0)\n        | (sorted_actions[..., 1:] > sorted_actions[..., :-1])\n    ).all(), \"Duplicates\"\n\n    prize = td[\"real_prize\"][..., 1:]  # Remove depot\n    prize_with_depot = torch.cat((torch.zeros_like(prize[:, :1]), prize), 1)\n    p = prize_with_depot.gather(1, actions)\n\n    # Either prize constraint should be satisfied or all prizes should be visited\n    assert (\n        (p.sum(-1) >= 1 - 1e-5)\n        | (\n            sorted_actions.size(-1) - (sorted_actions == 0).int().sum(-1)\n            == (td[\"locs\"].size(-2) - 1)\n        )  # no depot\n    ).all(), \"Total prize does not satisfy min total prize\"\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.pctsp.generator.PCTSPGenerator","title":"PCTSPGenerator","text":"
PCTSPGenerator(\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    depot_distribution: Union[\n        int, float, str, type, Callable\n    ] = None,\n    penalty_factor: float = 3.0,\n    prize_required: float = 1.0,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Prize-collecting Traveling Salesman Problem (PCTSP).

Parameters:

  • num_loc (int, default: 20 ) \u2013

    number of locations (customers) in the PCTSP, without the depot. (e.g. 10 means 10 locs + 1 depot)

  • min_loc (float, default: 0.0 ) \u2013

    minimum value for the location coordinates

  • max_loc (float, default: 1.0 ) \u2013

    maximum value for the location coordinates

  • loc_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    distribution for the location coordinates

  • depot_distribution (Union[int, float, str, type, Callable], default: None ) \u2013

    distribution for the depot location. If None, sample the depot from the locations

  • min_demand \u2013

    minimum value for the demand of each customer

  • max_demand \u2013

    maximum value for the demand of each customer

  • demand_distribution \u2013

    distribution for the demand of each customer

  • capacity \u2013

    capacity of the vehicle

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each city depot [batch_size, 2]: location of the depot demand [batch_size, num_loc]: demand of each customer capacity [batch_size, 1]: capacity of the vehicle

Source code in rl4co/envs/routing/pctsp/generator.py
def __init__(\n    self,\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    depot_distribution: Union[int, float, str, type, Callable] = None,\n    penalty_factor: float = 3.0,\n    prize_required: float = 1.0,\n    **kwargs,\n):\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.penalty_fctor = penalty_factor\n    self.prize_required = prize_required\n\n    # Location distribution\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n\n    # Depot distribution\n    if kwargs.get(\"depot_sampler\", None) is not None:\n        self.depot_sampler = kwargs[\"depot_sampler\"]\n    else:\n        self.depot_sampler = get_sampler(\n            \"depot\", depot_distribution, min_loc, max_loc, **kwargs\n        ) if depot_distribution is not None else None\n\n    # Prize distribution\n    self.deterministic_prize_sampler = get_sampler(\n        \"deterministric_prize\", \"uniform\", 0.0, 4.0 / self.num_loc, **kwargs\n    )\n    self.stochastic_prize_sampler = get_sampler(\n        \"stochastic_prize\", \"uniform\", 0.0, 2.0, **kwargs\n    )\n\n    # For the penalty to make sense it should be not too large (in which case all nodes will be visited) nor too small\n    # so we want the objective term to be approximately equal to the length of the tour, which we estimate with half\n    # of the nodes by half of the tour length (which is very rough but similar to op)\n    # This means that the sum of penalties for all nodes will be approximately equal to the tour length (on average)\n    # The expected total (uniform) penalty of half of the nodes (since approx half will be visited by the constraint)\n    # is (n / 2) / 2 = n / 4 so divide by this means 
multiply by 4 / n,\n    # However instead of 4 we use penalty_factor (3 works well) so we can make them larger or smaller        \n    self.max_penalty = kwargs.get(\"max_penalty\", None)\n    if self.max_penalty is None:  # If not provided, use the default max penalty\n        self.max_penalty = MAX_LENGTHS.get(num_loc, None)\n    if (\n        self.max_penalty is None\n    ):  # If not in the table keys, find the closest number of nodes as the key\n        closest_num_loc = min(MAX_LENGTHS.keys(), key=lambda x: abs(x - num_loc))\n        self.max_penalty = MAX_LENGTHS[closest_num_loc]\n        log.warning(\n            f\"The max penalty for {num_loc} locations is not defined. Using the closest max penalty: {self.max_penalty}\\\n                with {closest_num_loc} locations.\"\n        )\n\n    # Adjust as in Kool et al. (2019)\n    self.max_penalty *= penalty_factor / self.num_loc\n    self.penalty_sampler = get_sampler(\n        \"penalty\", \"uniform\", 0.0, self.max_penalty, **kwargs\n    )\n
"},{"location":"docs/content/api/envs/routing/#split-delivery-vehicle-routing-problem-sdvrp","title":"Split Delivery Vehicle Routing Problem (SDVRP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.sdvrp.env.SDVRPEnv","title":"SDVRPEnv","text":"
SDVRPEnv(\n    generator: CVRPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: CVRPEnv

Split Delivery Vehicle Routing Problem (SDVRP) environment. SDVRP is a generalization of CVRP, where nodes can be visited multiple times and a fraction of the demand can be met. At each step, the agent chooses a customer to visit depending on the current location and the remaining capacity. When the agent visits a customer, the remaining capacity is updated. If the remaining capacity is not enough to visit any customer, the agent must go back to the depot. The reward is -infinity unless the agent visits all the customers. In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length.

Observations
  • location of the depot.
  • locations and demand/remaining demand of each customer
  • current location of the vehicle.
  • the remaining capacity of the vehicle.
Constraints
  • the tour starts and ends at the depot.
  • each customer can be visited multiple times.
  • the vehicle cannot visit customers exceed the remaining capacity.
  • the vehicle can return to the depot to refill the capacity.
Finish Condition
  • the vehicle has satisfied all customers' demand and returned to the depot.
Reward
  • the negative length of the path (i.e. minus the path length).

Parameters:

  • generator (CVRPGenerator, default: None ) \u2013

    CVRPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Methods:

  • check_solution_validity \u2013

    Check that the solution is valid (all demand is satisfied)

Source code in rl4co/envs/routing/sdvrp/env.py
def __init__(\n    self,\n    generator: CVRPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(generator, generator_params, **kwargs)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.sdvrp.env.SDVRPEnv.check_solution_validity","title":"check_solution_validity staticmethod","text":"
check_solution_validity(\n    td: TensorDict, actions: Tensor\n) -> None\n

Check that the solution is valid (all demand is satisfied)

Source code in rl4co/envs/routing/sdvrp/env.py
@staticmethod\ndef check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None:\n    \"\"\"Check that the solution is valid (all demand is satisfied)\"\"\"\n\n    batch_size, graph_size = td[\"demand\"].size()\n\n    # Each node can be visited multiple times, but we always deliver as much demand as possible\n    # We check that at the end all demand has been satisfied\n    demands = torch.cat((-td[\"vehicle_capacity\"], td[\"demand\"]), 1)\n\n    rng = torch.arange(batch_size, out=demands.data.new().long())\n    used_cap = torch.zeros_like(td[\"demand\"][..., 0])\n    a_prev = None\n    for a in actions.transpose(0, 1):\n        assert (\n            a_prev is None or (demands[((a_prev == 0) & (a == 0)), :] == 0).all()\n        ), \"Cannot visit depot twice if any nonzero demand\"\n        d = torch.min(demands[rng, a], td[\"vehicle_capacity\"].squeeze(-1) - used_cap)\n        demands[rng, a] -= d\n        used_cap += d\n        used_cap[a == 0] = 0\n        a_prev = a\n    assert (demands == 0).all(), \"All demand must be satisfied\"\n
"},{"location":"docs/content/api/envs/routing/#stochastic-prize-collecting-traveling-salesman-problem-spctsp","title":"Stochastic Prize Collecting Traveling Salesman Problem (SPCTSP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.spctsp.env.SPCTSPEnv","title":"SPCTSPEnv","text":"
SPCTSPEnv(**kwargs)\n

Bases: PCTSPEnv

Stochastic Prize Collecting Traveling Salesman Problem (SPCTSP) environment.

Note

The only difference with deterministic PCTSP is that the prizes are stochastic (i.e. the expected prize is not the same as the real prize).

Source code in rl4co/envs/routing/spctsp/env.py
def __init__(self, **kwargs):\n    super().__init__(**kwargs)\n
"},{"location":"docs/content/api/envs/routing/#traveling-salesman-problem-tsp","title":"Traveling Salesman Problem (TSP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.tsp.env.TSPEnv","title":"TSPEnv","text":"
TSPEnv(\n    generator: TSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Traveling Salesman Problem (TSP) environment. At each step, the agent chooses a city to visit. The reward is 0 unless the agent visits all the cities. In that case, the reward is (-)length of the path: maximizing the reward is equivalent to minimizing the path length.

Observations
  • locations of each customer.
  • the current location of the vehicle.
Constraints
  • the tour must return to the starting customer.
  • each customer must be visited exactly once.
Finish condition
  • the agent has visited all customers and returned to the starting customer.
Reward
  • the negative length of the path (i.e. minus the path length).

Parameters:

  • generator (TSPGenerator, default: None ) \u2013

    TSPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Methods:

  • check_solution_validity \u2013

    Check that solution is valid: nodes are visited exactly once

  • replace_selected_actions \u2013

    Replace selected current actions with updated actions based on selection_mask.

Source code in rl4co/envs/routing/tsp/env.py
def __init__(\n    self,\n    generator: TSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = TSPGenerator(**generator_params)\n    self.generator = generator\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.tsp.env.TSPEnv.check_solution_validity","title":"check_solution_validity staticmethod","text":"
check_solution_validity(\n    td: TensorDict, actions: Tensor\n) -> None\n

Check that solution is valid: nodes are visited exactly once

Source code in rl4co/envs/routing/tsp/env.py
@staticmethod\ndef check_solution_validity(td: TensorDict, actions: torch.Tensor) -> None:\n    \"\"\"Check that solution is valid: nodes are visited exactly once\"\"\"\n    assert (\n        torch.arange(actions.size(1), out=actions.data.new())\n        .view(1, -1)\n        .expand_as(actions)\n        == actions.data.sort(1)[0]\n    ).all(), \"Invalid tour\"\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.tsp.env.TSPEnv.replace_selected_actions","title":"replace_selected_actions","text":"
replace_selected_actions(\n    cur_actions: Tensor,\n    new_actions: Tensor,\n    selection_mask: Tensor,\n) -> Tensor\n

Replace selected current actions with updated actions based on selection_mask.

Source code in rl4co/envs/routing/tsp/env.py
def replace_selected_actions(\n    self,\n    cur_actions: torch.Tensor,\n    new_actions: torch.Tensor,\n    selection_mask: torch.Tensor,\n) -> torch.Tensor:\n    \"\"\"\n    Replace selected current actions with updated actions based on `selection_mask`.\n\n    Args:\n        cur_actions [batch_size, num_loc]\n        new_actions [batch_size, num_loc]\n        selection_mask [batch_size,]\n    \"\"\"\n    cur_actions[selection_mask] = new_actions[selection_mask]\n    return cur_actions\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.tsp.generator.TSPGenerator","title":"TSPGenerator","text":"
TSPGenerator(\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    init_sol_type: str = \"random\",\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    **kwargs\n)\n

Bases: Generator

Data generator for the Travelling Salesman Problem (TSP).

Parameters:

  • num_loc (int, default: 20 ) \u2013

    number of locations (customers) in the TSP

  • min_loc (float, default: 0.0 ) \u2013

    minimum value for the location coordinates

  • max_loc (float, default: 1.0 ) \u2013

    maximum value for the location coordinates

  • init_sol_type (str, default: 'random' ) \u2013

    the method type used for generating initial solutions (random or greedy)

  • loc_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    distribution for the location coordinates

Returns:

  • \u2013

    A TensorDict with the following keys: locs [batch_size, num_loc, 2]: locations of each customer

Source code in rl4co/envs/routing/tsp/generator.py
def __init__(\n    self,\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    init_sol_type: str = \"random\",\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    **kwargs,\n):\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    self.init_sol_type = init_sol_type\n\n    # Location distribution\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n
"},{"location":"docs/content/api/envs/routing/#multi-task-vehicle-routing-problem-mtvrp","title":"Multi-Task Vehicle Routing Problem (MTVRP)","text":""},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.env.MTVRPEnv","title":"MTVRPEnv","text":"
MTVRPEnv(\n    generator: MTVRPGenerator = None,\n    generator_params: dict = {},\n    check_solution: bool = False,\n    **kwargs\n)\n

Bases: RL4COEnvBase

MTVRPEnv is a Multi-Task VRP environment which can take any combination of the following constraints:

Features:

  • Capacity (C) - Each vehicle has a maximum capacity \\(Q\\), restricting the total load that can be in the vehicle at any point of the route. - The route must be planned such that the sum of demands and pickups for all customers visited does not exceed this capacity.
  • Time Windows (TW) - Every node \\(i\\) has an associated time window \\([e_i, l_i]\\) during which service must commence. - Additionally, each node has a service time \\(s_i\\). Vehicles must reach node \\(i\\) within its time window; early arrivals must wait at the node location until time \\(e_i\\).
  • Open Routes (O) - Vehicles are not required to return to the depot after serving all customers. - Note that this does not need to be counted as a constraint since it can be modelled by setting zero costs on arcs returning to the depot \\(c_{i0} = 0\\) from any customer \\(i \\in C\\), and not counting the return arc as part of the route.
  • Backhauls (B) - Backhauls generalize demand to also account for return shipments. Customers are either linehaul or backhaul customers. - Linehaul customers require delivery of a demand \\(q_i > 0\\) that needs to be transported from the depot to the customer, whereas backhaul customers need a pickup of an amount \\(p_i > 0\\) that is transported from the client back to the depot. - It is possible for vehicles to serve a combination of linehaul and backhaul customers in a single route, but then any linehaul customers must precede the backhaul customers in the route.
  • Duration Limits (L) - Imposes a limit on the total travel duration (or length) of each route, ensuring a balanced workload across vehicles.

The environment covers the following 16 variants depending on the data generation:

VRP variants and their features (C = Capacity, O = Open Route, B = Backhaul, L = Duration Limit, TW = Time Window): CVRP (C); OVRP (C, O); VRPB (C, B); VRPL (C, L); VRPTW (C, TW); OVRPTW (C, O, TW); OVRPB (C, O, B); OVRPL (C, O, L); VRPBL (C, B, L); VRPBTW (C, B, TW); VRPLTW (C, L, TW); OVRPBL (C, O, B, L); OVRPBTW (C, O, B, TW); OVRPLTW (C, O, L, TW); VRPBLTW (C, B, L, TW); OVRPBLTW (C, O, B, L, TW)

You may also check out the following papers as reference:

  • \"Multi-Task Learning for Routing Problem with Cross-Problem Zero-Shot Generalization\" (Liu et al, 2024)
  • \"MVMoE: Multi-Task Vehicle Routing Solver with Mixture-of-Experts\" (Zhou et al, 2024)
  • \"RouteFinder: Towards Foundation Models for Vehicle Routing Problems\" (Berto et al, 2024)
Tip

Have a look at https://pyvrp.org/ for more information about VRP and its variants and their solutions. Kudos to their help and great job!

Parameters:

  • generator (MTVRPGenerator, default: None ) \u2013

    Generator for the environment, see MTVRPGenerator.

  • generator_params (dict, default: {} ) \u2013

    Parameters for the generator.

Methods:

  • load_data \u2013

    Dataset loading from file

  • render \u2013

    Simple wrapper for render function

  • select_start_nodes \u2013

    Select available start nodes for the environment (e.g. for POMO-based training)

  • solve \u2013

    Classical solver for the environment. This is a wrapper for the baselines solver.

  • check_variants \u2013

    Check if the problem has the variants

Source code in rl4co/envs/routing/mtvrp/env.py
def __init__(\n    self,\n    generator: MTVRPGenerator = None,\n    generator_params: dict = {},\n    check_solution: bool = False,\n    **kwargs,\n):\n    if check_solution:\n        log.warning(\n            \"Solution checking is enabled. This may slow down the environment.\"\n            \" We recommend disabling this for training by passing `check_solution=False`.\"\n        )\n\n    super().__init__(check_solution=check_solution, **kwargs)\n\n    if generator is None:\n        generator = MTVRPGenerator(**generator_params)\n    self.generator = generator\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.env.MTVRPEnv.load_data","title":"load_data","text":"
load_data(fpath, batch_size=[], scale=False)\n

Dataset loading from file. If scale is True, normalize the linehaul and backhaul demands by the original capacity to be in [0, 1].

Source code in rl4co/envs/routing/mtvrp/env.py
def load_data(self, fpath, batch_size=[], scale=False):\n    \"\"\"Dataset loading from file\n    Normalize demand by capacity to be in [0, 1]\n    \"\"\"\n    td_load = load_npz_to_tensordict(fpath)\n    if scale:\n        td_load.set(\n            \"demand_linehaul\",\n            td_load[\"demand_linehaul\"] / td_load[\"capacity_original\"],\n        )\n        td_load.set(\n            \"demand_backhaul\",\n            td_load[\"demand_backhaul\"] / td_load[\"capacity_original\"],\n        )\n    return td_load\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.env.MTVRPEnv.render","title":"render staticmethod","text":"
render(*args, **kwargs)\n

Simple wrapper for render function

Source code in rl4co/envs/routing/mtvrp/env.py
@staticmethod\ndef render(*args, **kwargs):\n    \"\"\"Simple wrapper for render function\"\"\"\n    from .render import render\n\n    return render(*args, **kwargs)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.env.MTVRPEnv.select_start_nodes","title":"select_start_nodes","text":"
select_start_nodes(td, num_starts)\n

Select available start nodes for the environment (e.g. for POMO-based training)

Source code in rl4co/envs/routing/mtvrp/env.py
def select_start_nodes(self, td, num_starts):\n    \"\"\"Select available start nodes for the environment (e.g. for POMO-based training)\"\"\"\n    num_loc = td[\"locs\"].shape[-2] - 1\n    selected = (\n        torch.arange(num_starts, device=td.device).repeat_interleave(td.shape[0])\n        % num_loc\n        + 1\n    )\n    return selected\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.env.MTVRPEnv.solve","title":"solve staticmethod","text":"
solve(\n    instances: TensorDict,\n    max_runtime: float,\n    num_procs: int = 1,\n    solver: str = \"pyvrp\",\n    **kwargs\n) -> tuple[Tensor, Tensor]\n

Classical solver for the environment. This is a wrapper for the baselines solver. Available solvers are: pyvrp, ortools, lkh. Returns the actions and costs.

Source code in rl4co/envs/routing/mtvrp/env.py
@staticmethod\ndef solve(\n    instances: TensorDict,\n    max_runtime: float,\n    num_procs: int = 1,\n    solver: str = \"pyvrp\",\n    **kwargs,\n) -> tuple[torch.Tensor, torch.Tensor]:\n    \"\"\"Classical solver for the environment. This is a wrapper for the baselines solver.\n    Available solvers are: `pyvrp`, `ortools`, `lkh`. Returns the actions and costs.\n    \"\"\"\n    from .baselines.solve import solve\n\n    return solve(instances, max_runtime, num_procs, solver, **kwargs)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.env.MTVRPEnv.check_variants","title":"check_variants staticmethod","text":"
check_variants(td)\n

Check if the problem has the variants

Source code in rl4co/envs/routing/mtvrp/env.py
@staticmethod\ndef check_variants(td):\n    \"\"\"Check if the problem has the variants\"\"\"\n    has_open = td[\"open_route\"].squeeze(-1)\n    has_tw = (td[\"time_windows\"][:, :, 1] != float(\"inf\")).any(-1)\n    has_limit = (td[\"distance_limit\"] != float(\"inf\")).squeeze(-1)\n    has_backhaul = (td[\"demand_backhaul\"] != 0).any(-1)\n    return has_open, has_tw, has_limit, has_backhaul\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator","title":"MTVRPGenerator","text":"
MTVRPGenerator(\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[\n        int, float, str, type, Callable\n    ] = Uniform,\n    capacity: float = None,\n    min_demand: int = 1,\n    max_demand: int = 10,\n    min_backhaul: int = 1,\n    max_backhaul: int = 10,\n    scale_demand: bool = True,\n    max_time: float = 4.6,\n    backhaul_ratio: float = 0.2,\n    distance_limit: float = 3.0,\n    speed: float = 1.0,\n    prob_open: float = 0.5,\n    prob_time_window: float = 0.5,\n    prob_limit: float = 0.5,\n    prob_backhaul: float = 0.5,\n    variant_preset=None,\n    use_combinations=True,\n    subsample=True,\n    **kwargs\n)\n

Bases: Generator

MTVRP Generator. Class to generate instances of the MTVRP problem. If a variant is declared and Subsample is True, the generator will sample the problem based on the variant probabilities. By default, we use Mixed-Batch Training as in Berto et al. 2024 (RouteFinder), i.e. one batch can contain multiple variants.

Example presets:

  • \"all\": Sample uniformly from 16 variants
  • \"single_feat\": Sample uniformly between CVRP, OVRP, VRPB, VRPL, VRPTW (as done in Liu et al. 2024 (MTPOMO))
  • \"single_feat_otw\": Sample uniformly between CVRP, OVRP, VRPB, VRPL, VRPTW, OVRPTW (as done in Zhou et al. 2024 (MVMoE))
  • \"cvrp\": Only CVRP (similarly for other variants)

Parameters:

  • num_loc (int, default: 20 ) \u2013

    Number of locations to generate

  • min_loc (float, default: 0.0 ) \u2013

    Minimum location value

  • max_loc (float, default: 1.0 ) \u2013

    Maximum location value

  • loc_distribution (Union[int, float, str, type, Callable], default: Uniform ) \u2013

    Distribution to sample locations from

  • capacity (float, default: None ) \u2013

    Vehicle capacity. If None, get value based on get_vehicle_capacity

  • min_demand (int, default: 1 ) \u2013

    Minimum demand value

  • max_demand (int, default: 10 ) \u2013

    Maximum demand value

  • min_backhaul (int, default: 1 ) \u2013

    Minimum backhaul value

  • max_backhaul (int, default: 10 ) \u2013

    Maximum backhaul value

  • scale_demand (bool, default: True ) \u2013

    Scale demand values (by default, generate between 1 and 10)

  • max_time (float, default: 4.6 ) \u2013

    Maximum time window value (at depot)

  • backhaul_ratio (float, default: 0.2 ) \u2013

    Fraction of backhauls (e.g. 0.2 means 20% of nodes are backhaul)

  • distance_limit (float, default: 3.0 ) \u2013

    Distance limit

  • speed (float, default: 1.0 ) \u2013

    Speed of vehicle. Defaults to 1

  • subsample \u2013

    If False, we always sample all attributes (i.e., OVRPBLTW). If True, we subsample the attributes according to the variant probabilities.

  • **kwargs \u2013

    Additional keyword arguments

Methods:

  • subsample_problems \u2013

    Create subproblems starting from seed probabilities depending on their variant.

  • generate_locations \u2013

    Generate seed locations.

  • generate_demands \u2013

    Classical linehaul demand / delivery from depot (C) and backhaul demand / pickup to depot (B) generation.

  • generate_time_windows \u2013

    Generate time windows (TW) and service times for each location including depot.

  • generate_distance_limit \u2013

    Generates distance limits (L) and checks their feasibilities.

  • generate_open_route \u2013

    Generate open route flags (O). Here we could have a sampler but we simply return True here so all

  • generate_speed \u2013

    We simply generate the speed as constant here

Source code in rl4co/envs/routing/mtvrp/generator.py
def __init__(\n    self,\n    num_loc: int = 20,\n    min_loc: float = 0.0,\n    max_loc: float = 1.0,\n    loc_distribution: Union[int, float, str, type, Callable] = Uniform,\n    capacity: float = None,\n    min_demand: int = 1,\n    max_demand: int = 10,\n    min_backhaul: int = 1,\n    max_backhaul: int = 10,\n    scale_demand: bool = True,\n    max_time: float = 4.6,\n    backhaul_ratio: float = 0.2,\n    distance_limit: float = 3.0,\n    speed: float = 1.0,\n    prob_open: float = 0.5,\n    prob_time_window: float = 0.5,\n    prob_limit: float = 0.5,\n    prob_backhaul: float = 0.5,\n    variant_preset=None,\n    use_combinations=True,\n    subsample=True,\n    **kwargs,\n) -> None:\n    # Location distribution\n    self.num_loc = num_loc\n    self.min_loc = min_loc\n    self.max_loc = max_loc\n    if kwargs.get(\"loc_sampler\", None) is not None:\n        self.loc_sampler = kwargs[\"loc_sampler\"]\n    else:\n        self.loc_sampler = get_sampler(\n            \"loc\", loc_distribution, min_loc, max_loc, **kwargs\n        )\n\n    if capacity is None:\n        capacity = get_vehicle_capacity(num_loc)\n    self.capacity = capacity\n    self.min_demand = min_demand\n    self.max_demand = max_demand\n    self.min_backhaul = min_backhaul\n    self.max_backhaul = max_backhaul\n    self.scale_demand = scale_demand\n    self.backhaul_ratio = backhaul_ratio\n\n    self.max_time = max_time\n    self.distance_limit = distance_limit\n    self.speed = speed\n\n    assert not (subsample and (variant_preset is None)), (\n        \"Cannot use subsample if variant_preset is not specified. \"\n    )\n    if variant_preset is not None:\n        log.info(f\"Using variant generation preset {variant_preset}\")\n        variant_probs = VARIANT_GENERATION_PRESETS.get(variant_preset)\n        assert (\n            variant_probs is not None\n        ), f\"Variant generation preset {variant_preset} not found. 
\\\n            Available presets are {VARIANT_GENERATION_PRESETS.keys()} with probabilities {VARIANT_GENERATION_PRESETS.values()}\"\n    else:\n        variant_probs = {\n            \"O\": prob_open,\n            \"TW\": prob_time_window,\n            \"L\": prob_limit,\n            \"B\": prob_backhaul,\n        }\n    # check probabilities\n    for key, prob in variant_probs.items():\n        assert 0 <= prob <= 1, f\"Probability {key} must be between 0 and 1\"\n    self.variant_probs = variant_probs\n    self.variant_preset = variant_preset\n    if isinstance(variant_preset, str) and variant_preset != \"all\":\n        log.warning(f\"{variant_preset} selected. Will not use feature combination!\")\n        use_combinations = False\n    self.use_combinations = use_combinations\n    self.subsample = subsample\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator.subsample_problems","title":"subsample_problems","text":"
subsample_problems(td)\n

Create subproblems starting from seed probabilities depending on their variant. If random seed sampled in [0, 1] in batch is greater than prob, remove the constraint thus, if prob high, it is less likely to remove the constraint (i.e. prob=0.9, 90% chance to keep constraint)

Source code in rl4co/envs/routing/mtvrp/generator.py
def subsample_problems(self, td):\n    \"\"\"Create subproblems starting from seed probabilities depending on their variant.\n    If random seed sampled in [0, 1] in batch is greater than prob, remove the constraint\n    thus, if prob high, it is less likely to remove the constraint (i.e. prob=0.9, 90% chance to keep constraint)\n    \"\"\"\n    batch_size = td.batch_size[0]\n\n    variant_probs = torch.tensor(list(self.variant_probs.values()))\n\n    if self.use_combinations:\n        # in a batch, multiple variants combinations can be picked\n        keep_mask = torch.rand(batch_size, 4) >= variant_probs  # O, TW, L, B\n    else:\n        # in a batch, only a variant can be picked.\n        # we assign a 0.5 prob to the last variant (which is normal cvrp)\n        if self.variant_preset in list(\n            VARIANT_GENERATION_PRESETS.keys()\n        ) and self.variant_preset not in (\n            \"all\",\n            \"cvrp\",\n            \"single_feat\",\n            \"single_feat_otw\",\n        ):\n            cvrp_prob = 0\n        else:\n            cvrp_prob = 0.5\n        if self.variant_preset in (\"all\", \"cvrp\", \"single_feat\", \"single_feat_otw\"):\n            indices = torch.distributions.Categorical(\n                torch.Tensor(list(self.variant_probs.values()) + [cvrp_prob])[\n                    None\n                ].repeat(batch_size, 1)\n            ).sample()\n            if self.variant_preset == \"single_feat_otw\":\n                keep_mask = torch.zeros((batch_size, 6), dtype=torch.bool)\n                keep_mask[torch.arange(batch_size), indices] = True\n\n                # If keep_mask[:, 4] is True, make both keep_mask[:, 0] and keep_mask[:, 1] True\n                keep_mask[:, :2] |= keep_mask[:, 4:5]\n            else:\n                keep_mask = torch.zeros((batch_size, 5), dtype=torch.bool)\n                keep_mask[torch.arange(batch_size), indices] = True\n        else:\n            # if the variant is specified, we 
keep the attributes with probability > 0\n            keep_mask = torch.zeros((batch_size, 4), dtype=torch.bool)\n            indices = torch.nonzero(variant_probs).squeeze()\n            keep_mask[:, indices] = True\n\n    td = self._default_open(td, ~keep_mask[:, 0])\n    td = self._default_time_window(td, ~keep_mask[:, 1])\n    td = self._default_distance_limit(td, ~keep_mask[:, 2])\n    td = self._default_backhaul(td, ~keep_mask[:, 3])\n\n    return td\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator.generate_locations","title":"generate_locations","text":"
generate_locations(batch_size, num_loc) -> Tensor\n

Generate seed locations.

Returns:

  • locs ( Tensor ) \u2013

    [B, N+1, 2] where the first location is the depot.

Source code in rl4co/envs/routing/mtvrp/generator.py
def generate_locations(self, batch_size, num_loc) -> torch.Tensor:\n    \"\"\"Generate seed locations.\n\n    Returns:\n        locs: [B, N+1, 2] where the first location is the depot.\n    \"\"\"\n    locs = torch.FloatTensor(*batch_size, num_loc + 1, 2).uniform_(\n        self.min_loc, self.max_loc\n    )\n    return locs\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator.generate_demands","title":"generate_demands","text":"
generate_demands(batch_size: int, num_loc: int) -> Tensor\n

Classical linehaul demand / delivery from depot (C) and backhaul demand / pickup to depot (B) generation. Initialize the demand for nodes except the depot, which are added during reset. Demand sampling: following Kool et al. (2019), demands are sampled as integers between 1 and 10. Generates a slightly different distribution than using torch.randint.

Returns:

  • linehaul_demand ( Tensor ) \u2013

    [B, N]

  • backhaul_demand ( Tensor ) \u2013

    [B, N]

Source code in rl4co/envs/routing/mtvrp/generator.py
def generate_demands(self, batch_size: int, num_loc: int) -> torch.Tensor:\n    \"\"\"Classical lineahul demand / delivery from depot (C) and backhaul demand / pickup to depot (B) generation.\n    Initialize the demand for nodes except the depot, which are added during reset.\n    Demand sampling Following Kool et al. (2019), demands as integers between 1 and 10.\n    Generates a slightly different distribution than using torch.randint.\n\n    Returns:\n        linehaul_demand: [B, N]\n        backhaul_demand: [B, N]\n    \"\"\"\n    linehaul_demand = (\n        torch.FloatTensor(*batch_size, num_loc)\n        .uniform_(self.min_demand - 1, self.max_demand - 1)\n        .int()\n        + 1\n    ).float()\n    # Backhaul demand sampling\n    backhaul_demand = (\n        torch.FloatTensor(*batch_size, num_loc)\n        .uniform_(self.min_backhaul - 1, self.max_backhaul - 1)\n        .int()\n        + 1\n    ).float()\n    is_linehaul = torch.rand(*batch_size, num_loc) > self.backhaul_ratio\n    backhaul_demand = (\n        backhaul_demand * ~is_linehaul\n    )  # keep only values where they are not linehauls\n    linehaul_demand = (\n        linehaul_demand * is_linehaul\n    )\n    return linehaul_demand, backhaul_demand\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator.generate_time_windows","title":"generate_time_windows","text":"
generate_time_windows(\n    locs: Tensor, speed: Tensor\n) -> Tensor\n

Generate time windows (TW) and service times for each location including depot. We refer to the generation process in \"Multi-Task Learning for Routing Problem with Cross-Problem Zero-Shot Generalization\" (Liu et al., 2024). Note that another way to generate is from \"Learning to Delegate for Large-scale Vehicle Routing\" (Li et al., 2021) which is used in \"MVMoE: Multi-Task Vehicle Routing Solver with Mixture-of-Experts\" (Zhou et al., 2024). Note, however, that in that case the distance limit would have no influence when time windows are present, since the time window for the depot is the same as the distance with speed=1. This function can be overridden for that implementation. See also https://github.com/RoyalSkye/Routing-MVMoE

Parameters:

  • locs (Tensor) \u2013

    [B, N+1, 2] (depot, locs)

  • speed (Tensor) \u2013

    [B]

Returns:

  • time_windows ( Tensor ) \u2013

    [B, N+1, 2]

  • service_time ( Tensor ) \u2013

    [B, N+1]

Source code in rl4co/envs/routing/mtvrp/generator.py
def generate_time_windows(\n    self,\n    locs: torch.Tensor,\n    speed: torch.Tensor,\n) -> torch.Tensor:\n    \"\"\"Generate time windows (TW) and service times for each location including depot.\n    We refer to the generation process in \"Multi-Task Learning for Routing Problem with Cross-Problem Zero-Shot Generalization\"\n    (Liu et al., 2024). Note that another way to generate is from \"Learning to Delegate for Large-scale Vehicle Routing\" (Li et al, 2021) which\n    is used in \"MVMoE: Multi-Task Vehicle Routing Solver with Mixture-of-Experts\" (Zhou et al, 2024). Note that however, in that case\n    the distance limit would have no influence when time windows are present, since the tw for depot is the same as distance with speed=1.\n    This function can be overridden for that implementation.\n    See also https://github.com/RoyalSkye/Routing-MVMoE\n\n    Args:\n        locs: [B, N+1, 2] (depot, locs)\n        speed: [B]\n\n    Returns:\n        time_windows: [B, N+1, 2]\n        service_time: [B, N+1]\n    \"\"\"\n\n    batch_size, n_loc = locs.shape[0], locs.shape[1] - 1  # no depot\n\n    a, b, c = 0.15, 0.18, 0.2\n    service_time = a + (b - a) * torch.rand(batch_size, n_loc)\n    tw_length = b + (c - b) * torch.rand(batch_size, n_loc)\n    d_0i = get_distance(locs[:, 0:1], locs[:, 1:])\n    h_max = (self.max_time - service_time - tw_length) / d_0i * speed - 1\n    tw_start = (1 + (h_max - 1) * torch.rand(batch_size, n_loc)) * d_0i / speed\n    tw_end = tw_start + tw_length\n\n    # Depot tw is 0, max_time\n    time_windows = torch.stack(\n        (\n            torch.cat((torch.zeros(batch_size, 1), tw_start), -1),  # start\n            torch.cat((torch.full((batch_size, 1), self.max_time), tw_end), -1),\n        ),  # en\n        dim=-1,\n    )\n    # depot service time is 0\n    service_time = torch.cat((torch.zeros(batch_size, 1), service_time), dim=-1)\n    return time_windows, service_time  # [B, N+1, 2], [B, N+1]\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator.generate_distance_limit","title":"generate_distance_limit","text":"
generate_distance_limit(\n    shape: Tuple[int, int], locs: Tensor\n) -> Tensor\n

Generates distance limits (L) and checks their feasibility.

Returns:

  • distance_limit ( Tensor ) \u2013

    [B, 1]

Source code in rl4co/envs/routing/mtvrp/generator.py
def generate_distance_limit(\n    self, shape: Tuple[int, int], locs: torch.Tensor\n) -> torch.Tensor:\n    \"\"\"Generates distance limits (L) and checks their feasibilities.\n\n    Returns:\n        distance_limit: [B, 1]\n    \"\"\"\n    # calculate distance of all locations to depot\n    dist_to_depot = torch.cdist(locs, locs[:, 0:1, :], p=2)\n    assert (\n        dist_to_depot * 2 < self.distance_limit  # go back and forth\n    ).all(), \"Distance limit too low, not all nodes can be reached from the depot.\"\n    return torch.full(shape, self.distance_limit, dtype=torch.float32)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator.generate_open_route","title":"generate_open_route","text":"
generate_open_route(shape: Tuple[int, int])\n

Generate open route flags (O). Here we could have a sampler but we simply return True here so all routes are open. Afterwards, we subsample the problems.

Source code in rl4co/envs/routing/mtvrp/generator.py
def generate_open_route(self, shape: Tuple[int, int]):\n    \"\"\"Generate open route flags (O). Here we could have a sampler but we simply return True here so all\n    routes are open. Afterwards, we subsample the problems.\n    \"\"\"\n    return torch.ones(shape, dtype=torch.bool)\n
"},{"location":"docs/content/api/envs/routing/#envs.routing.mtvrp.generator.MTVRPGenerator.generate_speed","title":"generate_speed","text":"
generate_speed(shape: Tuple[int, int])\n

We simply generate the speed as constant here

Source code in rl4co/envs/routing/mtvrp/generator.py
def generate_speed(self, shape: Tuple[int, int]):\n    \"\"\"We simply generate the speed as constant here\"\"\"\n    # in this version, the speed is constant but this class may be overridden\n    return torch.full(shape, self.speed, dtype=torch.float32)\n
"},{"location":"docs/content/api/envs/scheduling/","title":"Scheduling Problems","text":""},{"location":"docs/content/api/envs/scheduling/#flexible-flow-shop-problem-ffsp","title":"Flexible Flow Shop Problem (FFSP)","text":""},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.ffsp.env.FFSPEnv","title":"FFSPEnv","text":"
FFSPEnv(\n    generator: FFSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Flexible Flow Shop Problem (FFSP) environment. The goal is to schedule a set of jobs on a set of machines such that the makespan is minimized.

Observations
  • time index
  • sub time index
  • batch index
  • machine index
  • schedule
  • machine wait step
  • job location
  • job wait step
  • job duration
Constraints
  • each job has to be processed on each machine in a specific order
  • the machine has to be available to process the job
  • the job has to be available to be processed
Finish Condition
  • all jobs are scheduled
Reward
  • (minus) the makespan of the schedule

Parameters:

  • generator (FFSPGenerator, default: None ) \u2013

    FFSPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Source code in rl4co/envs/scheduling/ffsp/env.py
def __init__(\n    self,\n    generator: FFSPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(check_solution=False, dataset_cls=FastTdDataset, **kwargs)\n    if generator is None:\n        generator = FFSPGenerator(**generator_params)\n    self.generator = generator\n\n    self.num_stage = generator.num_stage\n    self.num_machine = generator.num_machine\n    self.num_job = generator.num_job\n    self.num_machine_total = generator.num_machine_total\n    self.tables = None\n    self.step_cnt = None\n    self.flatten_stages = generator.flatten_stages\n\n    self._make_spec(generator)\n
"},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.ffsp.generator.FFSPGenerator","title":"FFSPGenerator","text":"
FFSPGenerator(\n    num_stage: int = 2,\n    num_machine: int = 3,\n    num_job: int = 4,\n    min_time: int = 2,\n    max_time: int = 10,\n    flatten_stages: bool = True,\n    **unused_kwargs\n)\n

Bases: Generator

Data generator for the Flexible Flow Shop Problem (FFSP).

Parameters:

  • num_stage (int, default: 2 ) \u2013

    number of stages

  • num_machine (int, default: 3 ) \u2013

    number of machines

  • num_job (int, default: 4 ) \u2013

    number of jobs

  • min_time (int, default: 2 ) \u2013

    minimum running time of each job on each machine

  • max_time (int, default: 10 ) \u2013

    maximum running time of each job on each machine

  • flatten_stages (bool, default: True ) \u2013

    whether to flatten the stages

Returns:

  • \u2013

    A TensorDict with the following key: run_time [batch_size, num_job, num_machine, num_stage]: running time of each job on each machine

Note
  • [IMPORTANT] This version of ffsp requires the number of machines in each stage to be the same
Source code in rl4co/envs/scheduling/ffsp/generator.py
def __init__(\n    self,\n    num_stage: int = 2,\n    num_machine: int = 3,\n    num_job: int = 4,\n    min_time: int = 2,\n    max_time: int = 10,\n    flatten_stages: bool = True,\n    **unused_kwargs,\n):\n    self.num_stage = num_stage\n    self.num_machine = num_machine\n    self.num_machine_total = num_machine * num_stage\n    self.num_job = num_job\n    self.min_time = min_time\n    self.max_time = max_time\n    self.flatten_stages = flatten_stages\n\n    # FFSP environment doen't have any other kwargs\n    if len(unused_kwargs) > 0:\n        log.error(f\"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}\")\n
"},{"location":"docs/content/api/envs/scheduling/#flexible-job-shop-problem-fjsp","title":"Flexible Job Shop Problem (FJSP)","text":""},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.fjsp.env.FJSPEnv","title":"FJSPEnv","text":"
FJSPEnv(\n    generator: FJSPGenerator = None,\n    generator_params: dict = {},\n    mask_no_ops: bool = True,\n    check_mask: bool = False,\n    stepwise_reward: bool = False,\n    **kwargs\n)\n

Bases: RL4COEnvBase

Flexible Job-Shop Scheduling Problem (FJSP) environment. At each step, the agent chooses a job-machine combination. The operation to be processed next for the selected job is then executed on the selected machine. The reward is 0 unless the agent scheduled all operations of all jobs. In that case, the reward is (-)makespan of the schedule: maximizing the reward is equivalent to minimizing the makespan.

Observations
  • time: current time
  • next_op: next operation per job
  • proc_times: processing time of operation-machine pairs
  • pad_mask: specifies padded operations
  • start_op_per_job: id of first operation per job
  • end_op_per_job: id of last operation per job
  • start_times: start time of operation (defaults to 0 if not scheduled)
  • finish_times: finish time of operation (defaults to INIT_FINISH if not scheduled)
  • job_ops_adj: adjacency matrix specifying job-operation affiliation
  • ops_job_map: same as above but using ids of jobs to indicate affiliation
  • ops_sequence_order: specifies the order in which operations have to be processed
  • ma_assignment: specifies which operation has been scheduled on which machine
  • busy_until: specifies until when the machine will be busy
  • num_eligible: number of machines that can process an operation
  • job_in_process: whether job is currently being processed
  • job_done: whether the job is done
Constraints

the agent may not select:

  • machines that are currently busy
  • jobs that are done already
  • jobs that are currently processed
  • job-machine combinations, where the machine cannot process the next operation of the job
Finish condition
  • the agent has scheduled all operations of all jobs
Reward
  • the negative makespan of the final schedule

Parameters:

  • generator (FJSPGenerator, default: None ) \u2013

    FJSPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

  • mask_no_ops (bool, default: True ) \u2013

    if True, agent may not select waiting operation (unless instance is done)

Source code in rl4co/envs/scheduling/fjsp/env.py
def __init__(\n    self,\n    generator: FJSPGenerator = None,\n    generator_params: dict = {},\n    mask_no_ops: bool = True,\n    check_mask: bool = False,\n    stepwise_reward: bool = False,\n    **kwargs,\n):\n    super().__init__(check_solution=False, **kwargs)\n    if generator is None:\n        if generator_params.get(\"file_path\", None) is not None:\n            generator = FJSPFileGenerator(**generator_params)\n        else:\n            generator = FJSPGenerator(**generator_params)\n    self.generator = generator\n    self._num_mas = generator.num_mas\n    self._num_jobs = generator.num_jobs\n    self._n_ops_max = generator.max_ops_per_job * self.num_jobs\n\n    self.mask_no_ops = mask_no_ops\n    self.check_mask = check_mask\n    self.stepwise_reward = stepwise_reward\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.fjsp.generator.FJSPGenerator","title":"FJSPGenerator","text":"
FJSPGenerator(\n    num_jobs: int = 10,\n    num_machines: int = 5,\n    min_ops_per_job: int = 4,\n    max_ops_per_job: int = 6,\n    min_processing_time: int = 1,\n    max_processing_time: int = 20,\n    min_eligible_ma_per_op: int = 1,\n    max_eligible_ma_per_op: int = None,\n    same_mean_per_op: bool = True,\n    **unused_kwargs\n)\n

Bases: Generator

Data generator for the Flexible Job-Shop Scheduling Problem (FJSP).

Parameters:

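  • num_jobs (int, default: 10 ) \u2013

    number of jobs

  • num_machines (int, default: 5 ) \u2013

    number of machines

  • min_ops_per_job (int, default: 4 ) \u2013

    minimum number of operations per job

  • max_ops_per_job (int, default: 6 ) \u2013

    maximum number of operations per job

  • min_processing_time (int, default: 1 ) \u2013

    minimum processing time of an operation on a machine

  • max_processing_time (int, default: 20 ) \u2013

    maximum processing time of an operation on a machine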

Returns:

  • \u2013

    A TensorDict with the following keys: start_op_per_job [batch_size, num_jobs]: first operation of each job; end_op_per_job [batch_size, num_jobs]: last operation of each job; proc_times [batch_size, num_machines, total_n_ops]: processing time of ops on machines; pad_mask [batch_size, total_n_ops]: not all instances have the same number of ops, so padding is used

Source code in rl4co/envs/scheduling/fjsp/generator.py
def __init__(\n    self,\n    num_jobs: int = 10,\n    num_machines: int = 5,\n    min_ops_per_job: int = 4,\n    max_ops_per_job: int = 6,\n    min_processing_time: int = 1,\n    max_processing_time: int = 20,\n    min_eligible_ma_per_op: int = 1,\n    max_eligible_ma_per_op: int = None,\n    same_mean_per_op: bool = True,\n    **unused_kwargs,\n):\n    self.num_jobs = num_jobs\n    self.num_mas = num_machines\n    self.min_ops_per_job = min_ops_per_job\n    self.max_ops_per_job = max_ops_per_job\n    self.min_processing_time = min_processing_time\n    self.max_processing_time = max_processing_time\n    self.min_eligible_ma_per_op = min_eligible_ma_per_op\n    self.max_eligible_ma_per_op = max_eligible_ma_per_op or num_machines\n    # determines whether to use a fixed number of total operations or let it vary between instances\n    # NOTE: due to the way rl4co builds datasets, we need a fixed size here\n    self.n_ops_max = max_ops_per_job * num_jobs\n    self.same_mean_per_op = same_mean_per_op\n    # FFSP environment doen't have any other kwargs\n    if len(unused_kwargs) > 0:\n        log.error(f\"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}\")\n
"},{"location":"docs/content/api/envs/scheduling/#job-shop-scheduling-problem-jssp","title":"Job Shop Scheduling Problem (JSSP)","text":""},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.jssp.env.JSSPEnv","title":"JSSPEnv","text":"
JSSPEnv(\n    generator: JSSPGenerator = None,\n    generator_params: dict = {},\n    mask_no_ops: bool = True,\n    **kwargs\n)\n

Bases: FJSPEnv

Job-Shop Scheduling Problem (JSSP) environment. At each step, the agent chooses a job. The operation to be processed next for the selected job is then executed on the associated machine. The reward is 0 unless the agent scheduled all operations of all jobs. In that case, the reward is (-)makespan of the schedule: maximizing the reward is equivalent to minimizing the makespan. NOTE: The JSSP is a special case of the FJSP, when the number of eligible machines per operation is equal to one for all operations. Therefore, this environment is a subclass of the FJSP environment. Observations:

- time: current time\n- next_op: next operation per job\n- proc_times: processing time of operation-machine pairs\n- pad_mask: specifies padded operations\n- start_op_per_job: id of first operation per job\n- end_op_per_job: id of last operation per job\n- start_times: start time of operation (defaults to 0 if not scheduled)\n- finish_times: finish time of operation (defaults to INIT_FINISH if not scheduled)\n- job_ops_adj: adjacency matrix specifying job-operation affiliation\n- ops_job_map: same as above but using ids of jobs to indicate affiliation\n- ops_sequence_order: specifies the order in which operations have to be processed\n- ma_assignment: specifies which operation has been scheduled on which machine\n- busy_until: specifies until when the machine will be busy\n- num_eligible: number of machines that can process an operation\n- job_in_process: whether job is currently being processed\n- job_done: whether the job is done\n
Constraints

the agent may not select:

  • jobs that are done already
  • jobs that are currently processed
Finish condition
  • the agent has scheduled all operations of all jobs
Reward
  • the negative makespan of the final schedule

Parameters:

  • generator (JSSPGenerator, default: None ) \u2013

    JSSPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

  • mask_no_ops (bool, default: True ) \u2013

    if True, agent may not select waiting operation (unless instance is done)

Source code in rl4co/envs/scheduling/jssp/env.py
def __init__(\n    self,\n    generator: JSSPGenerator = None,\n    generator_params: dict = {},\n    mask_no_ops: bool = True,\n    **kwargs,\n):\n    if generator is None:\n        if generator_params.get(\"file_path\", None) is not None:\n            generator = JSSPFileGenerator(**generator_params)\n        else:\n            generator = JSSPGenerator(**generator_params)\n\n    super().__init__(generator, generator_params, mask_no_ops, **kwargs)\n
"},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.jssp.generator.JSSPGenerator","title":"JSSPGenerator","text":"
JSSPGenerator(\n    num_jobs: int = 6,\n    num_machines: int = 6,\n    min_ops_per_job: int = None,\n    max_ops_per_job: int = None,\n    min_processing_time: int = 1,\n    max_processing_time: int = 99,\n    one2one_ma_map: bool = True,\n    **unused_kwargs\n)\n

Bases: Generator

Data generator for the Job-Shop Scheduling Problem (JSSP)

Parameters:

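  • num_jobs (int, default: 6 ) \u2013

    number of jobs

  • num_machines (int, default: 6 ) \u2013

    number of machines

  • min_ops_per_job (int, default: None ) \u2013

    minimum number of operations per job; defaults to the number of machines

  • max_ops_per_job (int, default: None ) \u2013

    maximum number of operations per job; defaults to the number of machines

  • min_processing_time (int, default: 1 ) \u2013

    minimum processing time of an operation

  • max_processing_time (int, default: 99 ) \u2013

    maximum processing time of an operation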

  • one2one_ma_map (bool, default: True ) \u2013

    whether each machine should have exactly one operation per job (common in jssp benchmark instances)

Returns:

  • \u2013

    A TensorDict with the following keys: start_op_per_job [batch_size, num_jobs]: first operation of each job; end_op_per_job [batch_size, num_jobs]: last operation of each job; proc_times [batch_size, num_machines, total_n_ops]: processing time of ops on machines; pad_mask [batch_size, total_n_ops]: not all instances have the same number of ops, so padding is used

Source code in rl4co/envs/scheduling/jssp/generator.py
def __init__(\n    self,\n    num_jobs: int = 6,\n    num_machines: int = 6,\n    min_ops_per_job: int = None,\n    max_ops_per_job: int = None,\n    min_processing_time: int = 1,\n    max_processing_time: int = 99,\n    one2one_ma_map: bool = True,\n    **unused_kwargs,\n):\n    self.num_jobs = num_jobs\n    self.num_mas = num_machines\n    # quite common in jssp to have as many ops per job as there are machines\n    self.min_ops_per_job = min_ops_per_job or self.num_mas\n    self.max_ops_per_job = max_ops_per_job or self.num_mas\n    self.min_processing_time = min_processing_time\n    self.max_processing_time = max_processing_time\n    self.one2one_ma_map = one2one_ma_map\n    if self.one2one_ma_map:\n        assert self.min_ops_per_job == self.max_ops_per_job == self.num_mas\n\n    # determines whether to use a fixed number of total operations or let it vary between instances\n    # NOTE: due to the way rl4co builds datasets, we need a fixed size here\n    self.n_ops_max = self.max_ops_per_job * self.num_jobs\n\n    # FFSP environment doen't have any other kwargs\n    if len(unused_kwargs) > 0:\n        log.error(f\"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}\")\n
"},{"location":"docs/content/api/envs/scheduling/#single-machine-total-weighted-tardiness-problem-smtwtp","title":"Single Machine Total Weighted Tardiness Problem (SMTWTP)","text":""},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.smtwtp.env.SMTWTPEnv","title":"SMTWTPEnv","text":"
SMTWTPEnv(\n    generator: SMTWTPGenerator = None,\n    generator_params: dict = {},\n    **kwargs\n)\n

Bases: RL4COEnvBase

Single Machine Total Weighted Tardiness Problem environment as described in DeepACO (https://arxiv.org/pdf/2309.14032.pdf). SMTWTP is a scheduling problem in which a set of jobs must be processed on a single machine. Each job i has a processing time, a weight, and a due date. The objective is to minimize the sum of the weighted tardiness of all jobs, where the weighted tardiness of a job is defined as the product of its weight and the duration by which its completion time exceeds its due date. At each step, the agent chooses a job to process. The reward is 0 unless the agent processes all the jobs. In that case, the reward is (-)objective value of the processing order: maximizing the reward is equivalent to minimizing the objective.

Observation
  • job_due_time: the due time of each job
  • job_weight: the weight of each job
  • job_process_time: the process time of each job
  • current_node: the current node
  • action_mask: a mask of available actions
  • current_time: the current time
Constants
  • num_job: number of jobs
  • min_time_span: lower bound of jobs' due time. By default, jobs' due time is uniformly sampled from (min_time_span, max_time_span)
  • max_time_span: upper bound of jobs' due time. By default, it will be set to num_job / 2
  • min_job_weight: lower bound of jobs' weights. By default, jobs' weights are uniformly sampled from (min_job_weight, max_job_weight)
  • max_job_weight: upper bound of jobs' weights
  • min_process_time: lower bound of jobs' process time. By default, jobs' process time is uniformly sampled from (min_process_time, max_process_time)
  • max_process_time: upper bound of jobs' process time
Finishing condition
  • All jobs are processed
Reward
  • The reward is 0 unless the agent processes all the jobs.
  • In that case, the reward is (-)objective value of the processing order: maximizing the reward is equivalent to minimizing the objective.

Parameters:

  • generator (SMTWTPGenerator, default: None ) \u2013

    SMTWTPGenerator instance as the data generator

  • generator_params (dict, default: {} ) \u2013

    parameters for the generator

Source code in rl4co/envs/scheduling/smtwtp/env.py
def __init__(\n    self,\n    generator: SMTWTPGenerator = None,\n    generator_params: dict = {},\n    **kwargs,\n):\n    super().__init__(**kwargs)\n    if generator is None:\n        generator = SMTWTPGenerator(**generator_params)\n    self.generator = generator\n    self._make_spec(self.generator)\n
"},{"location":"docs/content/api/envs/scheduling/#envs.scheduling.smtwtp.generator.SMTWTPGenerator","title":"SMTWTPGenerator","text":"
SMTWTPGenerator(\n    num_job: int = 10,\n    min_time_span: float = 0,\n    max_time_span: float = None,\n    min_job_weight: float = 0,\n    max_job_weight: float = 1,\n    min_process_time: float = 0,\n    max_process_time: float = 1,\n    **unused_kwargs\n)\n

Bases: Generator

Data generator for the Single Machine Total Weighted Tardiness Problem (SMTWTP) environment

Parameters:

  • num_job (int, default: 10 ) \u2013

    number of jobs

  • min_time_span (float, default: 0 ) \u2013

    lower bound of jobs' due time. By default, jobs' due time is uniformly sampled from (min_time_span, max_time_span)

  • max_time_span (float, default: None ) \u2013

    upper bound of jobs' due time. By default, it will be set to num_job / 2

  • min_job_weight (float, default: 0 ) \u2013

    lower bound of jobs' weights. By default, jobs' weights are uniformly sampled from (min_job_weight, max_job_weight)

  • max_job_weight (float, default: 1 ) \u2013

    upper bound of jobs' weights

  • min_process_time (float, default: 0 ) \u2013

    lower bound of jobs' process time. By default, jobs' process time is uniformly sampled from (min_process_time, max_process_time)

  • max_process_time (float, default: 1 ) \u2013

    upper bound of jobs' process time

Returns:

  • \u2013

    A TensorDict with the following keys: job_due_time [batch_size, num_job + 1]: the due time of each job; job_weight [batch_size, num_job + 1]: the weight of each job; job_process_time [batch_size, num_job + 1]: the process time of each job

Source code in rl4co/envs/scheduling/smtwtp/generator.py
def __init__(\n    self,\n    num_job: int = 10,\n    min_time_span: float = 0,\n    max_time_span: float = None, # will be set to num_job / 2 by default. In DeepACO, it is set to num_job, which would be too simple\n    min_job_weight: float = 0,\n    max_job_weight: float = 1,\n    min_process_time: float = 0,\n    max_process_time: float = 1,\n    **unused_kwargs\n):\n    self.num_job = num_job\n    self.min_time_span = min_time_span\n    self.max_time_span = num_job / 2 if max_time_span is None else max_time_span\n    self.min_job_weight = min_job_weight\n    self.max_job_weight = max_job_weight\n    self.min_process_time = min_process_time\n    self.max_process_time = max_process_time\n\n    # SMTWTP environment doen't have any other kwargs\n    if len(unused_kwargs) > 0:\n        log.error(f\"Found {len(unused_kwargs)} unused kwargs: {unused_kwargs}\")\n
"},{"location":"docs/content/api/networks/base_policies/","title":"Constructive Policies Base Classes","text":"

Classes:

  • ConstructiveEncoder \u2013

    Base class for the encoder of constructive models

  • ConstructiveDecoder \u2013

    Base decoder model for constructive models. The decoder is responsible for generating the logits for the action

  • NoEncoder \u2013

    Default encoder for decoder-only models, i.e. autoregressive models that re-encode all the state at each decoding step.

  • ConstructivePolicy \u2013

    Base class for constructive policies. Constructive policies take as input an instance and output a solution (sequence of actions).

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.ConstructiveEncoder","title":"ConstructiveEncoder","text":"

Bases: Module

Base class for the encoder of constructive models

Methods:

  • forward \u2013

    Forward pass for the encoder

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.ConstructiveEncoder.forward","title":"forward abstractmethod","text":"
forward(td: TensorDict) -> Tuple[Any, Tensor]\n

Forward pass for the encoder

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the input data

Returns:

  • Tuple[Any, Tensor] \u2013

    Tuple containing:

    • latent representation (any type)
    • initial embeddings (from feature space to embedding space)
Source code in rl4co/models/common/constructive/base.py
@abc.abstractmethod\ndef forward(self, td: TensorDict) -> Tuple[Any, Tensor]:\n    \"\"\"Forward pass for the encoder\n\n    Args:\n        td: TensorDict containing the input data\n\n    Returns:\n        Tuple containing:\n          - latent representation (any type)\n          - initial embeddings (from feature space to embedding space)\n    \"\"\"\n    raise NotImplementedError(\"Implement me in subclass!\")\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.ConstructiveDecoder","title":"ConstructiveDecoder","text":"

Bases: Module

Base decoder model for constructive models. The decoder is responsible for generating the logits for the action

Methods:

  • forward \u2013

    Obtain logits for current action to the next ones

  • pre_decoder_hook \u2013

    By default, we don't need to do anything here.

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.ConstructiveDecoder.forward","title":"forward abstractmethod","text":"
forward(\n    td: TensorDict, hidden: Any = None, num_starts: int = 0\n) -> Tuple[Tensor, Tensor]\n

Obtain logits for current action to the next ones

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the input data

  • hidden (Any, default: None ) \u2013

    Hidden state from the encoder. Can be any type

  • num_starts (int, default: 0 ) \u2013

    Number of starts for multistart decoding

Returns:

  • Tuple[Tensor, Tensor] \u2013

    Tuple containing the logits and the action mask

Source code in rl4co/models/common/constructive/base.py
@abc.abstractmethod\ndef forward(\n    self, td: TensorDict, hidden: Any = None, num_starts: int = 0\n) -> Tuple[Tensor, Tensor]:\n    \"\"\"Obtain logits for current action to the next ones\n\n    Args:\n        td: TensorDict containing the input data\n        hidden: Hidden state from the encoder. Can be any type\n        num_starts: Number of starts for multistart decoding\n\n    Returns:\n        Tuple containing the logits and the action mask\n    \"\"\"\n    raise NotImplementedError(\"Implement me in subclass!\")\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.ConstructiveDecoder.pre_decoder_hook","title":"pre_decoder_hook","text":"
pre_decoder_hook(\n    td: TensorDict,\n    env: RL4COEnvBase,\n    hidden: Any = None,\n    num_starts: int = 0,\n) -> Tuple[TensorDict, Any, RL4COEnvBase]\n

By default, we don't need to do anything here.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the input data

  • hidden (Any, default: None ) \u2013

    Hidden state from the encoder

  • env (RL4COEnvBase) \u2013

    Environment for decoding

  • num_starts (int, default: 0 ) \u2013

    Number of starts for multistart decoding

Returns:

  • Tuple[TensorDict, Any, RL4COEnvBase] \u2013

    Tuple containing the updated TensorDict, environment, and hidden state

Source code in rl4co/models/common/constructive/base.py
def pre_decoder_hook(\n    self, td: TensorDict, env: RL4COEnvBase, hidden: Any = None, num_starts: int = 0\n) -> Tuple[TensorDict, Any, RL4COEnvBase]:\n    \"\"\"By default, we don't need to do anything here.\n\n    Args:\n        td: TensorDict containing the input data\n        hidden: Hidden state from the encoder\n        env: Environment for decoding\n        num_starts: Number of starts for multistart decoding\n\n    Returns:\n        Tuple containing the updated hidden state, TensorDict, and environment\n    \"\"\"\n    return td, env, hidden\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.NoEncoder","title":"NoEncoder","text":"

Bases: ConstructiveEncoder

Default encoder for decoder-only models, i.e. autoregressive models that re-encode all the state at each decoding step.

Methods:

  • forward \u2013

    Return Nones for the hidden state and initial embeddings

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.NoEncoder.forward","title":"forward","text":"
forward(td: TensorDict) -> Tuple[Tensor, Tensor]\n

Return Nones for the hidden state and initial embeddings

Source code in rl4co/models/common/constructive/base.py
def forward(self, td: TensorDict) -> Tuple[Tensor, Tensor]:\n    \"\"\"Return Nones for the hidden state and initial embeddings\"\"\"\n    return None, None\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.ConstructivePolicy","title":"ConstructivePolicy","text":"
ConstructivePolicy(\n    encoder: Union[ConstructiveEncoder, Callable],\n    decoder: Union[ConstructiveDecoder, Callable],\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    **unused_kw\n)\n

Bases: Module

Base class for constructive policies. Constructive policies take as input an instance and output a solution (sequence of actions). \"Constructive\" means that a solution is created from scratch by the model.

The structure follows roughly the following steps
  1. Create a hidden state from the encoder
  2. Initialize decoding strategy (such as greedy, sampling, etc.)
  3. Decode the action given the hidden state and the environment state at the current step
  4. Update the environment state with the action. Repeat 3-4 until all sequences are done
  5. Obtain log likelihood, rewards etc.

Note that an encoder is not strictly needed (see :class:NoEncoder). A decoder, however, is always needed, either in the form of a network or a function.

Note

There are major differences between this decoding and most RL problems. The most important one is that the reward may not be defined for partial solutions, hence we have to wait for the environment to reach a terminal state before we can compute the reward with env.get_reward().

Warning

We suppose environments in the done state are still available for sampling. This is because in NCO we need to wait for all the environments to reach a terminal state before we can stop the decoding process. This is in contrast with the TorchRL framework (at the moment) where the env.rollout function automatically resets. You may follow tighter integration with TorchRL here: https://github.com/ai4co/rl4co/issues/72.

Parameters:

  • encoder (Union[ConstructiveEncoder, Callable]) \u2013

    Encoder to use

  • decoder (Union[ConstructiveDecoder, Callable]) \u2013

    Decoder to use

  • env_name (str, default: 'tsp' ) \u2013

    Environment name to solve (used for automatically instantiating networks)

  • temperature (float, default: 1.0 ) \u2013

    Temperature for the softmax during decoding

  • tanh_clipping (float, default: 0 ) \u2013

    Clipping value for the tanh activation (see Bello et al. 2016) during decoding

  • mask_logits (bool, default: True ) \u2013

    Whether to mask the logits or not during decoding

  • train_decode_type (str, default: 'sampling' ) \u2013

    Decoding strategy for training

  • val_decode_type (str, default: 'greedy' ) \u2013

    Decoding strategy for validation

  • test_decode_type (str, default: 'greedy' ) \u2013

    Decoding strategy for testing

Methods:

  • forward \u2013

    Forward pass of the policy.

Source code in rl4co/models/common/constructive/base.py
def __init__(\n    self,\n    encoder: Union[ConstructiveEncoder, Callable],\n    decoder: Union[ConstructiveDecoder, Callable],\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    **unused_kw,\n):\n    super(ConstructivePolicy, self).__init__()\n\n    if len(unused_kw) > 0:\n        log.error(f\"Found {len(unused_kw)} unused kwargs: {unused_kw}\")\n\n    self.env_name = env_name\n\n    # Encoder and decoder\n    if encoder is None:\n        log.warning(\"`None` was provided as encoder. Using `NoEncoder`.\")\n        encoder = NoEncoder()\n    self.encoder = encoder\n    self.decoder = decoder\n\n    # Decoding strategies\n    self.temperature = temperature\n    self.tanh_clipping = tanh_clipping\n    self.mask_logits = mask_logits\n    self.train_decode_type = train_decode_type\n    self.val_decode_type = val_decode_type\n    self.test_decode_type = test_decode_type\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.base.ConstructivePolicy.forward","title":"forward","text":"
forward(\n    td: TensorDict,\n    env: Optional[Union[str, RL4COEnvBase]] = None,\n    phase: str = \"train\",\n    calc_reward: bool = True,\n    return_actions: bool = True,\n    return_entropy: bool = False,\n    return_hidden: bool = False,\n    return_init_embeds: bool = False,\n    return_sum_log_likelihood: bool = True,\n    actions=None,\n    max_steps=1000000,\n    **decoding_kwargs\n) -> dict\n

Forward pass of the policy.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the environment state

  • env (Optional[Union[str, RL4COEnvBase]], default: None ) \u2013

    Environment to use for decoding. If None, the environment is instantiated from env_name. Note that it is more efficient to pass an already instantiated environment each time for fine-grained control

  • phase (str, default: 'train' ) \u2013

    Phase of the algorithm (train, val, test)

  • calc_reward (bool, default: True ) \u2013

    Whether to calculate the reward

  • return_actions (bool, default: True ) \u2013

    Whether to return the actions

  • return_entropy (bool, default: False ) \u2013

    Whether to return the entropy

  • return_hidden (bool, default: False ) \u2013

    Whether to return the hidden state

  • return_init_embeds (bool, default: False ) \u2013

    Whether to return the initial embeddings

  • return_sum_log_likelihood (bool, default: True ) \u2013

    Whether to return the sum of the log likelihood

  • actions \u2013

    Actions to use for evaluating the policy. If passed, use these actions instead of sampling from the policy to calculate log likelihood

  • max_steps \u2013

    Maximum number of decoding steps for sanity check to avoid infinite loops if envs are buggy (i.e. do not reach done)

  • decoding_kwargs \u2013

    Keyword arguments for the decoding strategy. See :class:rl4co.utils.decoding.DecodingStrategy for more information.

Returns:

  • out ( dict ) \u2013

    Dictionary containing the reward, log likelihood, and optionally the actions and entropy

Source code in rl4co/models/common/constructive/base.py
def forward(\n    self,\n    td: TensorDict,\n    env: Optional[Union[str, RL4COEnvBase]] = None,\n    phase: str = \"train\",\n    calc_reward: bool = True,\n    return_actions: bool = True,\n    return_entropy: bool = False,\n    return_hidden: bool = False,\n    return_init_embeds: bool = False,\n    return_sum_log_likelihood: bool = True,\n    actions=None,\n    max_steps=1_000_000,\n    **decoding_kwargs,\n) -> dict:\n    \"\"\"Forward pass of the policy.\n\n    Args:\n        td: TensorDict containing the environment state\n        env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that\n            it is more efficient to pass an already instantiated environment each time for fine-grained control\n        phase: Phase of the algorithm (train, val, test)\n        calc_reward: Whether to calculate the reward\n        return_actions: Whether to return the actions\n        return_entropy: Whether to return the entropy\n        return_hidden: Whether to return the hidden state\n        return_init_embeds: Whether to return the initial embeddings\n        return_sum_log_likelihood: Whether to return the sum of the log likelihood\n        actions: Actions to use for evaluating the policy.\n            If passed, use these actions instead of sampling from the policy to calculate log likelihood\n        max_steps: Maximum number of decoding steps for sanity check to avoid infinite loops if envs are buggy (i.e. do not reach `done`)\n        decoding_kwargs: Keyword arguments for the decoding strategy. 
See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.\n\n    Returns:\n        out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy\n    \"\"\"\n\n    # Encoder: get encoder output and initial embeddings from initial state\n    hidden, init_embeds = self.encoder(td)\n\n    # Instantiate environment if needed\n    if isinstance(env, str) or env is None:\n        env_name = self.env_name if env is None else env\n        log.info(f\"Instantiated environment not provided; instantiating {env_name}\")\n        env = get_env(env_name)\n\n    # Get decode type depending on phase and whether actions are passed for evaluation\n    decode_type = decoding_kwargs.pop(\"decode_type\", None)\n    if actions is not None:\n        decode_type = \"evaluate\"\n    elif decode_type is None:\n        decode_type = getattr(self, f\"{phase}_decode_type\")\n\n    # Setup decoding strategy\n    # we pop arguments that are not part of the decoding strategy\n    decode_strategy: DecodingStrategy = get_decoding_strategy(\n        decode_type,\n        temperature=decoding_kwargs.pop(\"temperature\", self.temperature),\n        tanh_clipping=decoding_kwargs.pop(\"tanh_clipping\", self.tanh_clipping),\n        mask_logits=decoding_kwargs.pop(\"mask_logits\", self.mask_logits),\n        store_all_logp=decoding_kwargs.pop(\"store_all_logp\", return_entropy),\n        **decoding_kwargs,\n    )\n\n    # Pre-decoding hook: used for the initial step(s) of the decoding strategy\n    td, env, num_starts = decode_strategy.pre_decoder_hook(td, env)\n\n    # Additionally call a decoder hook if needed before main decoding\n    td, env, hidden = self.decoder.pre_decoder_hook(td, env, hidden, num_starts)\n\n    # Main decoding: loop until all sequences are done\n    step = 0\n    while not td[\"done\"].all():\n        logits, mask = self.decoder(td, hidden, num_starts)\n        td = decode_strategy.step(\n            logits,\n            mask,\n     
       td,\n            action=actions[..., step] if actions is not None else None,\n        )\n        td = env.step(td)[\"next\"]\n        step += 1\n        if step > max_steps:\n            log.error(\n                f\"Exceeded maximum number of steps ({max_steps}) duing decoding\"\n            )\n            break\n\n    # Post-decoding hook: used for the final step(s) of the decoding strategy\n    logprobs, actions, td, env = decode_strategy.post_decoder_hook(td, env)\n\n    # Output dictionary construction\n    if calc_reward:\n        td.set(\"reward\", env.get_reward(td, actions))\n\n    outdict = {\n        \"reward\": td[\"reward\"],\n        \"log_likelihood\": get_log_likelihood(\n            logprobs, actions, td.get(\"mask\", None), return_sum_log_likelihood\n        ),\n    }\n\n    if return_actions:\n        outdict[\"actions\"] = actions\n    if return_entropy:\n        outdict[\"entropy\"] = calculate_entropy(logprobs)\n    if return_hidden:\n        outdict[\"hidden\"] = hidden\n    if return_init_embeds:\n        outdict[\"init_embeds\"] = init_embeds\n\n    return outdict\n
"},{"location":"docs/content/api/networks/base_policies/#autoregressive-policies","title":"Autoregressive Policies","text":"

Classes:

  • AutoregressiveEncoder \u2013

    Template class for an autoregressive encoder, simple wrapper around

Classes:

  • AutoregressiveDecoder \u2013

    Template class for an autoregressive decoder, simple wrapper around

Classes:

  • AutoregressivePolicy \u2013

    Template class for an autoregressive policy, simple wrapper around

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.autoregressive.encoder.AutoregressiveEncoder","title":"AutoregressiveEncoder","text":"

Bases: ConstructiveEncoder

Template class for an autoregressive encoder, simple wrapper around :class:rl4co.models.common.constructive.base.ConstructiveEncoder.

Tip

This class will not work as it is and is just a template. An example for autoregressive encoder can be found as :class:rl4co.models.zoo.am.encoder.AttentionModelEncoder.

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.autoregressive.decoder.AutoregressiveDecoder","title":"AutoregressiveDecoder","text":"

Bases: ConstructiveDecoder

Template class for an autoregressive decoder, simple wrapper around :class:rl4co.models.common.constructive.base.ConstructiveDecoder

Tip

This class will not work as it is and is just a template. An example for autoregressive decoder can be found as :class:rl4co.models.zoo.am.decoder.AttentionModelDecoder.

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.autoregressive.policy.AutoregressivePolicy","title":"AutoregressivePolicy","text":"
AutoregressivePolicy(\n    encoder: AutoregressiveEncoder,\n    decoder: AutoregressiveDecoder,\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    **unused_kw\n)\n

Bases: ConstructivePolicy

Template class for an autoregressive policy, simple wrapper around :class:rl4co.models.common.constructive.base.ConstructivePolicy.

Note

While a decoder is required, an encoder is optional and will be initialized to :class:rl4co.models.common.constructive.autoregressive.encoder.NoEncoder. This can be used in decoder-only models in which at each step actions do not depend on previously encoded states.

Source code in rl4co/models/common/constructive/autoregressive/policy.py
def __init__(\n    self,\n    encoder: AutoregressiveEncoder,\n    decoder: AutoregressiveDecoder,\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    **unused_kw,\n):\n    # We raise an error for the user if no decoder was provided\n    if decoder is None:\n        raise ValueError(\"AutoregressivePolicy requires a decoder to be provided.\")\n\n    super(AutoregressivePolicy, self).__init__(\n        encoder=encoder,\n        decoder=decoder,\n        env_name=env_name,\n        temperature=temperature,\n        tanh_clipping=tanh_clipping,\n        mask_logits=mask_logits,\n        train_decode_type=train_decode_type,\n        val_decode_type=val_decode_type,\n        test_decode_type=test_decode_type,\n        **unused_kw,\n    )\n
"},{"location":"docs/content/api/networks/base_policies/#nonautoregressive-policies","title":"Nonautoregressive Policies","text":"

Classes:

  • NonAutoregressiveEncoder \u2013

    Template class for a nonautoregressive encoder, simple wrapper around

Classes:

  • NonAutoregressiveDecoder \u2013

    The nonautoregressive decoder is a simple callable class that

Classes:

  • NonAutoregressivePolicy \u2013

    Template class for a nonautoregressive policy, simple wrapper around

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.nonautoregressive.encoder.NonAutoregressiveEncoder","title":"NonAutoregressiveEncoder","text":"

Bases: ConstructiveEncoder

Template class for a nonautoregressive encoder, simple wrapper around :class:rl4co.models.common.constructive.base.ConstructiveEncoder.

Tip

This class will not work as it is and is just a template. An example for autoregressive encoder can be found as :class:rl4co.models.zoo.am.encoder.AttentionModelEncoder.

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.nonautoregressive.decoder.NonAutoregressiveDecoder","title":"NonAutoregressiveDecoder","text":"

Bases: ConstructiveDecoder

The nonautoregressive decoder is a simple callable class that takes the tensor dictionary and the heatmap logits and returns the logits for the current action and the action mask.

Methods:

  • heatmap_to_logits \u2013

    Obtain heatmap logits for current action to the next ones

"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.nonautoregressive.decoder.NonAutoregressiveDecoder.heatmap_to_logits","title":"heatmap_to_logits staticmethod","text":"
heatmap_to_logits(\n    td: TensorDict, heatmaps_logits: Tensor, num_starts: int\n)\n

Obtain heatmap logits for current action to the next ones

Source code in rl4co/models/common/constructive/nonautoregressive/decoder.py
@staticmethod\ndef heatmap_to_logits(td: TensorDict, heatmaps_logits: torch.Tensor, num_starts: int):\n    \"\"\"Obtain heatmap logits for current action to the next ones\"\"\"\n    current_action = td.get(\"action\", None)\n    if current_action is None:\n        logits = heatmaps_logits.mean(-1)\n    else:\n        batch_size = heatmaps_logits.shape[0]\n        _indexer = _multistart_batched_index(batch_size, num_starts)\n        logits = heatmaps_logits[_indexer, current_action, :]\n    return logits, td[\"action_mask\"]\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.constructive.nonautoregressive.policy.NonAutoregressivePolicy","title":"NonAutoregressivePolicy","text":"
NonAutoregressivePolicy(\n    encoder: NonAutoregressiveEncoder,\n    decoder: NonAutoregressiveDecoder = None,\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    **unused_kw\n)\n

Bases: ConstructivePolicy

Template class for a nonautoregressive policy, simple wrapper around :class:rl4co.models.common.constructive.base.ConstructivePolicy.

Source code in rl4co/models/common/constructive/nonautoregressive/policy.py
def __init__(\n    self,\n    encoder: NonAutoregressiveEncoder,\n    decoder: NonAutoregressiveDecoder = None,\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    **unused_kw,\n):\n    # If decoder is not passed, we default to the non-autoregressive decoder that decodes the heatmap\n    if decoder is None:\n        decoder = NonAutoregressiveDecoder()\n\n    super(NonAutoregressivePolicy, self).__init__(\n        encoder=encoder,\n        decoder=decoder,\n        env_name=env_name,\n        temperature=temperature,\n        tanh_clipping=tanh_clipping,\n        mask_logits=mask_logits,\n        train_decode_type=train_decode_type,\n        val_decode_type=val_decode_type,\n        test_decode_type=test_decode_type,\n        **unused_kw,\n    )\n
"},{"location":"docs/content/api/networks/base_policies/#improvement-policies-base-classes","title":"Improvement Policies (Base Classes)","text":"

Classes:

  • ImprovementEncoder \u2013

    Base class for the encoder of improvement models

  • ImprovementDecoder \u2013

    Base decoder model for improvement models. The decoder is responsible for generating the logits of the action

  • ImprovementPolicy \u2013

    Base class for improvement policies. Improvement policies take an instance + a solution as input and output a specific operator that changes the current solution to a new one.

"},{"location":"docs/content/api/networks/base_policies/#models.common.improvement.base.ImprovementEncoder","title":"ImprovementEncoder","text":"
ImprovementEncoder(\n    embed_dim: int = 128,\n    init_embedding: Module = None,\n    pos_embedding: Module = None,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    linear_bias: bool = False,\n)\n

Bases: Module

Base class for the encoder of improvement models

Methods:

  • forward \u2013

    Forward pass of the encoder.

Source code in rl4co/models/common/improvement/base.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    init_embedding: nn.Module = None,\n    pos_embedding: nn.Module = None,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    linear_bias: bool = False,\n):\n    super(ImprovementEncoder, self).__init__()\n\n    if isinstance(env_name, RL4COEnvBase):\n        env_name = env_name.name\n    self.env_name = env_name\n    self.init_embedding = (\n        env_init_embedding(\n            self.env_name, {\"embed_dim\": embed_dim, \"linear_bias\": linear_bias}\n        )\n        if init_embedding is None\n        else init_embedding\n    )\n\n    self.pos_type = pos_type\n    self.pos_embedding = (\n        pos_init_embedding(self.pos_type, {\"embed_dim\": embed_dim})\n        if pos_embedding is None\n        else pos_embedding\n    )\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.improvement.base.ImprovementEncoder.forward","title":"forward","text":"
forward(td: TensorDict) -> Tuple[Tensor, Tensor]\n

Forward pass of the encoder. Transform the input TensorDict into a latent representation.

Parameters:

  • td (TensorDict) \u2013

    Input TensorDict containing the environment state

Returns:

  • h ( Tensor ) \u2013

    Latent representation of the input

  • init_h ( Tensor ) \u2013

    Initial embedding of the input

Source code in rl4co/models/common/improvement/base.py
def forward(self, td: TensorDict) -> Tuple[Tensor, Tensor]:\n    \"\"\"Forward pass of the encoder.\n    Transform the input TensorDict into a latent representation.\n\n    Args:\n        td: Input TensorDict containing the environment state\n\n    Returns:\n        h: Latent representation of the input\n        init_h: Initial embedding of the input\n    \"\"\"\n    # Transfer to embedding space (node)\n    init_h = self.init_embedding(td)\n\n    # Transfer to embedding space (solution)\n    init_p = self.pos_embedding(td)\n\n    # Process embedding\n    final_h, final_p = self._encoder_forward(init_h, init_p)\n\n    # Return latent representation and initial embedding\n    return final_h, final_p\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.improvement.base.ImprovementDecoder","title":"ImprovementDecoder","text":"

Bases: Module

Base decoder model for improvement models. The decoder is responsible for generating the logits of the action

Methods:

  • forward \u2013

    Obtain logits to perform operators that improve the current solution to the next ones

"},{"location":"docs/content/api/networks/base_policies/#models.common.improvement.base.ImprovementDecoder.forward","title":"forward abstractmethod","text":"
forward(\n    td: TensorDict, final_h: Tensor, final_p: Tensor\n) -> Tensor\n

Obtain logits to perform operators that improve the current solution to the next ones

Parameters:

  • td (TensorDict) \u2013

    TensorDict with the current environment state

  • final_h (Tensor) \u2013

    final node embeddings

  • final_p (Tensor) \u2013

    final positional embeddings

Returns:

  • Tensor \u2013

    Tensor containing the logits

Source code in rl4co/models/common/improvement/base.py
@abc.abstractmethod\ndef forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> Tensor:\n    \"\"\"Obtain logits to perform operators that improve the current solution to the next ones\n\n    Args:\n        td: TensorDict with the current environment state\n        final_h: final node embeddings\n        final_p: final positional embeddings\n\n    Returns:\n        Tuple containing the logits\n    \"\"\"\n    raise NotImplementedError(\"Implement me in subclass!\")\n
"},{"location":"docs/content/api/networks/base_policies/#models.common.improvement.base.ImprovementPolicy","title":"ImprovementPolicy","text":"

Bases: Module

Base class for improvement policies. Improvement policies take an instance + a solution as input and output a specific operator that changes the current solution to a new one.

\"Improvement\" means that a solution is (potentially) improved to a new one by the model.

Methods:

  • forward \u2013

    Forward pass of the policy.

"},{"location":"docs/content/api/networks/base_policies/#models.common.improvement.base.ImprovementPolicy.forward","title":"forward abstractmethod","text":"
forward(\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_entropy: bool = False,\n    return_init_embeds: bool = False,\n    actions=None,\n    **decoding_kwargs\n) -> dict\n

Forward pass of the policy.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the environment state

  • env (Union[str, RL4COEnvBase], default: None ) \u2013

    Environment to use for decoding. If None, the environment is instantiated from env_name. Note that it is more efficient to pass an already instantiated environment each time for fine-grained control

  • phase (str, default: 'train' ) \u2013

    Phase of the algorithm (train, val, test)

  • return_actions (bool, default: True ) \u2013

    Whether to return the actions

  • return_entropy (bool, default: False ) \u2013

    Whether to return the entropy

  • return_init_embeds (bool, default: False ) \u2013

    Whether to return the initial embeddings

  • actions \u2013

    Actions to use for evaluating the policy. If passed, use these actions instead of sampling from the policy to calculate log likelihood

  • decoding_kwargs \u2013

    Keyword arguments for the decoding strategy. See :class:rl4co.utils.decoding.DecodingStrategy for more information.

Returns:

  • out ( dict ) \u2013

    Dictionary containing the reward, log likelihood, and optionally the actions and entropy

Source code in rl4co/models/common/improvement/base.py
@abc.abstractmethod\ndef forward(\n    self,\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_entropy: bool = False,\n    return_init_embeds: bool = False,\n    actions=None,\n    **decoding_kwargs,\n) -> dict:\n    \"\"\"Forward pass of the policy.\n\n    Args:\n        td: TensorDict containing the environment state\n        env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that\n            it is more efficient to pass an already instantiated environment each time for fine-grained control\n        phase: Phase of the algorithm (train, val, test)\n        return_actions: Whether to return the actions\n        return_entropy: Whether to return the entropy\n        return_init_embeds: Whether to return the initial embeddings\n        actions: Actions to use for evaluating the policy.\n            If passed, use these actions instead of sampling from the policy to calculate log likelihood\n        decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.\n\n    Returns:\n        out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy\n    \"\"\"\n    raise NotImplementedError(\"Implement me in subclass!\")\n
"},{"location":"docs/content/api/networks/env_embeddings/","title":"Environment Embeddings","text":"

In autoregressive policies, environment embeddings transfer data from feature space to hidden space:

  • Initial Embeddings: encode global problem features
  • Context Embeddings: modify current node embedding during decoding
  • Dynamic Embeddings: modify all node embeddings during decoding

"},{"location":"docs/content/api/networks/env_embeddings/#context-embeddings","title":"Context Embeddings","text":"

The context embedding is used to modify the query embedding of the problem node of the current partial solution. Usually consists of a projection of gathered node embeddings and features to the embedding space.

Classes:

  • EnvContext \u2013

    Base class for environment context embeddings. The context embedding is used to modify the

  • FFSPContext \u2013
  • TSPContext \u2013

    Context embedding for the Traveling Salesman Problem (TSP).

  • VRPContext \u2013

    Context embedding for the Capacitated Vehicle Routing Problem (CVRP).

  • VRPTWContext \u2013

    Context embedding for the Capacitated Vehicle Routing Problem with Time Windows (CVRPTW).

  • SVRPContext \u2013

    Context embedding for the Skill Vehicle Routing Problem (SVRP).

  • PCTSPContext \u2013

    Context embedding for the Prize Collecting TSP (PCTSP).

  • OPContext \u2013

    Context embedding for the Orienteering Problem (OP).

  • DPPContext \u2013

    Context embedding for the Decap Placement Problem (DPP), EDA (electronic design automation).

  • PDPContext \u2013

    Context embedding for the Pickup and Delivery Problem (PDP).

  • MTSPContext \u2013

    Context embedding for the Multiple Traveling Salesman Problem (mTSP).

  • SMTWTPContext \u2013

    Context embedding for the Single Machine Total Weighted Tardiness Problem (SMTWTP).

  • MDCPDPContext \u2013

    Context embedding for the MDCPDP.

  • MTVRPContext \u2013

    Context embedding for Multi-Task VRPEnv.

Functions:

  • env_context_embedding \u2013

    Get environment context embedding. The context embedding is used to modify the

"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.EnvContext","title":"EnvContext","text":"
EnvContext(\n    embed_dim, step_context_dim=None, linear_bias=False\n)\n

Bases: Module

Base class for environment context embeddings. The context embedding is used to modify the query embedding of the problem node of the current partial solution. Consists of a linear layer that projects the node features to the embedding space.

Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim, step_context_dim=None, linear_bias=False):\n    super(EnvContext, self).__init__()\n    self.embed_dim = embed_dim\n    step_context_dim = step_context_dim if step_context_dim is not None else embed_dim\n    self.project_context = nn.Linear(step_context_dim, embed_dim, bias=linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.FFSPContext","title":"FFSPContext","text":"
FFSPContext(embed_dim, stage_cnt=None)\n

Bases: EnvContext

Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim, stage_cnt=None):\n    self.has_stage_emb = stage_cnt is not None\n    step_context_dim = (1 + int(self.has_stage_emb)) * embed_dim\n    super().__init__(embed_dim=embed_dim, step_context_dim=step_context_dim)\n    if self.has_stage_emb:\n        self.stage_emb = nn.Parameter(torch.rand(stage_cnt, embed_dim))\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.TSPContext","title":"TSPContext","text":"
TSPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Traveling Salesman Problem (TSP). Project the following to the embedding space:

- first node embedding\n- current node embedding\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(TSPContext, self).__init__(embed_dim, 2 * embed_dim)\n    self.W_placeholder = nn.Parameter(\n        torch.Tensor(2 * self.embed_dim).uniform_(-1, 1)\n    )\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.VRPContext","title":"VRPContext","text":"
VRPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Capacitated Vehicle Routing Problem (CVRP). Project the following to the embedding space:

- current node embedding\n- remaining capacity (vehicle_capacity - used_capacity)\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(VRPContext, self).__init__(\n        embed_dim=embed_dim, step_context_dim=embed_dim + 1\n    )\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.VRPTWContext","title":"VRPTWContext","text":"
VRPTWContext(embed_dim)\n

Bases: VRPContext

Context embedding for the Capacitated Vehicle Routing Problem with Time Windows (CVRPTW). Project the following to the embedding space:

- current node embedding\n- remaining capacity (vehicle_capacity - used_capacity)\n- current time\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(VRPContext, self).__init__(\n        embed_dim=embed_dim, step_context_dim=embed_dim + 2\n    )\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.SVRPContext","title":"SVRPContext","text":"
SVRPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Skill Vehicle Routing Problem (SVRP). Project the following to the embedding space:

- current node embedding\n- current technician\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(SVRPContext, self).__init__(embed_dim=embed_dim, step_context_dim=embed_dim)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.PCTSPContext","title":"PCTSPContext","text":"
PCTSPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Prize Collecting TSP (PCTSP). Project the following to the embedding space:

- current node embedding\n- remaining prize (prize_required - cur_total_prize)\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(PCTSPContext, self).__init__(embed_dim, embed_dim + 1)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.OPContext","title":"OPContext","text":"
OPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Orienteering Problem (OP). Project the following to the embedding space:

- current node embedding\n- remaining distance (max_length - tour_length)\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(OPContext, self).__init__(embed_dim, embed_dim + 1)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.DPPContext","title":"DPPContext","text":"
DPPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Decap Placement Problem (DPP), EDA (electronic design automation). Project the following to the embedding space:

- current cell embedding\n

Methods:

  • forward \u2013

    Context cannot be defined by a single node embedding for DPP, hence 0.

Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(DPPContext, self).__init__(embed_dim)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.DPPContext.forward","title":"forward","text":"
forward(embeddings, td)\n

Context cannot be defined by a single node embedding for DPP, hence 0. We modify the dynamic embedding instead to capture placed items

Source code in rl4co/models/nn/env_embeddings/context.py
def forward(self, embeddings, td):\n    \"\"\"Context cannot be defined by a single node embedding for DPP, hence 0.\n    We modify the dynamic embedding instead to capture placed items\n    \"\"\"\n    return embeddings.new_zeros(embeddings.size(0), self.embed_dim)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.PDPContext","title":"PDPContext","text":"
PDPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Pickup and Delivery Problem (PDP). Project the following to the embedding space:

- current node embedding\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(PDPContext, self).__init__(embed_dim, embed_dim)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.MTSPContext","title":"MTSPContext","text":"
MTSPContext(embed_dim, linear_bias=False)\n

Bases: EnvContext

Context embedding for the Multiple Traveling Salesman Problem (mTSP). Project the following to the embedding space:

- current node embedding\n- remaining_agents\n- current_length\n- max_subtour_length\n- distance_from_depot\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim, linear_bias=False):\n    super(MTSPContext, self).__init__(embed_dim, 2 * embed_dim)\n    proj_in_dim = (\n        4  # remaining_agents, current_length, max_subtour_length, distance_from_depot\n    )\n    self.proj_dynamic_feats = nn.Linear(proj_in_dim, embed_dim, bias=linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.SMTWTPContext","title":"SMTWTPContext","text":"
SMTWTPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the Single Machine Total Weighted Tardiness Problem (SMTWTP). Project the following to the embedding space:

- current node embedding\n- current time\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(SMTWTPContext, self).__init__(embed_dim, embed_dim + 1)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.MDCPDPContext","title":"MDCPDPContext","text":"
MDCPDPContext(embed_dim)\n

Bases: EnvContext

Context embedding for the MDCPDP. Project the following to the embedding space:

- current node embedding\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(MDCPDPContext, self).__init__(embed_dim, embed_dim)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.MTVRPContext","title":"MTVRPContext","text":"
MTVRPContext(embed_dim)\n

Bases: VRPContext

Context embedding for Multi-Task VRPEnv. Project the following to the embedding space:

- current node embedding\n- remaining_linehaul_capacity (vehicle_capacity - used_capacity_linehaul)\n- remaining_backhaul_capacity (vehicle_capacity - used_capacity_backhaul)\n- current time\n- current_route_length\n- open route indicator\n
Source code in rl4co/models/nn/env_embeddings/context.py
def __init__(self, embed_dim):\n    super(VRPContext, self).__init__(\n        embed_dim=embed_dim, step_context_dim=embed_dim + 5\n    )\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.context.env_context_embedding","title":"env_context_embedding","text":"
env_context_embedding(\n    env_name: str, config: dict\n) -> Module\n

Get environment context embedding. The context embedding is used to modify the query embedding of the problem node of the current partial solution. Usually consists of a projection of gathered node embeddings and features to the embedding space.

Parameters:

  • env_name (str) \u2013

    Name of the environment, used as the key to look up its context embedding class.

  • config (dict) \u2013

    A dictionary of configuration options for the environment.

Source code in rl4co/models/nn/env_embeddings/context.py
def env_context_embedding(env_name: str, config: dict) -> nn.Module:\n    \"\"\"Get environment context embedding. The context embedding is used to modify the\n    query embedding of the problem node of the current partial solution.\n    Usually consists of a projection of gathered node embeddings and features to the embedding space.\n\n    Args:\n        env: Environment or its name.\n        config: A dictionary of configuration options for the environment.\n    \"\"\"\n    embedding_registry = {\n        \"tsp\": TSPContext,\n        \"atsp\": TSPContext,\n        \"cvrp\": VRPContext,\n        \"cvrptw\": VRPTWContext,\n        \"ffsp\": FFSPContext,\n        \"svrp\": SVRPContext,\n        \"sdvrp\": VRPContext,\n        \"pctsp\": PCTSPContext,\n        \"spctsp\": PCTSPContext,\n        \"op\": OPContext,\n        \"dpp\": DPPContext,\n        \"mdpp\": DPPContext,\n        \"pdp\": PDPContext,\n        \"mtsp\": MTSPContext,\n        \"smtwtp\": SMTWTPContext,\n        \"mdcpdp\": MDCPDPContext,\n        \"mtvrp\": MTVRPContext,\n    }\n\n    if env_name not in embedding_registry:\n        raise ValueError(\n            f\"Unknown environment name '{env_name}'. Available context embeddings: {embedding_registry.keys()}\"\n        )\n\n    return embedding_registry[env_name](**config)\n
"},{"location":"docs/content/api/networks/env_embeddings/#dynamic-embeddings","title":"Dynamic Embeddings","text":"

The dynamic embedding is used to modify query, key and value vectors of the attention mechanism based on the current state of the environment (which is changing during the rollout). Generally consists of a linear layer that projects the node features to the embedding space.

Classes:

  • StaticEmbedding \u2013

    Static embedding for general problems.

  • SDVRPDynamicEmbedding \u2013

    Dynamic embedding for the Split Delivery Vehicle Routing Problem (SDVRP).

Functions:

  • env_dynamic_embedding \u2013

    Get environment dynamic embedding. The dynamic embedding is used to modify query, key and value vectors of the attention mechanism based on the current state of the environment (which is changing during the rollout).

"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.dynamic.StaticEmbedding","title":"StaticEmbedding","text":"
StaticEmbedding(*args, **kwargs)\n

Bases: Module

Static embedding for general problems. This is used for problems that do not have any dynamic information, except for the information regarding the current action (e.g. the current node in TSP). See context embedding for more details.

Source code in rl4co/models/nn/env_embeddings/dynamic.py
def __init__(self, *args, **kwargs):\n    super(StaticEmbedding, self).__init__()\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.dynamic.SDVRPDynamicEmbedding","title":"SDVRPDynamicEmbedding","text":"
SDVRPDynamicEmbedding(embed_dim, linear_bias=False)\n

Bases: Module

Dynamic embedding for the Split Delivery Vehicle Routing Problem (SDVRP). Embed the following node features to the embedding space:

- demand_with_depot: demand of the customers and the depot\n

The demand with depot is used to modify the query, key and value vectors of the attention mechanism based on the current state of the environment (which is changing during the rollout).

Source code in rl4co/models/nn/env_embeddings/dynamic.py
def __init__(self, embed_dim, linear_bias=False):\n    super(SDVRPDynamicEmbedding, self).__init__()\n    self.projection = nn.Linear(1, 3 * embed_dim, bias=linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.dynamic.env_dynamic_embedding","title":"env_dynamic_embedding","text":"
env_dynamic_embedding(\n    env_name: str, config: dict\n) -> Module\n

Get environment dynamic embedding. The dynamic embedding is used to modify query, key and value vectors of the attention mechanism based on the current state of the environment (which is changing during the rollout). Consists of a linear layer that projects the node features to the embedding space.

Parameters:

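  • env_name (str) \u2013

    Name of the environment, used as the key to look up its dynamic embedding class. Unknown names fall back to StaticEmbedding with a warning.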

  • config (dict) \u2013

    A dictionary of configuration options for the environment.

Source code in rl4co/models/nn/env_embeddings/dynamic.py
def env_dynamic_embedding(env_name: str, config: dict) -> nn.Module:\n    \"\"\"Get environment dynamic embedding. The dynamic embedding is used to modify query, key and value vectors of the attention mechanism\n    based on the current state of the environment (which is changing during the rollout).\n    Consists of a linear layer that projects the node features to the embedding space.\n\n    Args:\n        env: Environment or its name.\n        config: A dictionary of configuration options for the environment.\n    \"\"\"\n    embedding_registry = {\n        \"tsp\": StaticEmbedding,\n        \"atsp\": StaticEmbedding,\n        \"cvrp\": StaticEmbedding,\n        \"cvrptw\": StaticEmbedding,\n        \"ffsp\": StaticEmbedding,\n        \"svrp\": StaticEmbedding,\n        \"sdvrp\": SDVRPDynamicEmbedding,\n        \"pctsp\": StaticEmbedding,\n        \"spctsp\": StaticEmbedding,\n        \"op\": StaticEmbedding,\n        \"dpp\": StaticEmbedding,\n        \"mdpp\": StaticEmbedding,\n        \"pdp\": StaticEmbedding,\n        \"mtsp\": StaticEmbedding,\n        \"smtwtp\": StaticEmbedding,\n        \"jssp\": JSSPDynamicEmbedding,\n        \"fjsp\": JSSPDynamicEmbedding,\n        \"mtvrp\": StaticEmbedding,\n    }\n\n    if env_name not in embedding_registry:\n        log.warning(\n            f\"Unknown environment name '{env_name}'. Available dynamic embeddings: {embedding_registry.keys()}. Defaulting to StaticEmbedding.\"\n        )\n    return embedding_registry.get(env_name, StaticEmbedding)(**config)\n
"},{"location":"docs/content/api/networks/env_embeddings/#init-embeddings","title":"Init Embeddings","text":"

The init embedding is used to initialize the general embedding of the problem nodes without any solution information. Generally consists of a linear layer that projects the node features to the embedding space.

Classes:

  • TSPInitEmbedding \u2013

    Initial embedding for the Traveling Salesman Problems (TSP).

  • MatNetInitEmbedding \u2013

    Preparing the initial row and column embeddings for MatNet.

  • VRPInitEmbedding \u2013

    Initial embedding for the Vehicle Routing Problems (VRP).

  • PCTSPInitEmbedding \u2013

    Initial embedding for the Prize Collecting Traveling Salesman Problems (PCTSP).

  • OPInitEmbedding \u2013

    Initial embedding for the Orienteering Problems (OP).

  • DPPInitEmbedding \u2013

    Initial embedding for the Decap Placement Problem (DPP), EDA (electronic design automation).

  • MDPPInitEmbedding \u2013

    Initial embedding for the Multi-port Placement Problem (MDPP), EDA (electronic design automation).

  • PDPInitEmbedding \u2013

    Initial embedding for the Pickup and Delivery Problem (PDP).

  • MTSPInitEmbedding \u2013

    Initial embedding for the Multiple Traveling Salesman Problem (mTSP).

  • SMTWTPInitEmbedding \u2013

    Initial embedding for the Single Machine Total Weighted Tardiness Problem (SMTWTP).

  • MDCPDPInitEmbedding \u2013

    Initial embedding for the MDCPDP environment.

Functions:

  • env_init_embedding \u2013

    Get environment initial embedding. The init embedding is used to initialize the general embedding of the problem nodes without any solution information.

"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.TSPInitEmbedding","title":"TSPInitEmbedding","text":"
TSPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Traveling Salesman Problems (TSP). Embed the following node features to the embedding space:

- locs: x, y coordinates of the cities\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(TSPInitEmbedding, self).__init__()\n    node_dim = 2  # x, y\n    self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.MatNetInitEmbedding","title":"MatNetInitEmbedding","text":"
MatNetInitEmbedding(\n    embed_dim: int, mode: str = \"RandomOneHot\"\n)\n

Bases: Module

Preparing the initial row and column embeddings for MatNet.

Reference: https://github.com/yd-kwon/MatNet/blob/782698b60979effe2e7b61283cca155b7cdb727f/ATSP/ATSP_MatNet/ATSPModel.py#L51

Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim: int, mode: str = \"RandomOneHot\") -> None:\n    super().__init__()\n\n    self.embed_dim = embed_dim\n    assert mode in {\n        \"RandomOneHot\",\n        \"Random\",\n    }, \"mode must be one of ['RandomOneHot', 'Random']\"\n    self.mode = mode\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.VRPInitEmbedding","title":"VRPInitEmbedding","text":"
VRPInitEmbedding(\n    embed_dim, linear_bias=True, node_dim: int = 3\n)\n

Bases: Module

Initial embedding for the Vehicle Routing Problems (VRP). Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (depot and customers separately)\n- demand: demand of the customers\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True, node_dim: int = 3):\n    super(VRPInitEmbedding, self).__init__()\n    node_dim = node_dim  # 3: x, y, demand\n    self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n    self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias)  # depot embedding\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.PCTSPInitEmbedding","title":"PCTSPInitEmbedding","text":"
PCTSPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Prize Collecting Traveling Salesman Problems (PCTSP). Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (depot and customers separately)\n- expected_prize: expected prize for visiting the customers.\n    In PCTSP, this is the actual prize. In SPCTSP, this is the expected prize.\n- penalty: penalty for not visiting the customers\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(PCTSPInitEmbedding, self).__init__()\n    node_dim = 4  # x, y, prize, penalty\n    self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n    self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.OPInitEmbedding","title":"OPInitEmbedding","text":"
OPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Orienteering Problems (OP). Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (depot and customers separately)\n- prize: prize for visiting the customers\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(OPInitEmbedding, self).__init__()\n    node_dim = 3  # x, y, prize\n    self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n    self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias)  # depot embedding\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.DPPInitEmbedding","title":"DPPInitEmbedding","text":"
DPPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Decap Placement Problem (DPP), EDA (electronic design automation). Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (cells)\n- probe: index of the (single) probe cell. We embed the euclidean distance from the probe to all cells.\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(DPPInitEmbedding, self).__init__()\n    node_dim = 2  # x, y\n    self.init_embed = nn.Linear(node_dim, embed_dim // 2, linear_bias)  # locs\n    self.init_embed_probe = nn.Linear(1, embed_dim // 2, linear_bias)  # probe\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.MDPPInitEmbedding","title":"MDPPInitEmbedding","text":"
MDPPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Multi-port Placement Problem (MDPP), EDA (electronic design automation). Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (cells)\n- probe: indexes of the probe cells (multiple). We embed the euclidean distance of each cell to the closest probe.\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(MDPPInitEmbedding, self).__init__()\n    node_dim = 2  # x, y\n    self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)  # locs\n    self.init_embed_probe_distance = nn.Linear(\n        1, embed_dim, linear_bias\n    )  # probe_distance\n    self.project_out = nn.Linear(embed_dim * 2, embed_dim, linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.PDPInitEmbedding","title":"PDPInitEmbedding","text":"
PDPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Pickup and Delivery Problem (PDP). Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (depot, pickups and deliveries separately)\n   Note that pickups and deliveries are interleaved in the input.\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(PDPInitEmbedding, self).__init__()\n    node_dim = 2  # x, y\n    self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias)\n    self.init_embed_pick = nn.Linear(node_dim * 2, embed_dim, linear_bias)\n    self.init_embed_delivery = nn.Linear(node_dim, embed_dim, linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.MTSPInitEmbedding","title":"MTSPInitEmbedding","text":"
MTSPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Multiple Traveling Salesman Problem (mTSP). Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (depot, cities)\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    \"\"\"NOTE: new made by Fede. May need to be checked\"\"\"\n    super(MTSPInitEmbedding, self).__init__()\n    node_dim = 2  # x, y\n    self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n    self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias)  # depot embedding\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.SMTWTPInitEmbedding","title":"SMTWTPInitEmbedding","text":"
SMTWTPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Single Machine Total Weighted Tardiness Problem (SMTWTP). Embed the following node features to the embedding space:

- job_due_time: due time of the jobs\n- job_weight: weights of the jobs\n- job_process_time: the processing time of jobs\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(SMTWTPInitEmbedding, self).__init__()\n    node_dim = 3  # job_due_time, job_weight, job_process_time\n    self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.MDCPDPInitEmbedding","title":"MDCPDPInitEmbedding","text":"
MDCPDPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the MDCPDP environment. Embed the following node features to the embedding space:

- locs: x, y coordinates of the nodes (depot, pickups and deliveries separately)\n   Note that pickups and deliveries are interleaved in the input.\n
Source code in rl4co/models/nn/env_embeddings/init.py
def __init__(self, embed_dim, linear_bias=True):\n    super(MDCPDPInitEmbedding, self).__init__()\n    node_dim = 2  # x, y\n    self.init_embed_depot = nn.Linear(2, embed_dim, linear_bias)\n    self.init_embed_pick = nn.Linear(node_dim * 2, embed_dim, linear_bias)\n    self.init_embed_delivery = nn.Linear(node_dim, embed_dim, linear_bias)\n
"},{"location":"docs/content/api/networks/env_embeddings/#models.nn.env_embeddings.init.env_init_embedding","title":"env_init_embedding","text":"
env_init_embedding(env_name: str, config: dict) -> Module\n

Get environment initial embedding. The init embedding is used to initialize the general embedding of the problem nodes without any solution information. Consists of a linear layer that projects the node features to the embedding space.

Parameters:

  • env_name (str) \u2013

    Name of the environment, used as the key to look up its init embedding class.

  • config (dict) \u2013

    A dictionary of configuration options for the environment.

Source code in rl4co/models/nn/env_embeddings/init.py
def env_init_embedding(env_name: str, config: dict) -> nn.Module:\n    \"\"\"Get environment initial embedding. The init embedding is used to initialize the\n    general embedding of the problem nodes without any solution information.\n    Consists of a linear layer that projects the node features to the embedding space.\n\n    Args:\n        env: Environment or its name.\n        config: A dictionary of configuration options for the environment.\n    \"\"\"\n    embedding_registry = {\n        \"tsp\": TSPInitEmbedding,\n        \"atsp\": TSPInitEmbedding,\n        \"matnet\": MatNetInitEmbedding,\n        \"cvrp\": VRPInitEmbedding,\n        \"cvrptw\": VRPTWInitEmbedding,\n        \"svrp\": SVRPInitEmbedding,\n        \"sdvrp\": VRPInitEmbedding,\n        \"pctsp\": PCTSPInitEmbedding,\n        \"spctsp\": PCTSPInitEmbedding,\n        \"op\": OPInitEmbedding,\n        \"dpp\": DPPInitEmbedding,\n        \"mdpp\": MDPPInitEmbedding,\n        \"pdp\": PDPInitEmbedding,\n        \"pdp_ruin_repair\": TSPInitEmbedding,\n        \"tsp_kopt\": TSPInitEmbedding,\n        \"mtsp\": MTSPInitEmbedding,\n        \"smtwtp\": SMTWTPInitEmbedding,\n        \"mdcpdp\": MDCPDPInitEmbedding,\n        \"fjsp\": FJSPInitEmbedding,\n        \"jssp\": FJSPInitEmbedding,\n        \"mtvrp\": MTVRPInitEmbedding,\n    }\n\n    if env_name not in embedding_registry:\n        raise ValueError(\n            f\"Unknown environment name '{env_name}'. Available init embeddings: {embedding_registry.keys()}\"\n        )\n\n    return embedding_registry[env_name](**config)\n
"},{"location":"docs/content/api/networks/improvement_policies/","title":"Improvement policies","text":""},{"location":"docs/content/api/networks/improvement_policies/#improvement-policies-base-classes","title":"Improvement Policies (Base Classes)","text":"

Classes:

  • ImprovementEncoder \u2013

    Base class for the encoder of improvement models

  • ImprovementDecoder \u2013

    Base decoder model for improvement models. The decoder is responsible for generating the logits of the action

  • ImprovementPolicy \u2013

    Base class for improvement policies. Improvement policies take an instance + a solution as input and output a specific operator that changes the current solution to a new one.

"},{"location":"docs/content/api/networks/improvement_policies/#models.common.improvement.base.ImprovementEncoder","title":"ImprovementEncoder","text":"
ImprovementEncoder(\n    embed_dim: int = 128,\n    init_embedding: Module = None,\n    pos_embedding: Module = None,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    linear_bias: bool = False,\n)\n

Bases: Module

Base class for the encoder of improvement models

Methods:

  • forward \u2013

    Forward pass of the encoder.

Source code in rl4co/models/common/improvement/base.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    init_embedding: nn.Module = None,\n    pos_embedding: nn.Module = None,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    linear_bias: bool = False,\n):\n    super(ImprovementEncoder, self).__init__()\n\n    if isinstance(env_name, RL4COEnvBase):\n        env_name = env_name.name\n    self.env_name = env_name\n    self.init_embedding = (\n        env_init_embedding(\n            self.env_name, {\"embed_dim\": embed_dim, \"linear_bias\": linear_bias}\n        )\n        if init_embedding is None\n        else init_embedding\n    )\n\n    self.pos_type = pos_type\n    self.pos_embedding = (\n        pos_init_embedding(self.pos_type, {\"embed_dim\": embed_dim})\n        if pos_embedding is None\n        else pos_embedding\n    )\n
"},{"location":"docs/content/api/networks/improvement_policies/#models.common.improvement.base.ImprovementEncoder.forward","title":"forward","text":"
forward(td: TensorDict) -> Tuple[Tensor, Tensor]\n

Forward pass of the encoder. Transform the input TensorDict into a latent representation.

Parameters:

  • td (TensorDict) \u2013

    Input TensorDict containing the environment state

Returns:

  • h ( Tensor ) \u2013

    Latent representation of the input

  • init_h ( Tensor ) \u2013

    Initial embedding of the input

Source code in rl4co/models/common/improvement/base.py
def forward(self, td: TensorDict) -> Tuple[Tensor, Tensor]:\n    \"\"\"Forward pass of the encoder.\n    Transform the input TensorDict into a latent representation.\n\n    Args:\n        td: Input TensorDict containing the environment state\n\n    Returns:\n        h: Latent representation of the input\n        init_h: Initial embedding of the input\n    \"\"\"\n    # Transfer to embedding space (node)\n    init_h = self.init_embedding(td)\n\n    # Transfer to embedding space (solution)\n    init_p = self.pos_embedding(td)\n\n    # Process embedding\n    final_h, final_p = self._encoder_forward(init_h, init_p)\n\n    # Return latent representation and initial embedding\n    return final_h, final_p\n
"},{"location":"docs/content/api/networks/improvement_policies/#models.common.improvement.base.ImprovementDecoder","title":"ImprovementDecoder","text":"

Bases: Module

Base decoder model for improvement models. The decoder is responsible for generating the logits of the action

Methods:

  • forward \u2013

    Obtain logits to perform operators that improve the current solution to the next ones

"},{"location":"docs/content/api/networks/improvement_policies/#models.common.improvement.base.ImprovementDecoder.forward","title":"forward abstractmethod","text":"
forward(\n    td: TensorDict, final_h: Tensor, final_p: Tensor\n) -> Tensor\n

Obtain logits to perform operators that improve the current solution to the next ones

Parameters:

  • td (TensorDict) \u2013

    TensorDict with the current environment state

  • final_h (Tensor) \u2013

    final node embeddings

  • final_p (Tensor) \u2013

    final positional embeddings

Returns:

  • Tensor \u2013

    Tensor containing the logits

Source code in rl4co/models/common/improvement/base.py
@abc.abstractmethod\ndef forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> Tensor:\n    \"\"\"Obtain logits to perform operators that improve the current solution to the next ones\n\n    Args:\n        td: TensorDict with the current environment state\n        final_h: final node embeddings\n        final_p: final positional embeddings\n\n    Returns:\n        Tuple containing the logits\n    \"\"\"\n    raise NotImplementedError(\"Implement me in subclass!\")\n
"},{"location":"docs/content/api/networks/improvement_policies/#models.common.improvement.base.ImprovementPolicy","title":"ImprovementPolicy","text":"

Bases: Module

Base class for improvement policies. Improvement policies take an instance + a solution as input and output a specific operator that changes the current solution to a new one.

\"Improvement\" means that a solution is (potentially) improved to a new one by the model.

Methods:

  • forward \u2013

    Forward pass of the policy.

"},{"location":"docs/content/api/networks/improvement_policies/#models.common.improvement.base.ImprovementPolicy.forward","title":"forward abstractmethod","text":"
forward(\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_entropy: bool = False,\n    return_init_embeds: bool = False,\n    actions=None,\n    **decoding_kwargs\n) -> dict\n

Forward pass of the policy.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the environment state

  • env (Union[str, RL4COEnvBase], default: None ) \u2013

    Environment to use for decoding. If None, the environment is instantiated from env_name. Note that it is more efficient to pass an already instantiated environment each time for fine-grained control

  • phase (str, default: 'train' ) \u2013

    Phase of the algorithm (train, val, test)

  • return_actions (bool, default: True ) \u2013

    Whether to return the actions

  • return_entropy (bool, default: False ) \u2013

    Whether to return the entropy

  • return_init_embeds (bool, default: False ) \u2013

    Whether to return the initial embeddings

  • actions \u2013

    Actions to use for evaluating the policy. If passed, use these actions instead of sampling from the policy to calculate log likelihood

  • decoding_kwargs \u2013

    Keyword arguments for the decoding strategy. See rl4co.utils.decoding.DecodingStrategy for more information.

Returns:

  • out ( dict ) \u2013

    Dictionary containing the reward, log likelihood, and optionally the actions and entropy

Source code in rl4co/models/common/improvement/base.py
@abc.abstractmethod\ndef forward(\n    self,\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_entropy: bool = False,\n    return_init_embeds: bool = False,\n    actions=None,\n    **decoding_kwargs,\n) -> dict:\n    \"\"\"Forward pass of the policy.\n\n    Args:\n        td: TensorDict containing the environment state\n        env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that\n            it is more efficient to pass an already instantiated environment each time for fine-grained control\n        phase: Phase of the algorithm (train, val, test)\n        return_actions: Whether to return the actions\n        return_entropy: Whether to return the entropy\n        return_init_embeds: Whether to return the initial embeddings\n        actions: Actions to use for evaluating the policy.\n            If passed, use these actions instead of sampling from the policy to calculate log likelihood\n        decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.\n\n    Returns:\n        out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy\n    \"\"\"\n    raise NotImplementedError(\"Implement me in subclass!\")\n
"},{"location":"docs/content/api/networks/nn/","title":"Neural Network Modules","text":""},{"location":"docs/content/api/networks/nn/#critic-network","title":"Critic Network","text":""},{"location":"docs/content/api/networks/nn/#models.rl.common.critic.CriticNetwork","title":"CriticNetwork","text":"
CriticNetwork(\n    encoder: Module,\n    value_head: Optional[Module] = None,\n    embed_dim: int = 128,\n    hidden_dim: int = 512,\n    customized: bool = False,\n)\n

Bases: Module

Create a critic network given an encoder (e.g. as the one in the policy network) with a value head to transform the embeddings to a scalar value.

Parameters:

  • encoder (Module) \u2013

    Encoder module to encode the input

  • value_head (Optional[Module], default: None ) \u2013

    Value head to transform the embeddings to a scalar value

  • embed_dim (int, default: 128 ) \u2013

    Dimension of the embeddings of the value head

  • hidden_dim (int, default: 512 ) \u2013

    Dimension of the hidden layer of the value head

Methods:

  • forward \u2013

    Forward pass of the critic network: encode the input in embedding space and return the value

Source code in rl4co/models/rl/common/critic.py
def __init__(\n    self,\n    encoder: nn.Module,\n    value_head: Optional[nn.Module] = None,\n    embed_dim: int = 128,\n    hidden_dim: int = 512,\n    customized: bool = False,\n):\n    super(CriticNetwork, self).__init__()\n\n    self.encoder = encoder\n    if value_head is None:\n        # check if embed dim of encoder is different, if so, use it\n        if getattr(encoder, \"embed_dim\", embed_dim) != embed_dim:\n            log.warning(\n                f\"Found encoder with different embed_dim {encoder.embed_dim} than the value head {embed_dim}. Using encoder embed_dim for value head.\"\n            )\n            embed_dim = getattr(encoder, \"embed_dim\", embed_dim)\n        value_head = nn.Sequential(\n            nn.Linear(embed_dim, hidden_dim), nn.ReLU(), nn.Linear(hidden_dim, 1)\n        )\n    self.value_head = value_head\n    self.customized = customized\n
"},{"location":"docs/content/api/networks/nn/#models.rl.common.critic.CriticNetwork.forward","title":"forward","text":"
forward(\n    x: Union[Tensor, TensorDict], hidden=None\n) -> Tensor\n

Forward pass of the critic network: encode the input in embedding space and return the value

Parameters:

  • x (Union[Tensor, TensorDict]) \u2013

    Input containing the environment state. Can be a Tensor or a TensorDict

Returns:

  • Tensor \u2013

    Value of the input state

Source code in rl4co/models/rl/common/critic.py
def forward(self, x: Union[Tensor, TensorDict], hidden=None) -> Tensor:\n    \"\"\"Forward pass of the critic network: encode the imput in embedding space and return the value\n\n    Args:\n        x: Input containing the environment state. Can be a Tensor or a TensorDict\n\n    Returns:\n        Value of the input state\n    \"\"\"\n    if not self.customized:  # fir for most of costructive tasks\n        h, _ = self.encoder(x)  # [batch_size, N, embed_dim] -> [batch_size, N]\n        return self.value_head(h).mean(1)  # [batch_size, N] -> [batch_size]\n    else:  # custimized encoder and value head with hidden input\n        h = self.encoder(x)  # [batch_size, N, embed_dim] -> [batch_size, N]\n        return self.value_head(h, hidden)\n
"},{"location":"docs/content/api/networks/nn/#graph-neural-networks","title":"Graph Neural Networks","text":""},{"location":"docs/content/api/networks/nn/#models.nn.graph.attnnet.MultiHeadAttentionLayer","title":"MultiHeadAttentionLayer","text":"
MultiHeadAttentionLayer(\n    embed_dim: int,\n    num_heads: int = 8,\n    feedforward_hidden: int = 512,\n    normalization: Optional[str] = \"batch\",\n    bias: bool = True,\n    sdpa_fn: Optional[Callable] = None,\n    moe_kwargs: Optional[dict] = None,\n)\n

Bases: Sequential

Multi-Head Attention Layer with normalization and feed-forward layer

Parameters:

  • embed_dim (int) \u2013

    dimension of the embeddings

  • num_heads (int, default: 8 ) \u2013

    number of heads in the MHA

  • feedforward_hidden (int, default: 512 ) \u2013

    dimension of the hidden layer in the feed-forward layer

  • normalization (Optional[str], default: 'batch' ) \u2013

    type of normalization to use (batch, layer, none)

  • sdpa_fn (Optional[Callable], default: None ) \u2013

    scaled dot product attention function (SDPA)

  • moe_kwargs (Optional[dict], default: None ) \u2013

    Keyword arguments for MoE

Source code in rl4co/models/nn/graph/attnnet.py
def __init__(\n    self,\n    embed_dim: int,\n    num_heads: int = 8,\n    feedforward_hidden: int = 512,\n    normalization: Optional[str] = \"batch\",\n    bias: bool = True,\n    sdpa_fn: Optional[Callable] = None,\n    moe_kwargs: Optional[dict] = None,\n):\n    num_neurons = [feedforward_hidden] if feedforward_hidden > 0 else []\n    if moe_kwargs is not None:\n        ffn = MoE(embed_dim, embed_dim, num_neurons=num_neurons, **moe_kwargs)\n    else:\n        ffn = MLP(input_dim=embed_dim, output_dim=embed_dim, num_neurons=num_neurons, hidden_act=\"ReLU\")\n\n    super(MultiHeadAttentionLayer, self).__init__(\n        SkipConnection(\n            MultiHeadAttention(embed_dim, num_heads, bias=bias, sdpa_fn=sdpa_fn)\n        ),\n        Normalization(embed_dim, normalization),\n        SkipConnection(ffn),\n        Normalization(embed_dim, normalization),\n    )\n
"},{"location":"docs/content/api/networks/nn/#models.nn.graph.attnnet.GraphAttentionNetwork","title":"GraphAttentionNetwork","text":"
GraphAttentionNetwork(\n    num_heads: int,\n    embed_dim: int,\n    num_layers: int,\n    normalization: str = \"batch\",\n    feedforward_hidden: int = 512,\n    sdpa_fn: Optional[Callable] = None,\n    moe_kwargs: Optional[dict] = None,\n)\n

Bases: Module

Graph Attention Network to encode embeddings with a series of layers, each consisting of multi-head attention (MHA), normalization, a feed-forward layer, and a second normalization. Similar to the Transformer encoder, as used in Kool et al. (2019).

Parameters:

  • num_heads (int) \u2013

    number of heads in the MHA

  • embed_dim (int) \u2013

    dimension of the embeddings

  • num_layers (int) \u2013

    number of MHA layers

  • normalization (str, default: 'batch' ) \u2013

    type of normalization to use (batch, layer, none)

  • feedforward_hidden (int, default: 512 ) \u2013

    dimension of the hidden layer in the feed-forward layer

  • sdpa_fn (Optional[Callable], default: None ) \u2013

    scaled dot product attention function (SDPA)

  • moe_kwargs (Optional[dict], default: None ) \u2013

    Keyword arguments for MoE

Methods:

  • forward \u2013

    Forward pass of the encoder

Source code in rl4co/models/nn/graph/attnnet.py
def __init__(\n    self,\n    num_heads: int,\n    embed_dim: int,\n    num_layers: int,\n    normalization: str = \"batch\",\n    feedforward_hidden: int = 512,\n    sdpa_fn: Optional[Callable] = None,\n    moe_kwargs: Optional[dict] = None,\n):\n    super(GraphAttentionNetwork, self).__init__()\n\n    self.layers = nn.Sequential(\n        *(\n            MultiHeadAttentionLayer(\n                embed_dim,\n                num_heads,\n                feedforward_hidden=feedforward_hidden,\n                normalization=normalization,\n                sdpa_fn=sdpa_fn,\n                moe_kwargs=moe_kwargs,\n            )\n            for _ in range(num_layers)\n        )\n    )\n
"},{"location":"docs/content/api/networks/nn/#models.nn.graph.attnnet.GraphAttentionNetwork.forward","title":"forward","text":"
forward(x: Tensor, mask: Optional[Tensor] = None) -> Tensor\n

Forward pass of the encoder

Parameters:

  • x (Tensor) \u2013

    [batch_size, graph_size, embed_dim] initial embeddings to process

  • mask (Optional[Tensor], default: None ) \u2013

    [batch_size, graph_size, graph_size] mask for the input embeddings. Not yet supported: it must be None, otherwise an assertion fails.

Source code in rl4co/models/nn/graph/attnnet.py
def forward(self, x: Tensor, mask: Optional[Tensor] = None) -> Tensor:\n    \"\"\"Forward pass of the encoder\n\n    Args:\n        x: [batch_size, graph_size, embed_dim] initial embeddings to process\n        mask: [batch_size, graph_size, graph_size] mask for the input embeddings. Unused for now.\n    \"\"\"\n    assert mask is None, \"Mask not yet supported!\"\n    h = self.layers(x)\n    return h\n
"},{"location":"docs/content/api/networks/nn/#models.nn.graph.gcn.GCNEncoder","title":"GCNEncoder","text":"
GCNEncoder(\n    env_name: str,\n    embed_dim: int,\n    num_layers: int,\n    init_embedding: Module = None,\n    residual: bool = True,\n    edge_idx_fn: EdgeIndexFnSignature = None,\n    dropout: float = 0.5,\n    bias: bool = True,\n)\n

Bases: Module

Graph Convolutional Network to encode embeddings with a series of GCN layers from the pytorch geometric package

Parameters:

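  • env_name (str) \u2013

    environment name, used to build the default initial embedding when init_embedding is None

  • embed_dim (int) \u2013

    dimension of the embeddings

  • num_layers (int) \u2013

    number of GCN layers

  • init_embedding (Module, default: None ) \u2013

    module producing the initial node embeddings; if None, it is created from env_name and embed_dim

  • residual (bool, default: True ) \u2013

    whether to use residual connection

  • edge_idx_fn (EdgeIndexFnSignature, default: None ) \u2013

    function returning the edge indices for the input; if None, a fully connected graph is assumed

  • dropout (float, default: 0.5 ) \u2013

    dropout probability applied after every GCN layer except the last

  • bias (bool, default: True ) \u2013

    whether the GCN layers use a bias term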

Methods:

  • forward \u2013

    Forward pass of the encoder.

Source code in rl4co/models/nn/graph/gcn.py
def __init__(\n    self,\n    env_name: str,\n    embed_dim: int,\n    num_layers: int,\n    init_embedding: nn.Module = None,\n    residual: bool = True,\n    edge_idx_fn: EdgeIndexFnSignature = None,\n    dropout: float = 0.5,\n    bias: bool = True,\n):\n    super().__init__()\n\n    self.env_name = env_name\n    self.embed_dim = embed_dim\n    self.residual = residual\n    self.dropout = dropout\n\n    self.init_embedding = (\n        env_init_embedding(self.env_name, {\"embed_dim\": embed_dim})\n        if init_embedding is None\n        else init_embedding\n    )\n\n    if edge_idx_fn is None:\n        log.warning(\"No edge indices passed. Assume a fully connected graph\")\n        edge_idx_fn = edge_idx_fn_wrapper\n\n    self.edge_idx_fn = edge_idx_fn\n\n    # Define the GCN layers\n    self.gcn_layers = nn.ModuleList(\n        [GCNConv(embed_dim, embed_dim, bias=bias) for _ in range(num_layers)]\n    )\n
"},{"location":"docs/content/api/networks/nn/#models.nn.graph.gcn.GCNEncoder.forward","title":"forward","text":"
forward(\n    td: TensorDict, mask: Union[Tensor, None] = None\n) -> Tuple[Tensor, Tensor]\n

Forward pass of the encoder. Transform the input TensorDict into a latent representation.

Parameters:

  • td (TensorDict) \u2013

    Input TensorDict containing the environment state

  • mask (Union[Tensor, None], default: None ) \u2013

    Currently unused: the mask is not applied in the forward pass

Returns:

  • h ( Tensor ) \u2013

    Latent representation of the input

  • init_h ( Tensor ) \u2013

    Initial embedding of the input

Source code in rl4co/models/nn/graph/gcn.py
def forward(\n    self, td: TensorDict, mask: Union[Tensor, None] = None\n) -> Tuple[Tensor, Tensor]:\n    \"\"\"Forward pass of the encoder.\n    Transform the input TensorDict into a latent representation.\n\n    Args:\n        td: Input TensorDict containing the environment state\n        mask: Mask to apply to the attention\n\n    Returns:\n        h: Latent representation of the input\n        init_h: Initial embedding of the input\n    \"\"\"\n    # Transfer to embedding space\n    init_h = self.init_embedding(td)\n    bs, num_nodes, emb_dim = init_h.shape\n    # (bs*num_nodes, emb_dim)\n    update_node_feature = init_h.reshape(-1, emb_dim)\n    # shape=(2, num_edges)\n    edge_index = self.edge_idx_fn(td, num_nodes)\n\n    for layer in self.gcn_layers[:-1]:\n        update_node_feature = layer(update_node_feature, edge_index)\n        update_node_feature = F.relu(update_node_feature)\n        update_node_feature = F.dropout(\n            update_node_feature, training=self.training, p=self.dropout\n        )\n\n    # last layer without relu activation and dropout\n    update_node_feature = self.gcn_layers[-1](update_node_feature, edge_index)\n\n    # De-batch the graph\n    update_node_feature = update_node_feature.view(bs, num_nodes, emb_dim)\n\n    # Residual\n    if self.residual:\n        update_node_feature = update_node_feature + init_h\n\n    return update_node_feature, init_h\n
"},{"location":"docs/content/api/networks/nn/#models.nn.graph.mpnn.MessagePassingEncoder","title":"MessagePassingEncoder","text":"
MessagePassingEncoder(\n    env_name: str,\n    embed_dim: int,\n    num_nodes: int,\n    num_layers: int,\n    init_embedding: Module = None,\n    aggregation: str = \"add\",\n    self_loop: bool = False,\n    residual: bool = True,\n)\n

Bases: Module

Source code in rl4co/models/nn/graph/mpnn.py
def __init__(\n    self,\n    env_name: str,\n    embed_dim: int,\n    num_nodes: int,\n    num_layers: int,\n    init_embedding: nn.Module = None,\n    aggregation: str = \"add\",\n    self_loop: bool = False,\n    residual: bool = True,\n):\n    \"\"\"\n    Note:\n        - Support fully connected graph for now.\n    \"\"\"\n    super(MessagePassingEncoder, self).__init__()\n\n    self.env_name = env_name\n\n    self.init_embedding = (\n        env_init_embedding(self.env_name, {\"embed_dim\": embed_dim})\n        if init_embedding is None\n        else init_embedding\n    )\n\n    # Generate edge index for a fully connected graph\n    adj_matrix = torch.ones(num_nodes, num_nodes)\n    if self_loop:\n        adj_matrix.fill_diagonal_(0)  # No self-loops\n    self.edge_index = torch.permute(torch.nonzero(adj_matrix), (1, 0))\n\n    # Init message passing models\n    self.mpnn_layers = nn.ModuleList(\n        [\n            MessagePassingLayer(\n                node_indim=embed_dim,\n                node_outdim=embed_dim,\n                edge_indim=1,\n                edge_outdim=1,\n                aggregation=aggregation,\n                residual=residual,\n            )\n            for _ in range(num_layers)\n        ]\n    )\n\n    # Record parameters\n    self.self_loop = self_loop\n
"},{"location":"docs/content/api/networks/nn/#attention-mechanisms","title":"Attention Mechanisms","text":"

Classes:

  • MultiHeadAttention \u2013

    PyTorch native implementation of Flash Multi-Head Attention with automatic mixed precision support.

  • MultiHeadCrossAttention \u2013

    PyTorch native implementation of Flash Multi-Head Cross Attention with automatic mixed precision support.

  • PointerAttention \u2013

    Calculate logits given query, key and value and logit key.

  • PointerAttnMoE \u2013

    Calculate logits given query, key and value and logit key.

  • MultiHeadCompat \u2013
  • PolyNetAttention \u2013

    Calculate logits given query, key and value and logit key.

Functions:

  • scaled_dot_product_attention_simple \u2013

    Simple (exact) Scaled Dot-Product Attention in RL4CO without customized kernels (i.e. no Flash Attention).

"},{"location":"docs/content/api/networks/nn/#models.nn.attention.MultiHeadAttention","title":"MultiHeadAttention","text":"
MultiHeadAttention(\n    embed_dim: int,\n    num_heads: int,\n    bias: bool = True,\n    attention_dropout: float = 0.0,\n    causal: bool = False,\n    device: str = None,\n    dtype: dtype = None,\n    sdpa_fn: Optional[Callable] = None,\n)\n

Bases: Module

PyTorch native implementation of Flash Multi-Head Attention with automatic mixed precision support. Uses PyTorch's native scaled_dot_product_attention implementation, available from 2.0

Note

If scaled_dot_product_attention is not available, use custom implementation of scaled_dot_product_attention without Flash Attention.

Parameters:

  • embed_dim (int) \u2013

    total dimension of the model

  • num_heads (int) \u2013

    number of heads

  • bias (bool, default: True ) \u2013

    whether to use bias

  • attention_dropout (float, default: 0.0 ) \u2013

    dropout rate for attention weights

  • causal (bool, default: False ) \u2013

    whether to apply causal mask to attention scores

  • device (str, default: None ) \u2013

    torch device

  • dtype (dtype, default: None ) \u2013

    torch dtype

  • sdpa_fn (Optional[Callable], default: None ) \u2013

    scaled dot product attention function (SDPA) implementation

Methods:

  • forward \u2013

    x: (batch, seqlen, hidden_dim) (where hidden_dim = num heads * head dim)

Source code in rl4co/models/nn/attention.py
def __init__(\n    self,\n    embed_dim: int,\n    num_heads: int,\n    bias: bool = True,\n    attention_dropout: float = 0.0,\n    causal: bool = False,\n    device: str = None,\n    dtype: torch.dtype = None,\n    sdpa_fn: Optional[Callable] = None,\n) -> None:\n    factory_kwargs = {\"device\": device, \"dtype\": dtype}\n    super().__init__()\n    self.embed_dim = embed_dim\n    self.causal = causal\n    self.attention_dropout = attention_dropout\n    self.sdpa_fn = sdpa_fn if sdpa_fn is not None else scaled_dot_product_attention\n\n    self.num_heads = num_heads\n    assert self.embed_dim % num_heads == 0, \"self.kdim must be divisible by num_heads\"\n    self.head_dim = self.embed_dim // num_heads\n    assert (\n        self.head_dim % 8 == 0 and self.head_dim <= 128\n    ), \"Only support head_dim <= 128 and divisible by 8\"\n\n    self.Wqkv = nn.Linear(embed_dim, 3 * embed_dim, bias=bias, **factory_kwargs)\n    self.out_proj = nn.Linear(embed_dim, embed_dim, bias=bias, **factory_kwargs)\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.MultiHeadAttention.forward","title":"forward","text":"
forward(x, attn_mask=None)\n

x: (batch, seqlen, hidden_dim) (where hidden_dim = num heads * head dim) attn_mask: bool tensor of shape (batch, seqlen)

Source code in rl4co/models/nn/attention.py
def forward(self, x, attn_mask=None):\n    \"\"\"x: (batch, seqlen, hidden_dim) (where hidden_dim = num heads * head dim)\n    attn_mask: bool tensor of shape (batch, seqlen)\n    \"\"\"\n    # Project query, key, value\n    q, k, v = rearrange(\n        self.Wqkv(x), \"b s (three h d) -> three b h s d\", three=3, h=self.num_heads\n    ).unbind(dim=0)\n\n    if attn_mask is not None:\n        attn_mask = (\n            attn_mask.unsqueeze(1)\n            if attn_mask.ndim == 3\n            else attn_mask.unsqueeze(1).unsqueeze(2)\n        )\n\n    # Scaled dot product attention\n    out = self.sdpa_fn(\n        q,\n        k,\n        v,\n        attn_mask=attn_mask,\n        dropout_p=self.attention_dropout,\n    )\n    return self.out_proj(rearrange(out, \"b h s d -> b s (h d)\"))\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.MultiHeadCrossAttention","title":"MultiHeadCrossAttention","text":"
MultiHeadCrossAttention(\n    embed_dim: int,\n    num_heads: int,\n    bias: bool = False,\n    attention_dropout: float = 0.0,\n    device: str = None,\n    dtype: dtype = None,\n    sdpa_fn: Optional[Union[Callable, Module]] = None,\n)\n

Bases: Module

PyTorch native implementation of Flash Multi-Head Cross Attention with automatic mixed precision support. Uses PyTorch's native scaled_dot_product_attention implementation, available from 2.0

Note

If scaled_dot_product_attention is not available, use custom implementation of scaled_dot_product_attention without Flash Attention.

Parameters:

  • embed_dim (int) \u2013

    total dimension of the model

  • num_heads (int) \u2013

    number of heads

  • bias (bool, default: False ) \u2013

    whether to use bias

  • attention_dropout (float, default: 0.0 ) \u2013

    dropout rate for attention weights

  • device (str, default: None ) \u2013

    torch device

  • dtype (dtype, default: None ) \u2013

    torch dtype

  • sdpa_fn (Optional[Union[Callable, Module]], default: None ) \u2013

    scaled dot product attention function (SDPA)

Source code in rl4co/models/nn/attention.py
def __init__(\n    self,\n    embed_dim: int,\n    num_heads: int,\n    bias: bool = False,\n    attention_dropout: float = 0.0,\n    device: str = None,\n    dtype: torch.dtype = None,\n    sdpa_fn: Optional[Union[Callable, nn.Module]] = None,\n) -> None:\n    factory_kwargs = {\"device\": device, \"dtype\": dtype}\n    super().__init__()\n    self.embed_dim = embed_dim\n    self.attention_dropout = attention_dropout\n\n    # Default to `scaled_dot_product_attention` if `sdpa_fn` is not provided\n    if sdpa_fn is None:\n        sdpa_fn = sdpa_fn_wrapper\n    self.sdpa_fn = sdpa_fn\n\n    self.num_heads = num_heads\n    assert self.embed_dim % num_heads == 0, \"self.kdim must be divisible by num_heads\"\n    self.head_dim = self.embed_dim // num_heads\n    assert (\n        self.head_dim % 8 == 0 and self.head_dim <= 128\n    ), \"Only support head_dim <= 128 and divisible by 8\"\n\n    self.Wq = nn.Linear(embed_dim, embed_dim, bias=bias, **factory_kwargs)\n    self.Wkv = nn.Linear(embed_dim, 2 * embed_dim, bias=bias, **factory_kwargs)\n    self.out_proj = nn.Linear(embed_dim, embed_dim, bias=bias, **factory_kwargs)\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.PointerAttention","title":"PointerAttention","text":"
PointerAttention(\n    embed_dim: int,\n    num_heads: int,\n    mask_inner: bool = True,\n    out_bias: bool = False,\n    check_nan: bool = True,\n    sdpa_fn: Optional[Callable] = None,\n    **kwargs\n)\n

Bases: Module

Calculate logits given query, key and value and logit key. This follows the pointer mechanism of Vinyals et al. (2015) (https://arxiv.org/abs/1506.03134).

Note

With Flash Attention, masking is not supported

Performs the following
  1. Apply cross attention to get the heads
  2. Project heads to get glimpse
  3. Compute attention score between glimpse and logit key

Parameters:

  • embed_dim (int) \u2013

    total dimension of the model

  • num_heads (int) \u2013

    number of heads

  • mask_inner (bool, default: True ) \u2013

    whether to mask inner attention

  • out_bias (bool, default: False ) \u2013

    whether to use bias in the output projection

  • check_nan (bool, default: True ) \u2013

    whether to check for NaNs in logits

  • sdpa_fn (Optional[Callable], default: None ) \u2013

    scaled dot product attention function (SDPA) implementation

Methods:

  • forward \u2013

    Compute attention logits given query, key, value, logit key and attention mask.

Source code in rl4co/models/nn/attention.py
def __init__(\n    self,\n    embed_dim: int,\n    num_heads: int,\n    mask_inner: bool = True,\n    out_bias: bool = False,\n    check_nan: bool = True,\n    sdpa_fn: Optional[Callable] = None,\n    **kwargs,\n):\n    super(PointerAttention, self).__init__()\n    self.num_heads = num_heads\n    self.mask_inner = mask_inner\n\n    # Projection - query, key, value already include projections\n    self.project_out = nn.Linear(embed_dim, embed_dim, bias=out_bias)\n    self.sdpa_fn = sdpa_fn if sdpa_fn is not None else scaled_dot_product_attention\n    self.check_nan = check_nan\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.PointerAttention.forward","title":"forward","text":"
forward(query, key, value, logit_key, attn_mask=None)\n

Compute attention logits given query, key, value, logit key and attention mask.

Parameters:

  • query \u2013

    query tensor of shape [B, ..., L, E]

  • key \u2013

    key tensor of shape [B, ..., S, E]

  • value \u2013

    value tensor of shape [B, ..., S, E]

  • logit_key \u2013

    logit key tensor of shape [B, ..., S, E]

  • attn_mask \u2013

    attention mask tensor of shape [B, ..., S]. Note that True means that the value should take part in attention as described in the PyTorch Documentation

Source code in rl4co/models/nn/attention.py
def forward(self, query, key, value, logit_key, attn_mask=None):\n    \"\"\"Compute attention logits given query, key, value, logit key and attention mask.\n\n    Args:\n        query: query tensor of shape [B, ..., L, E]\n        key: key tensor of shape [B, ..., S, E]\n        value: value tensor of shape [B, ..., S, E]\n        logit_key: logit key tensor of shape [B, ..., S, E]\n        attn_mask: attention mask tensor of shape [B, ..., S]. Note that `True` means that the value _should_ take part in attention\n            as described in the [PyTorch Documentation](https://pytorch.org/docs/stable/generated/torch.nn.functional.scaled_dot_product_attention.html)\n    \"\"\"\n    # Compute inner multi-head attention with no projections.\n    heads = self._inner_mha(query, key, value, attn_mask)\n    glimpse = self._project_out(heads, attn_mask)\n\n    # Batch matrix multiplication to compute logits (batch_size, num_steps, graph_size)\n    # bmm is slightly faster than einsum and matmul\n    logits = (torch.bmm(glimpse, logit_key.squeeze(-2).transpose(-2, -1))).squeeze(\n        -2\n    ) / math.sqrt(glimpse.size(-1))\n\n    if self.check_nan:\n        assert not torch.isnan(logits).any(), \"Logits contain NaNs\"\n\n    return logits\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.PointerAttnMoE","title":"PointerAttnMoE","text":"
PointerAttnMoE(\n    embed_dim: int,\n    num_heads: int,\n    mask_inner: bool = True,\n    out_bias: bool = False,\n    check_nan: bool = True,\n    sdpa_fn: Optional[Callable] = None,\n    moe_kwargs: Optional[dict] = None,\n)\n

Bases: PointerAttention

Calculate logits given query, key and value and logit key. This follows the pointer mechanism of Vinyals et al. (2015) https://arxiv.org/abs/1506.03134, and the MoE gating mechanism of Zhou et al. (2024) https://arxiv.org/abs/2405.01029.

Note

With Flash Attention, masking is not supported

Performs the following
  1. Apply cross attention to get the heads
  2. Project heads to get glimpse
  3. Compute attention score between glimpse and logit key

Parameters:

  • embed_dim (int) \u2013

    total dimension of the model

  • num_heads (int) \u2013

    number of heads

  • mask_inner (bool, default: True ) \u2013

    whether to mask inner attention

  • out_bias (bool, default: False ) \u2013

    whether to use bias in the output projection

  • check_nan (bool, default: True ) \u2013

    whether to check for NaNs in logits

  • sdpa_fn (Optional[Callable], default: None ) \u2013

    scaled dot product attention function (SDPA) implementation

  • moe_kwargs (Optional[dict], default: None ) \u2013

    Keyword arguments for MoE

Source code in rl4co/models/nn/attention.py
def __init__(\n    self,\n    embed_dim: int,\n    num_heads: int,\n    mask_inner: bool = True,\n    out_bias: bool = False,\n    check_nan: bool = True,\n    sdpa_fn: Optional[Callable] = None,\n    moe_kwargs: Optional[dict] = None,\n):\n    super(PointerAttnMoE, self).__init__(\n        embed_dim, num_heads, mask_inner, out_bias, check_nan, sdpa_fn\n    )\n    self.moe_kwargs = moe_kwargs\n\n    self.project_out = None\n    self.project_out_moe = MoE(\n        embed_dim, embed_dim, num_neurons=[], out_bias=out_bias, **moe_kwargs\n    )\n    if self.moe_kwargs[\"light_version\"]:\n        self.dense_or_moe = nn.Linear(embed_dim, 2, bias=False)\n        self.project_out = nn.Linear(embed_dim, embed_dim, bias=out_bias)\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.MultiHeadCompat","title":"MultiHeadCompat","text":"
MultiHeadCompat(\n    n_heads,\n    input_dim,\n    embed_dim=None,\n    val_dim=None,\n    key_dim=None,\n)\n

Bases: Module

Methods:

  • forward \u2013

    Compute multi-head compatibility scores between queries q (batch_size, n_query, input_dim) and data h.

Source code in rl4co/models/nn/attention.py
def __init__(self, n_heads, input_dim, embed_dim=None, val_dim=None, key_dim=None):\n    super(MultiHeadCompat, self).__init__()\n\n    if val_dim is None:\n        # assert embed_dim is not None, \"Provide either embed_dim or val_dim\"\n        val_dim = embed_dim // n_heads\n    if key_dim is None:\n        key_dim = val_dim\n\n    self.n_heads = n_heads\n    self.input_dim = input_dim\n    self.embed_dim = embed_dim\n    self.val_dim = val_dim\n    self.key_dim = key_dim\n\n    self.W_query = nn.Parameter(torch.Tensor(n_heads, input_dim, key_dim))\n    self.W_key = nn.Parameter(torch.Tensor(n_heads, input_dim, key_dim))\n\n    self.init_parameters()\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.MultiHeadCompat.forward","title":"forward","text":"
forward(q, h=None, mask=None)\n

:param q: queries (batch_size, n_query, input_dim) :param h: data (batch_size, graph_size, input_dim) :param mask: mask (batch_size, n_query, graph_size) or viewable as that (i.e. can be 2 dim if n_query == 1) Mask should contain 1 if attention is not possible (i.e. mask is negative adjacency) :return:

Source code in rl4co/models/nn/attention.py
def forward(self, q, h=None, mask=None):\n    \"\"\"\n\n    :param q: queries (batch_size, n_query, input_dim)\n    :param h: data (batch_size, graph_size, input_dim)\n    :param mask: mask (batch_size, n_query, graph_size) or viewable as that (i.e. can be 2 dim if n_query == 1)\n    Mask should contain 1 if attention is not possible (i.e. mask is negative adjacency)\n    :return:\n    \"\"\"\n\n    if h is None:\n        h = q  # compute self-attention\n\n    # h should be (batch_size, graph_size, input_dim)\n    batch_size, graph_size, input_dim = h.size()\n    n_query = q.size(1)\n\n    hflat = h.contiguous().view(-1, input_dim)  #################   reshape\n    qflat = q.contiguous().view(-1, input_dim)\n\n    # last dimension can be different for keys and values\n    shp = (self.n_heads, batch_size, graph_size, -1)\n    shp_q = (self.n_heads, batch_size, n_query, -1)\n\n    # Calculate queries, (n_heads, n_query, graph_size, key/val_size)\n    Q = torch.matmul(qflat, self.W_query).view(shp_q)\n    K = torch.matmul(hflat, self.W_key).view(shp)\n\n    # Calculate compatibility (n_heads, batch_size, n_query, graph_size)\n    compatibility_s2n = torch.matmul(Q, K.transpose(2, 3))\n\n    return compatibility_s2n\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.PolyNetAttention","title":"PolyNetAttention","text":"
PolyNetAttention(\n    k: int,\n    embed_dim: int,\n    poly_layer_dim: int,\n    num_heads: int,\n    **kwargs\n)\n

Bases: PointerAttention

Calculate logits given query, key and value and logit key. This implements a modified version of the pointer mechanism of Vinyals et al. (2015) (https://arxiv.org/abs/1506.03134) as described in Hottung et al. (2024) (https://arxiv.org/abs/2402.14048). PolyNetAttention conditions the attention logits on a set of k different binary vectors, allowing it to learn k different solution strategies.

Note

With Flash Attention, masking is not supported

Performs the following
  1. Apply cross attention to get the heads
  2. Project heads to get glimpse
  3. Apply PolyNet layers
  4. Compute attention score between glimpse and logit key

Parameters:

  • k (int) \u2013

    Number of unique bit vectors used to compute attention score

  • embed_dim (int) \u2013

    total dimension of the model

  • poly_layer_dim (int) \u2013

    Dimension of the PolyNet layers

  • num_heads (int) \u2013

    number of heads

  • mask_inner \u2013

    whether to mask inner attention

  • linear_bias \u2013

    whether to use bias in linear projection

  • check_nan \u2013

    whether to check for NaNs in logits

  • sdpa_fn \u2013

    scaled dot product attention function (SDPA) implementation

Methods:

  • forward \u2013

    Compute attention logits given query, key, value, logit key and attention mask.

Source code in rl4co/models/nn/attention.py
def __init__(\n    self, k: int, embed_dim: int, poly_layer_dim: int, num_heads: int, **kwargs\n):\n    super(PolyNetAttention, self).__init__(embed_dim, num_heads, **kwargs)\n\n    self.k = k\n    self.binary_vector_dim = math.ceil(math.log2(k))\n    self.binary_vectors = torch.nn.Parameter(\n        torch.Tensor(\n            list(itertools.product([0, 1], repeat=self.binary_vector_dim))[:k]\n        ),\n        requires_grad=False,\n    )\n\n    self.poly_layer_1 = nn.Linear(embed_dim + self.binary_vector_dim, poly_layer_dim)\n    self.poly_layer_2 = nn.Linear(poly_layer_dim, embed_dim)\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.PolyNetAttention.forward","title":"forward","text":"
forward(query, key, value, logit_key, attn_mask=None)\n

Compute attention logits given query, key, value, logit key and attention mask.

Parameters:

  • query \u2013

    query tensor of shape [B, ..., L, E]

  • key \u2013

    key tensor of shape [B, ..., S, E]

  • value \u2013

    value tensor of shape [B, ..., S, E]

  • logit_key \u2013

    logit key tensor of shape [B, ..., S, E]

  • attn_mask \u2013

    attention mask tensor of shape [B, ..., S]. Note that True means that the value should take part in attention as described in the PyTorch Documentation

Source code in rl4co/models/nn/attention.py
def forward(self, query, key, value, logit_key, attn_mask=None):\n    \"\"\"Compute attention logits given query, key, value, logit key and attention mask.\n\n    Args:\n        query: query tensor of shape [B, ..., L, E]\n        key: key tensor of shape [B, ..., S, E]\n        value: value tensor of shape [B, ..., S, E]\n        logit_key: logit key tensor of shape [B, ..., S, E]\n        attn_mask: attention mask tensor of shape [B, ..., S]. Note that `True` means that the value _should_ take part in attention\n            as described in the [PyTorch Documentation](https://pytorch.org/docs/stable/generated/torch.nn.functional.scaled_dot_product_attention.html)\n    \"\"\"\n    # Compute inner multi-head attention with no projections.\n    heads = self._inner_mha(query, key, value, attn_mask)\n    glimpse = self.project_out(heads)\n\n    num_solutions = glimpse.shape[1]\n    z = self.binary_vectors.repeat(math.ceil(num_solutions / self.k), 1)[\n        :num_solutions\n    ]\n    z = z[None].expand(glimpse.shape[0], num_solutions, self.binary_vector_dim)\n\n    # PolyNet layers\n    poly_out = self.poly_layer_1(torch.cat((glimpse, z), dim=2))\n    poly_out = F.relu(poly_out)\n    poly_out = self.poly_layer_2(poly_out)\n\n    glimpse += poly_out\n\n    # Batch matrix multiplication to compute logits (batch_size, num_steps, graph_size)\n    # bmm is slightly faster than einsum and matmul\n    logits = (torch.bmm(glimpse, logit_key.squeeze(-2).transpose(-2, -1))).squeeze(\n        -2\n    ) / math.sqrt(glimpse.size(-1))\n\n    if self.check_nan:\n        assert not torch.isnan(logits).any(), \"Logits contain NaNs\"\n\n    return logits\n
"},{"location":"docs/content/api/networks/nn/#models.nn.attention.scaled_dot_product_attention_simple","title":"scaled_dot_product_attention_simple","text":"
scaled_dot_product_attention_simple(\n    q, k, v, attn_mask=None, dropout_p=0.0, is_causal=False\n)\n

Simple (exact) Scaled Dot-Product Attention in RL4CO without customized kernels (i.e. no Flash Attention).

Source code in rl4co/models/nn/attention.py
def scaled_dot_product_attention_simple(\n    q, k, v, attn_mask=None, dropout_p=0.0, is_causal=False\n):\n    \"\"\"Simple (exact) Scaled Dot-Product Attention in RL4CO without customized kernels (i.e. no Flash Attention).\"\"\"\n\n    # Check for causal and attn_mask conflict\n    if is_causal and attn_mask is not None:\n        raise ValueError(\"Cannot set both is_causal and attn_mask\")\n\n    # Calculate scaled dot product\n    scores = torch.matmul(q, k.transpose(-2, -1)) / (k.size(-1) ** 0.5)\n\n    # Apply the provided attention mask\n    if attn_mask is not None:\n        if attn_mask.dtype == torch.bool:\n            scores.masked_fill_(~attn_mask, float(\"-inf\"))\n        else:\n            scores += attn_mask\n\n    # Apply causal mask\n    if is_causal:\n        s, l_ = scores.size(-2), scores.size(-1)\n        mask = torch.triu(torch.ones((s, l_), device=scores.device), diagonal=1)\n        scores.masked_fill_(mask.bool(), float(\"-inf\"))\n\n    # Softmax to get attention weights\n    attn_weights = F.softmax(scores, dim=-1)\n\n    # Apply dropout\n    if dropout_p > 0.0:\n        attn_weights = F.dropout(attn_weights, p=dropout_p)\n\n    # Compute the weighted sum of values\n    return torch.matmul(attn_weights, v)\n
"},{"location":"docs/content/api/networks/nn/#multi-layer-perceptron","title":"Multi-Layer Perceptron","text":""},{"location":"docs/content/api/networks/nn/#models.nn.mlp.MLP","title":"MLP","text":"
MLP(\n    input_dim: int,\n    output_dim: int,\n    num_neurons: List[int] = [64, 32],\n    dropout_probs: Union[None, List[float]] = None,\n    hidden_act: str = \"ReLU\",\n    out_act: str = \"Identity\",\n    input_norm: str = \"None\",\n    output_norm: str = \"None\",\n)\n

Bases: Module

Source code in rl4co/models/nn/mlp.py
def __init__(\n    self,\n    input_dim: int,\n    output_dim: int,\n    num_neurons: List[int] = [64, 32],\n    dropout_probs: Union[None, List[float]] = None,\n    hidden_act: str = \"ReLU\",\n    out_act: str = \"Identity\",\n    input_norm: str = \"None\",\n    output_norm: str = \"None\",\n):\n    super(MLP, self).__init__()\n\n    assert input_norm in [\"Batch\", \"Layer\", \"None\"]\n    assert output_norm in [\"Batch\", \"Layer\", \"None\"]\n\n    if dropout_probs is None:\n        dropout_probs = [0.0] * len(num_neurons)\n    elif len(dropout_probs) != len(num_neurons):\n        log.info(\n            \"dropout_probs List length should match the num_neurons List length for MLP, dropouts set to False instead\"\n        )\n        dropout_probs = [0.0] * len(num_neurons)\n\n    self.input_dim = input_dim\n    self.output_dim = output_dim\n    self.num_neurons = num_neurons\n    self.hidden_act = getattr(nn, hidden_act)()\n    self.out_act = getattr(nn, out_act)()\n    self.dropouts = []\n    for i in range(len(dropout_probs)):\n        self.dropouts.append(nn.Dropout(p=dropout_probs[i]))\n\n    input_dims = [input_dim] + num_neurons\n    output_dims = num_neurons + [output_dim]\n\n    self.lins = nn.ModuleList()\n    for i, (in_dim, out_dim) in enumerate(zip(input_dims, output_dims)):\n        self.lins.append(nn.Linear(in_dim, out_dim))\n\n    self.input_norm = self._get_norm_layer(input_norm, input_dim)\n    self.output_norm = self._get_norm_layer(output_norm, output_dim)\n
"},{"location":"docs/content/api/networks/nn/#operations","title":"Operations","text":""},{"location":"docs/content/api/networks/nn/#models.nn.ops.PositionalEncoding","title":"PositionalEncoding","text":"
PositionalEncoding(\n    embed_dim: int,\n    dropout: float = 0.1,\n    max_len: int = 1000,\n)\n

Bases: Module

Methods:

  • forward \u2013

    Arguments:

Source code in rl4co/models/nn/ops.py
def __init__(self, embed_dim: int, dropout: float = 0.1, max_len: int = 1000):\n    super().__init__()\n    self.dropout = nn.Dropout(p=dropout)\n    self.d_model = embed_dim\n    max_len = max_len\n    position = torch.arange(max_len).unsqueeze(1)\n    div_term = torch.exp(\n        torch.arange(0, self.d_model, 2) * (-math.log(10000.0) / self.d_model)\n    )\n    pe = torch.zeros(max_len, 1, self.d_model)\n    pe[:, 0, 0::2] = torch.sin(position * div_term)\n    pe[:, 0, 1::2] = torch.cos(position * div_term)\n    pe = pe.transpose(0, 1)  # [1, max_len, d_model]\n    self.register_buffer(\"pe\", pe)\n
"},{"location":"docs/content/api/networks/nn/#models.nn.ops.PositionalEncoding.forward","title":"forward","text":"
forward(hidden: Tensor, seq_pos) -> Tensor\n

Parameters:

  • hidden \u2013

    Tensor, shape [batch_size, seq_len, embedding_dim]

  • seq_pos \u2013

    Tensor, shape [batch_size, seq_len]

Source code in rl4co/models/nn/ops.py
def forward(self, hidden: torch.Tensor, seq_pos) -> torch.Tensor:\n    \"\"\"\n    Arguments:\n        x: Tensor, shape ``[batch_size, seq_len, embedding_dim]``\n        seq_pos: Tensor, shape ``[batch_size, seq_len]``\n    \"\"\"\n    pes = self.pe.expand(hidden.size(0), -1, -1).gather(\n        1, seq_pos.unsqueeze(-1).expand(-1, -1, self.d_model)\n    )\n    hidden = hidden + pes\n    return self.dropout(hidden)\n
"},{"location":"docs/content/api/networks/nn/#models.nn.ops.RandomEncoding","title":"RandomEncoding","text":"
RandomEncoding(embed_dim: int, max_classes: int = 100)\n

Bases: Module

This is like torch.nn.Embedding, but the rows of the embedding table are randomly permuted in each forward pass before the lookup operation. This might be useful in cases where classes have no fixed meaning but rather indicate a connection between different elements in a sequence. Reference is the MatNet model.

Source code in rl4co/models/nn/ops.py
def __init__(self, embed_dim: int, max_classes: int = 100):\n    super().__init__()\n    self.embed_dim = embed_dim\n    self.max_classes = max_classes\n    rand_emb = torch.rand(max_classes, self.embed_dim)\n    self.register_buffer(\"emb\", rand_emb)\n
"},{"location":"docs/content/api/rl/a2c/","title":"A2C","text":""},{"location":"docs/content/api/rl/a2c/#models.rl.a2c.a2c.A2C","title":"A2C","text":"
A2C(\n    env: RL4COEnvBase,\n    policy: Module,\n    critic: CriticNetwork = None,\n    critic_kwargs: dict = {},\n    actor_optimizer_kwargs: dict = {\"lr\": 0.0001},\n    critic_optimizer_kwargs: dict = None,\n    **kwargs\n)\n

Bases: REINFORCE

Advantage Actor Critic (A2C) algorithm. A2C is a variant of REINFORCE where a baseline is provided by a critic network. Here we additionally support different optimizers for the actor and the critic.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (Module) \u2013

    Policy to use for the algorithm

  • critic (CriticNetwork, default: None ) \u2013

    Critic network to use for the algorithm

  • critic_kwargs (dict, default: {} ) \u2013

    Keyword arguments to pass to the critic network

  • actor_optimizer_kwargs (dict, default: {'lr': 0.0001} ) \u2013

    Keyword arguments for the policy (=actor) optimizer

  • critic_optimizer_kwargs (dict, default: None ) \u2013

    Keyword arguments for the critic optimizer. If None, use the same as actor_optimizer_kwargs

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Methods:

  • configure_optimizers \u2013

    Configure the optimizers for the policy and the critic network (=baseline)

Source code in rl4co/models/rl/a2c/a2c.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module,\n    critic: CriticNetwork = None,\n    critic_kwargs: dict = {},\n    actor_optimizer_kwargs: dict = {\"lr\": 1e-4},\n    critic_optimizer_kwargs: dict = None,\n    **kwargs,\n):\n    if critic is None:\n        log.info(\"Creating critic network for {}\".format(env.name))\n        critic = create_critic_from_actor(policy, **critic_kwargs)\n\n    # The baseline is directly created here, so we eliminate the baseline argument\n    kwargs.pop(\"baseline\", None)\n\n    super().__init__(env, policy, baseline=CriticBaseline(critic), **kwargs)\n    self.actor_optimizer_kwargs = actor_optimizer_kwargs\n    self.critic_optimizer_kwargs = (\n        critic_optimizer_kwargs\n        if critic_optimizer_kwargs is not None\n        else actor_optimizer_kwargs\n    )\n
"},{"location":"docs/content/api/rl/a2c/#models.rl.a2c.a2c.A2C.configure_optimizers","title":"configure_optimizers","text":"
configure_optimizers()\n

Configure the optimizers for the policy and the critic network (=baseline)

Source code in rl4co/models/rl/a2c/a2c.py
def configure_optimizers(self):\n    \"\"\"Configure the optimizers for the policy and the critic network (=baseline)\"\"\"\n    parameters = [\n        {\"params\": self.policy.parameters(), **self.actor_optimizer_kwargs},\n    ] + [{\"params\": self.baseline.parameters(), **self.critic_optimizer_kwargs}]\n\n    return super().configure_optimizers(parameters)\n
"},{"location":"docs/content/api/rl/base/","title":"RL4COLitModule","text":"

The RL4COLitModule is a wrapper around PyTorch Lightning's LightningModule that provides additional functionality for RL algorithms. It is the parent class for all RL algorithms in the library.

"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule","title":"RL4COLitModule","text":"
RL4COLitModule(\n    env: RL4COEnvBase,\n    policy: Module,\n    batch_size: int = 512,\n    val_batch_size: Union[List[int], int] = None,\n    test_batch_size: Union[List[int], int] = None,\n    train_data_size: int = 100000,\n    val_data_size: int = 10000,\n    test_data_size: int = 10000,\n    optimizer: Union[str, Optimizer, partial] = \"Adam\",\n    optimizer_kwargs: dict = {\"lr\": 0.0001},\n    lr_scheduler: Union[str, LRScheduler, partial] = None,\n    lr_scheduler_kwargs: dict = {\n        \"milestones\": [80, 95],\n        \"gamma\": 0.1,\n    },\n    lr_scheduler_interval: str = \"epoch\",\n    lr_scheduler_monitor: str = \"val/reward\",\n    generate_default_data: bool = False,\n    shuffle_train_dataloader: bool = False,\n    dataloader_num_workers: int = 0,\n    data_dir: str = \"data/\",\n    log_on_step: bool = True,\n    metrics: dict = {},\n    **litmodule_kwargs\n)\n

Bases: LightningModule

Base class for Lightning modules for RL4CO. This defines the general training loop in terms of RL algorithms. Subclasses should mainly implement shared_step to define the specific loss functions and optimization routines.

Parameters:

  • env (RL4COEnvBase) \u2013

    RL4CO environment

  • policy (Module) \u2013

    policy network (actor)

  • batch_size (int, default: 512 ) \u2013

    batch size (general one, default used for training)

  • val_batch_size (Union[List[int], int], default: None ) \u2013

    specific batch size for validation. If None, will use batch_size. If list, will use one for each dataset

  • test_batch_size (Union[List[int], int], default: None ) \u2013

    specific batch size for testing. If None, will use val_batch_size. If list, will use one for each dataset

  • train_data_size (int, default: 100000 ) \u2013

    size of training dataset for one epoch

  • val_data_size (int, default: 10000 ) \u2013

    size of validation dataset for one epoch

  • test_data_size (int, default: 10000 ) \u2013

    size of testing dataset for one epoch

  • optimizer (Union[str, Optimizer, partial], default: 'Adam' ) \u2013

    optimizer or optimizer name

  • optimizer_kwargs (dict, default: {'lr': 0.0001} ) \u2013

    optimizer kwargs

  • lr_scheduler (Union[str, LRScheduler, partial], default: None ) \u2013

    learning rate scheduler or learning rate scheduler name

  • lr_scheduler_kwargs (dict, default: {'milestones': [80, 95], 'gamma': 0.1} ) \u2013

    learning rate scheduler kwargs

  • lr_scheduler_interval (str, default: 'epoch' ) \u2013

    learning rate scheduler interval

  • lr_scheduler_monitor (str, default: 'val/reward' ) \u2013

    learning rate scheduler monitor

  • generate_default_data (bool, default: False ) \u2013

    whether to generate default datasets, filling up the data directory

  • shuffle_train_dataloader (bool, default: False ) \u2013

    whether to shuffle training dataloader. Default is False since we recreate dataset every epoch

  • dataloader_num_workers (int, default: 0 ) \u2013

    number of workers for dataloader

  • data_dir (str, default: 'data/' ) \u2013

    data directory

  • metrics (dict, default: {} ) \u2013

    metrics

  • litmodule_kwargs \u2013

    kwargs for LightningModule

Methods:

  • instantiate_metrics \u2013

    Dictionary of metrics to be logged at each phase

  • setup \u2013

    Base LightningModule setup method. This will setup the datasets and dataloaders

  • setup_loggers \u2013

    Log all hyperparameters except those in nn.Module

  • post_setup_hook \u2013

    Hook to be called after setup. Can be used to set up subclasses without overriding setup

  • configure_optimizers \u2013

    Args:

  • log_metrics \u2013

    Log metrics to logger and progress bar

  • forward \u2013

    Forward pass for the model. Simple wrapper around policy. Uses env from the module if not provided.

  • shared_step \u2013

    Shared step between train/val/test. To be implemented in subclass

  • on_train_epoch_end \u2013

    Called at the end of the training epoch. This can be used for instance to update the train dataset with new data (which is the case in RL).

  • wrap_dataset \u2013

    Wrap dataset with policy-specific wrapper. This is useful e.g. in REINFORCE where we need to collect the greedy rollout baseline outputs.

Source code in rl4co/models/rl/common/base.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module,\n    batch_size: int = 512,\n    val_batch_size: Union[List[int], int] = None,\n    test_batch_size: Union[List[int], int] = None,\n    train_data_size: int = 100_000,\n    val_data_size: int = 10_000,\n    test_data_size: int = 10_000,\n    optimizer: Union[str, torch.optim.Optimizer, partial] = \"Adam\",\n    optimizer_kwargs: dict = {\"lr\": 1e-4},\n    lr_scheduler: Union[str, torch.optim.lr_scheduler.LRScheduler, partial] = None,\n    lr_scheduler_kwargs: dict = {\n        \"milestones\": [80, 95],\n        \"gamma\": 0.1,\n    },\n    lr_scheduler_interval: str = \"epoch\",\n    lr_scheduler_monitor: str = \"val/reward\",\n    generate_default_data: bool = False,\n    shuffle_train_dataloader: bool = False,\n    dataloader_num_workers: int = 0,\n    data_dir: str = \"data/\",\n    log_on_step: bool = True,\n    metrics: dict = {},\n    **litmodule_kwargs,\n):\n    super().__init__(**litmodule_kwargs)\n\n    # This line ensures params passed to LightningModule will be saved to ckpt\n    # it also allows to access params with 'self.hparams' attribute\n    # Note: we will send to logger with `self.logger.save_hyperparams` in `setup`\n    self.save_hyperparameters(logger=False)\n\n    self.env = env\n    self.policy = policy\n\n    self.instantiate_metrics(metrics)\n    self.log_on_step = log_on_step\n\n    self.data_cfg = {\n        \"batch_size\": batch_size,\n        \"val_batch_size\": val_batch_size,\n        \"test_batch_size\": test_batch_size,\n        \"generate_default_data\": generate_default_data,\n        \"data_dir\": data_dir,\n        \"train_data_size\": train_data_size,\n        \"val_data_size\": val_data_size,\n        \"test_data_size\": test_data_size,\n    }\n\n    self._optimizer_name_or_cls: Union[str, torch.optim.Optimizer] = optimizer\n    self.optimizer_kwargs: dict = optimizer_kwargs\n    self._lr_scheduler_name_or_cls: Union[\n        str, 
torch.optim.lr_scheduler.LRScheduler\n    ] = lr_scheduler\n    self.lr_scheduler_kwargs: dict = lr_scheduler_kwargs\n    self.lr_scheduler_interval: str = lr_scheduler_interval\n    self.lr_scheduler_monitor: str = lr_scheduler_monitor\n\n    self.shuffle_train_dataloader = shuffle_train_dataloader\n    self.dataloader_num_workers = dataloader_num_workers\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.instantiate_metrics","title":"instantiate_metrics","text":"
instantiate_metrics(metrics: dict)\n

Dictionary of metrics to be logged at each phase

Source code in rl4co/models/rl/common/base.py
def instantiate_metrics(self, metrics: dict):\n    \"\"\"Dictionary of metrics to be logged at each phase\"\"\"\n\n    if not metrics:\n        log.info(\"No metrics specified, using default\")\n    self.train_metrics = metrics.get(\"train\", [\"loss\", \"reward\"])\n    self.val_metrics = metrics.get(\"val\", [\"reward\"])\n    self.test_metrics = metrics.get(\"test\", [\"reward\"])\n    self.log_on_step = metrics.get(\"log_on_step\", True)\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.setup","title":"setup","text":"
setup(stage='fit')\n

Base LightningModule setup method. This will setup the datasets and dataloaders

Note

We also send to the loggers all hyperparams that are not nn.Module (i.e. the policy). Apparently PyTorch Lightning does not do this by default.

Source code in rl4co/models/rl/common/base.py
def setup(self, stage=\"fit\"):\n    \"\"\"Base LightningModule setup method. This will setup the datasets and dataloaders\n\n    Note:\n        We also send to the loggers all hyperparams that are not `nn.Module` (i.e. the policy).\n        Apparently PyTorch Lightning does not do this by default.\n    \"\"\"\n\n    log.info(\"Setting up batch sizes for train/val/test\")\n    train_bs, val_bs, test_bs = (\n        self.data_cfg[\"batch_size\"],\n        self.data_cfg[\"val_batch_size\"],\n        self.data_cfg[\"test_batch_size\"],\n    )\n    self.train_batch_size = train_bs\n    self.val_batch_size = train_bs if val_bs is None else val_bs\n    self.test_batch_size = self.val_batch_size if test_bs is None else test_bs\n\n    if self.data_cfg[\"generate_default_data\"]:\n        log.info(\n            \"Generating default datasets. If found, they will not be overwritten\"\n        )\n        generate_default_datasets(data_dir=self.data_cfg[\"data_dir\"])\n\n    log.info(\"Setting up datasets\")\n    self.train_dataset = self.wrap_dataset(\n        self.env.dataset(self.data_cfg[\"train_data_size\"], phase=\"train\")\n    )\n    self.val_dataset = self.env.dataset(self.data_cfg[\"val_data_size\"], phase=\"val\")\n    self.test_dataset = self.env.dataset(\n        self.data_cfg[\"test_data_size\"], phase=\"test\"\n    )\n    self.dataloader_names = None\n    self.setup_loggers()\n    self.post_setup_hook()\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.setup_loggers","title":"setup_loggers","text":"
setup_loggers()\n

Log all hyperparameters except those in nn.Module

Source code in rl4co/models/rl/common/base.py
def setup_loggers(self):\n    \"\"\"Log all hyperparameters except those in `nn.Module`\"\"\"\n    if self.loggers is not None:\n        hparams_save = {\n            k: v for k, v in self.hparams.items() if not isinstance(v, nn.Module)\n        }\n        for logger in self.loggers:\n            logger.log_hyperparams(hparams_save)\n            logger.log_graph(self)\n            logger.save()\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.post_setup_hook","title":"post_setup_hook","text":"
post_setup_hook()\n

Hook to be called after setup. Can be used to set up subclasses without overriding setup

Source code in rl4co/models/rl/common/base.py
def post_setup_hook(self):\n    \"\"\"Hook to be called after setup. Can be used to set up subclasses without overriding `setup`\"\"\"\n    pass\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.configure_optimizers","title":"configure_optimizers","text":"
configure_optimizers(parameters=None)\n

Parameters:

  • parameters \u2013

    parameters to be optimized. If None, will use self.parameters(), i.e. all parameters

Source code in rl4co/models/rl/common/base.py
def configure_optimizers(self, parameters=None):\n    \"\"\"\n    Args:\n        parameters: parameters to be optimized. If None, will use `self.parameters()`, i.e. all parameters\n    \"\"\"\n\n    if parameters is None:\n        parameters = self.parameters()\n\n    log.info(f\"Instantiating optimizer <{self._optimizer_name_or_cls}>\")\n    if isinstance(self._optimizer_name_or_cls, str):\n        optimizer = create_optimizer(\n            parameters, self._optimizer_name_or_cls, **self.optimizer_kwargs\n        )\n    elif isinstance(self._optimizer_name_or_cls, partial):\n        optimizer = self._optimizer_name_or_cls(parameters, **self.optimizer_kwargs)\n    else:  # User-defined optimizer\n        opt_cls = self._optimizer_name_or_cls\n        optimizer = opt_cls(parameters, **self.optimizer_kwargs)\n        assert isinstance(optimizer, torch.optim.Optimizer)\n\n    # instantiate lr scheduler\n    if self._lr_scheduler_name_or_cls is None:\n        return optimizer\n    else:\n        log.info(f\"Instantiating LR scheduler <{self._lr_scheduler_name_or_cls}>\")\n        if isinstance(self._lr_scheduler_name_or_cls, str):\n            scheduler = create_scheduler(\n                optimizer, self._lr_scheduler_name_or_cls, **self.lr_scheduler_kwargs\n            )\n        elif isinstance(self._lr_scheduler_name_or_cls, partial):\n            scheduler = self._lr_scheduler_name_or_cls(\n                optimizer, **self.lr_scheduler_kwargs\n            )\n        else:  # User-defined scheduler\n            scheduler_cls = self._lr_scheduler_name_or_cls\n            scheduler = scheduler_cls(optimizer, **self.lr_scheduler_kwargs)\n            assert isinstance(scheduler, torch.optim.lr_scheduler.LRScheduler)\n        return [optimizer], {\n            \"scheduler\": scheduler,\n            \"interval\": self.lr_scheduler_interval,\n            \"monitor\": self.lr_scheduler_monitor,\n        }\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.log_metrics","title":"log_metrics","text":"
log_metrics(\n    metric_dict: dict,\n    phase: str,\n    dataloader_idx: Union[int, None] = None,\n)\n

Log metrics to logger and progress bar

Source code in rl4co/models/rl/common/base.py
def log_metrics(\n    self, metric_dict: dict, phase: str, dataloader_idx: Union[int, None] = None\n):\n    \"\"\"Log metrics to logger and progress bar\"\"\"\n    metrics = getattr(self, f\"{phase}_metrics\")\n    dataloader_name = \"\"\n    if dataloader_idx is not None and self.dataloader_names is not None:\n        dataloader_name = \"/\" + self.dataloader_names[dataloader_idx]\n    metrics = {\n        f\"{phase}/{k}{dataloader_name}\": v.mean()\n        if isinstance(v, torch.Tensor)\n        else v\n        for k, v in metric_dict.items()\n        if k in metrics\n    }\n    log_on_step = self.log_on_step if phase == \"train\" else False\n    on_epoch = False if phase == \"train\" else True\n    self.log_dict(\n        metrics,\n        on_step=log_on_step,\n        on_epoch=on_epoch,\n        prog_bar=True,\n        sync_dist=True,\n        add_dataloader_idx=False,  # we add manually above\n    )\n    return metrics\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.forward","title":"forward","text":"
forward(td, **kwargs)\n

Forward pass for the model. Simple wrapper around policy. Uses env from the module if not provided.

Source code in rl4co/models/rl/common/base.py
def forward(self, td, **kwargs):\n    \"\"\"Forward pass for the model. Simple wrapper around `policy`. Uses `env` from the module if not provided.\"\"\"\n    if kwargs.get(\"env\", None) is None:\n        env = self.env\n    else:\n        log.info(\"Using env from kwargs\")\n        env = kwargs.pop(\"env\")\n    return self.policy(td, env, **kwargs)\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.shared_step","title":"shared_step","text":"
shared_step(\n    batch: Any, batch_idx: int, phase: str, **kwargs\n)\n

Shared step between train/val/test. To be implemented in subclass

Source code in rl4co/models/rl/common/base.py
def shared_step(self, batch: Any, batch_idx: int, phase: str, **kwargs):\n    \"\"\"Shared step between train/val/test. To be implemented in subclass\"\"\"\n    raise NotImplementedError(\"Shared step is required to implemented in subclass\")\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.on_train_epoch_end","title":"on_train_epoch_end","text":"
on_train_epoch_end()\n

Called at the end of the training epoch. This can be used for instance to update the train dataset with new data (which is the case in RL).

Source code in rl4co/models/rl/common/base.py
def on_train_epoch_end(self):\n    \"\"\"Called at the end of the training epoch. This can be used for instance to update the train dataset\n    with new data (which is the case in RL).\n    \"\"\"\n    # Only update if not in the first epoch\n    # If last epoch, we don't need to update since we will not use the dataset anymore\n    if self.current_epoch < self.trainer.max_epochs - 1:\n        log.info(\"Generating training dataset for next epoch...\")\n        train_dataset = self.env.dataset(self.data_cfg[\"train_data_size\"], \"train\")\n        self.train_dataset = self.wrap_dataset(train_dataset)\n
"},{"location":"docs/content/api/rl/base/#models.rl.common.base.RL4COLitModule.wrap_dataset","title":"wrap_dataset","text":"
wrap_dataset(dataset)\n

Wrap dataset with policy-specific wrapper. This is useful e.g. in REINFORCE, where we need to collect the greedy rollout baseline outputs.

Source code in rl4co/models/rl/common/base.py
def wrap_dataset(self, dataset):\n    \"\"\"Wrap dataset with policy-specific wrapper. This is useful i.e. in REINFORCE where we need to\n    collect the greedy rollout baseline outputs.\n    \"\"\"\n    return dataset\n
"},{"location":"docs/content/api/rl/base/#transductive-learning","title":"Transductive Learning","text":"

Transductive models are learning algorithms that optimize on a specific instance. They improve solutions by updating policy parameters \\(\\theta\\), which means that we are running optimization (backprop) at test time. Transductive learning can be performed with different policies: for example, EAS updates (a part of) the parameters of AR policies to obtain better solutions, and there may be other methods (or papers we are not aware of) that also optimize at test time.

Tip

You may refer to the definition of inductive vs transductive RL. In inductive RL, we train to generalize to new instances. In transductive RL, we train (or finetune) to solve only specific ones.

Classes:

  • TransductiveModel \u2013

    Base class for transductive algorithms (i.e. that optimize policy parameters for specific instances).

"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel","title":"TransductiveModel","text":"
TransductiveModel(\n    env,\n    policy,\n    dataset: Union[Dataset, str],\n    batch_size: int = 1,\n    max_iters: int = 100,\n    max_runtime: Optional[int] = 86400,\n    save_path: Optional[str] = None,\n    **kwargs\n)\n

Bases: RL4COLitModule

Base class for transductive algorithms (i.e. that optimize policy parameters for specific instances, see https://en.wikipedia.org/wiki/Transduction_(machine_learning)). Transductive algorithms are used online to find better solutions for a given dataset, i.e. given a policy, improve (a part of) its parameters such that the policy performs better on the given dataset.

Note

By default, we use manual optimization to handle the search.

Parameters:

  • env \u2013

    RL4CO environment

  • policy \u2013

    policy network

  • dataset (Union[Dataset, str]) \u2013

    dataset to use for training

  • batch_size (int, default: 1 ) \u2013

    batch size

  • max_iters (int, default: 100 ) \u2013

    maximum number of iterations

  • max_runtime (Optional[int], default: 86400 ) \u2013

    maximum runtime in seconds

  • save_path (Optional[str], default: None ) \u2013

    path to save the model

  • **kwargs \u2013

    additional arguments

Methods:

  • setup \u2013

    Setup the dataset and attributes.

  • on_train_batch_start \u2013

    Called before training (i.e. search) for a new batch begins.

  • training_step \u2013

    Main search loop. We use the training step to effectively adapt to a batch of instances.

  • on_train_batch_end \u2013

    Called when the train batch ends. This can be used, for instance, for logging or clearing cache.

  • on_train_epoch_end \u2013

    Called when the training epoch ends.

  • validation_step \u2013

    Not used during search

  • test_step \u2013

    Not used during search

Source code in rl4co/models/common/transductive/base.py
def __init__(\n    self,\n    env,\n    policy,\n    dataset: Union[Dataset, str],\n    batch_size: int = 1,\n    max_iters: int = 100,\n    max_runtime: Optional[int] = 86_400,\n    save_path: Optional[str] = None,\n    **kwargs,\n):\n    self.save_hyperparameters(logger=False)\n    super().__init__(env, policy, **kwargs)\n    self.dataset = dataset\n    self.automatic_optimization = False  # we optimize manually\n
"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel.setup","title":"setup","text":"
setup(stage='fit')\n

Setup the dataset and attributes. The RL4COLitModule base class automatically loads the data.

Source code in rl4co/models/common/transductive/base.py
def setup(self, stage=\"fit\"):\n    \"\"\"Setup the dataset and attributes.\n    The RL4COLitModulebase class automatically loads the data.\n    \"\"\"\n    if isinstance(self.dataset, str):\n        # load from file\n        self.dataset = self.env.dataset(filename=self.dataset)\n\n    # Set all datasets and batch size as the same\n    for split in [\"train\", \"val\", \"test\"]:\n        setattr(self, f\"{split}_dataset\", self.dataset)\n        setattr(self, f\"{split}_batch_size\", self.hparams.batch_size)\n\n    # Setup loggers\n    self.setup_loggers()\n
"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel.on_train_batch_start","title":"on_train_batch_start","text":"
on_train_batch_start(batch: Any, batch_idx: int)\n

Called before training (i.e. search) for a new batch begins. This can be used to perform changes to the model or optimizer at the start of each batch.

Source code in rl4co/models/common/transductive/base.py
def on_train_batch_start(self, batch: Any, batch_idx: int):\n    \"\"\"Called before training (i.e. search) for a new batch begins.\n    This can be used to perform changes to the model or optimizer at the start of each batch.\n    \"\"\"\n    pass  # Implement in subclass\n
"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel.training_step","title":"training_step abstractmethod","text":"
training_step(batch, batch_idx)\n

Main search loop. We use the training step to effectively adapt to a batch of instances.

Source code in rl4co/models/common/transductive/base.py
@abc.abstractmethod\ndef training_step(self, batch, batch_idx):\n    \"\"\"Main search loop. We use the training step to effectively adapt to a `batch` of instances.\"\"\"\n    raise NotImplementedError(\"Implement in subclass\")\n
"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel.on_train_batch_end","title":"on_train_batch_end","text":"
on_train_batch_end(\n    outputs: STEP_OUTPUT, batch: Any, batch_idx: int\n) -> None\n

Called when the train batch ends. This can be used for instance for logging or clearing cache.

Source code in rl4co/models/common/transductive/base.py
def on_train_batch_end(\n    self, outputs: STEP_OUTPUT, batch: Any, batch_idx: int\n) -> None:\n    \"\"\"Called when the train batch ends. This can be used for\n    instance for logging or clearing cache.\n    \"\"\"\n    pass  # Implement in subclass\n
"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel.on_train_epoch_end","title":"on_train_epoch_end","text":"
on_train_epoch_end() -> None\n

Called when the training epoch ends.

Source code in rl4co/models/common/transductive/base.py
def on_train_epoch_end(self) -> None:\n    \"\"\"Called when the train ends.\"\"\"\n    pass  # Implement in subclass\n
"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel.validation_step","title":"validation_step","text":"
validation_step(batch: Any, batch_idx: int)\n

Not used during search

Source code in rl4co/models/common/transductive/base.py
def validation_step(self, batch: Any, batch_idx: int):\n    \"\"\"Not used during search\"\"\"\n    pass\n
"},{"location":"docs/content/api/rl/base/#models.common.transductive.base.TransductiveModel.test_step","title":"test_step","text":"
test_step(batch: Any, batch_idx: int)\n

Not used during search

Source code in rl4co/models/common/transductive/base.py
def test_step(self, batch: Any, batch_idx: int):\n    \"\"\"Not used during search\"\"\"\n    pass\n
"},{"location":"docs/content/api/rl/ppo/","title":"PPO","text":""},{"location":"docs/content/api/rl/ppo/#models.rl.ppo.ppo.PPO","title":"PPO","text":"
PPO(\n    env: RL4COEnvBase,\n    policy: Module,\n    critic: CriticNetwork = None,\n    critic_kwargs: dict = {},\n    clip_range: float = 0.2,\n    ppo_epochs: int = 2,\n    mini_batch_size: Union[int, float] = 0.25,\n    vf_lambda: float = 0.5,\n    entropy_lambda: float = 0.0,\n    normalize_adv: bool = False,\n    max_grad_norm: float = 0.5,\n    metrics: dict = {\n        \"train\": [\n            \"reward\",\n            \"loss\",\n            \"surrogate_loss\",\n            \"value_loss\",\n            \"entropy\",\n        ]\n    },\n    **kwargs\n)\n

Bases: RL4COLitModule

An implementation of the Proximal Policy Optimization (PPO) algorithm (https://arxiv.org/abs/1707.06347) is presented with modifications for autoregressive decoding schemes.

In contrast to the original PPO algorithm, this implementation does not consider autoregressive decoding steps as part of the MDP transition. While many Neural Combinatorial Optimization (NCO) studies model decoding steps as transitions in a solution-construction MDP, we treat autoregressive solution construction as an algorithmic choice for tractable CO solution generation. This choice aligns with the Attention Model (AM) (https://openreview.net/forum?id=ByxBFsRqYm), which treats decoding steps as a single-step MDP in Equation 9.

Modeling autoregressive decoding steps as a single-step MDP introduces significant changes to the PPO implementation, including:

  • Generalized Advantage Estimation (GAE) (https://arxiv.org/abs/1506.02438) is not applicable since we are dealing with a single-step MDP.
  • The definition of policy entropy can differ from the commonly implemented manner.

The commonly implemented definition of policy entropy is the entropy of the policy distribution, given by:

\\[H(\\pi(x_t)) = - \\sum_{a_t \\in A_t} \\pi(a_t|x_t) \\log \\pi(a_t|x_t)\\]

where \\(x_t\\) represents the given state at step \\(t\\), \\(A_t\\) is the set of all (admissible) actions at step \\(t\\), and \\(a_t\\) is the action taken at step \\(t\\).

If we interpret autoregressive decoding steps as transition steps of an MDP, the entropy for the entire decoding process can be defined as the sum of entropies for each decoding step:

\\[H(\\pi) = \\sum_t H(\\pi(x_t))\\]

However, if we consider autoregressive decoding steps as an algorithmic choice, the entropy for the entire decoding process is defined as:

\\[H(\\pi) = - \\sum_{a \\in A} \\pi(a|x) \\log \\pi(a|x)\\]

where \\(x\\) represents the given CO problem instance, and \\(A\\) is the set of all feasible solutions.

Due to the intractability of computing the entropy of the policy distribution over all feasible solutions, we approximate it by computing the entropy over solutions generated by the policy itself. This approximation serves as a proxy for the second definition of entropy, utilizing Monte Carlo sampling.

It is worth noting that our modeling of decoding steps and the implementation of the PPO algorithm align with recent work in the Natural Language Processing (NLP) community, specifically RL with Human Feedback (RLHF) (e.g., https://github.com/lucidrains/PaLM-rlhf-pytorch).

Methods:

  • on_train_epoch_end \u2013

    ToDo: Add support for other schedulers.

Source code in rl4co/models/rl/ppo/ppo.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module,\n    critic: CriticNetwork = None,\n    critic_kwargs: dict = {},\n    clip_range: float = 0.2,  # epsilon of PPO\n    ppo_epochs: int = 2,  # inner epoch, K\n    mini_batch_size: Union[int, float] = 0.25,  # 0.25,\n    vf_lambda: float = 0.5,  # lambda of Value function fitting\n    entropy_lambda: float = 0.0,  # lambda of entropy bonus\n    normalize_adv: bool = False,  # whether to normalize advantage\n    max_grad_norm: float = 0.5,  # max gradient norm\n    metrics: dict = {\n        \"train\": [\"reward\", \"loss\", \"surrogate_loss\", \"value_loss\", \"entropy\"],\n    },\n    **kwargs,\n):\n    super().__init__(env, policy, metrics=metrics, **kwargs)\n    self.automatic_optimization = False  # PPO uses custom optimization routine\n\n    if critic is None:\n        log.info(\"Creating critic network for {}\".format(env.name))\n        critic = create_critic_from_actor(policy, **critic_kwargs)\n    self.critic = critic\n\n    if isinstance(mini_batch_size, float) and (\n        mini_batch_size <= 0 or mini_batch_size > 1\n    ):\n        default_mini_batch_fraction = 0.25\n        log.warning(\n            f\"mini_batch_size must be an integer or a float in the range (0, 1], got {mini_batch_size}. Setting mini_batch_size to {default_mini_batch_fraction}.\"\n        )\n        mini_batch_size = default_mini_batch_fraction\n\n    if isinstance(mini_batch_size, int) and (mini_batch_size <= 0):\n        default_mini_batch_size = 128\n        log.warning(\n            f\"mini_batch_size must be an integer or a float in the range (0, 1], got {mini_batch_size}. 
Setting mini_batch_size to {default_mini_batch_size}.\"\n        )\n        mini_batch_size = default_mini_batch_size\n\n    self.ppo_cfg = {\n        \"clip_range\": clip_range,\n        \"ppo_epochs\": ppo_epochs,\n        \"mini_batch_size\": mini_batch_size,\n        \"vf_lambda\": vf_lambda,\n        \"entropy_lambda\": entropy_lambda,\n        \"normalize_adv\": normalize_adv,\n        \"max_grad_norm\": max_grad_norm,\n    }\n
"},{"location":"docs/content/api/rl/ppo/#models.rl.ppo.ppo.PPO.on_train_epoch_end","title":"on_train_epoch_end","text":"
on_train_epoch_end()\n

ToDo: Add support for other schedulers.

Source code in rl4co/models/rl/ppo/ppo.py
def on_train_epoch_end(self):\n    \"\"\"\n    ToDo: Add support for other schedulers.\n    \"\"\"\n\n    sch = self.lr_schedulers()\n\n    # If the selected scheduler is a MultiStepLR scheduler.\n    if isinstance(sch, torch.optim.lr_scheduler.MultiStepLR):\n        sch.step()\n
"},{"location":"docs/content/api/rl/reinforce/","title":"REINFORCE","text":""},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.reinforce.REINFORCE","title":"REINFORCE","text":"
REINFORCE(\n    env: RL4COEnvBase,\n    policy: Module,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    baseline_kwargs: dict = {},\n    reward_scale: str = None,\n    **kwargs\n)\n

Bases: RL4COLitModule

REINFORCE algorithm, also known as policy gradients. See superclass RL4COLitModule for more details.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (Module) \u2013

    Policy to use for the algorithm

  • baseline (Union[REINFORCEBaseline, str], default: 'rollout' ) \u2013

    REINFORCE baseline

  • baseline_kwargs (dict, default: {} ) \u2013

    Keyword arguments for baseline. Ignored if baseline is not a string

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Methods:

  • calculate_loss \u2013

    Calculate loss for REINFORCE algorithm.

  • on_train_epoch_end \u2013

    Callback for end of training epoch: we evaluate the baseline

  • wrap_dataset \u2013

    Wrap dataset from baseline evaluation. Used in greedy rollout baseline

  • set_decode_type_multistart \u2013

    Set decode type to multistart for train, val and test in policy.

  • load_from_checkpoint \u2013

    Load model from checkpoint.

Source code in rl4co/models/rl/reinforce/reinforce.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    baseline_kwargs: dict = {},\n    reward_scale: str = None,\n    **kwargs,\n):\n    super().__init__(env, policy, **kwargs)\n\n    self.save_hyperparameters(logger=False)\n\n    if baseline == \"critic\":\n        log.warning(\n            \"Using critic as baseline. If you want more granular support, use the A2C module instead.\"\n        )\n\n    if isinstance(baseline, str):\n        baseline = get_reinforce_baseline(baseline, **baseline_kwargs)\n    else:\n        if baseline_kwargs != {}:\n            log.warning(\"baseline_kwargs is ignored when baseline is not a string\")\n    self.baseline = baseline\n    self.advantage_scaler = RewardScaler(reward_scale)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.reinforce.REINFORCE.calculate_loss","title":"calculate_loss","text":"
calculate_loss(\n    td: TensorDict,\n    batch: TensorDict,\n    policy_out: dict,\n    reward: Optional[Tensor] = None,\n    log_likelihood: Optional[Tensor] = None,\n)\n

Calculate loss for REINFORCE algorithm.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the current state of the environment

  • batch (TensorDict) \u2013

    Batch of data. This is used to get the extra loss terms, e.g., REINFORCE baseline

  • policy_out (dict) \u2013

    Output of the policy network

  • reward (Optional[Tensor], default: None ) \u2013

    Reward tensor. If None, it is taken from policy_out

  • log_likelihood (Optional[Tensor], default: None ) \u2013

    Log-likelihood tensor. If None, it is taken from policy_out

Source code in rl4co/models/rl/reinforce/reinforce.py
def calculate_loss(\n    self,\n    td: TensorDict,\n    batch: TensorDict,\n    policy_out: dict,\n    reward: Optional[torch.Tensor] = None,\n    log_likelihood: Optional[torch.Tensor] = None,\n):\n    \"\"\"Calculate loss for REINFORCE algorithm.\n\n    Args:\n        td: TensorDict containing the current state of the environment\n        batch: Batch of data. This is used to get the extra loss terms, e.g., REINFORCE baseline\n        policy_out: Output of the policy network\n        reward: Reward tensor. If None, it is taken from `policy_out`\n        log_likelihood: Log-likelihood tensor. If None, it is taken from `policy_out`\n    \"\"\"\n    # Extra: this is used for additional loss terms, e.g., REINFORCE baseline\n    extra = batch.get(\"extra\", None)\n    reward = reward if reward is not None else policy_out[\"reward\"]\n    log_likelihood = (\n        log_likelihood if log_likelihood is not None else policy_out[\"log_likelihood\"]\n    )\n\n    # REINFORCE baseline\n    bl_val, bl_loss = (\n        self.baseline.eval(td, reward, self.env) if extra is None else (extra, 0)\n    )\n\n    # Main loss function\n    advantage = reward - bl_val  # advantage = reward - baseline\n    advantage = self.advantage_scaler(advantage)\n    reinforce_loss = -(advantage * log_likelihood).mean()\n    loss = reinforce_loss + bl_loss\n    policy_out.update(\n        {\n            \"loss\": loss,\n            \"reinforce_loss\": reinforce_loss,\n            \"bl_loss\": bl_loss,\n            \"bl_val\": bl_val,\n        }\n    )\n    return policy_out\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.reinforce.REINFORCE.on_train_epoch_end","title":"on_train_epoch_end","text":"
on_train_epoch_end()\n

Callback for end of training epoch: we evaluate the baseline

Source code in rl4co/models/rl/reinforce/reinforce.py
def on_train_epoch_end(self):\n    \"\"\"Callback for end of training epoch: we evaluate the baseline\"\"\"\n    self.baseline.epoch_callback(\n        self.policy,\n        env=self.env,\n        batch_size=self.val_batch_size,\n        device=get_lightning_device(self),\n        epoch=self.current_epoch,\n        dataset_size=self.data_cfg[\"val_data_size\"],\n    )\n    # Need to call super() for the dataset to be reset\n    super().on_train_epoch_end()\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.reinforce.REINFORCE.wrap_dataset","title":"wrap_dataset","text":"
wrap_dataset(dataset)\n

Wrap dataset from baseline evaluation. Used in greedy rollout baseline

Source code in rl4co/models/rl/reinforce/reinforce.py
def wrap_dataset(self, dataset):\n    \"\"\"Wrap dataset from baseline evaluation. Used in greedy rollout baseline\"\"\"\n    return self.baseline.wrap_dataset(\n        dataset,\n        self.env,\n        batch_size=self.val_batch_size,\n        device=get_lightning_device(self),\n    )\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.reinforce.REINFORCE.set_decode_type_multistart","title":"set_decode_type_multistart","text":"
set_decode_type_multistart(phase: str)\n

Set decode type to multistart for train, val and test in policy. For example, if the decode type is greedy, it will be set to multistart_greedy.

Parameters:

  • phase (str) \u2013

    Phase to set decode type for. Must be one of train, val or test.

Source code in rl4co/models/rl/reinforce/reinforce.py
def set_decode_type_multistart(self, phase: str):\n    \"\"\"Set decode type to `multistart` for train, val and test in policy.\n    For example, if the decode type is `greedy`, it will be set to `multistart_greedy`.\n\n    Args:\n        phase: Phase to set decode type for. Must be one of `train`, `val` or `test`.\n    \"\"\"\n    attribute = f\"{phase}_decode_type\"\n    attr_get = getattr(self.policy, attribute)\n    # If does not exist, log error\n    if attr_get is None:\n        log.error(f\"Decode type for {phase} is None. Cannot prepend `multistart_`.\")\n        return\n    elif \"multistart\" in attr_get:\n        return\n    else:\n        setattr(self.policy, attribute, f\"multistart_{attr_get}\")\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.reinforce.REINFORCE.load_from_checkpoint","title":"load_from_checkpoint classmethod","text":"
load_from_checkpoint(\n    checkpoint_path: Union[_PATH, IO],\n    map_location: _MAP_LOCATION_TYPE = None,\n    hparams_file: Optional[_PATH] = None,\n    strict: bool = False,\n    load_baseline: bool = True,\n    **kwargs: Any\n) -> Self\n

Load model from checkpoint.

Note

This is a modified version of load_from_checkpoint from pytorch_lightning.core.saving. It deals with matching keys for the baseline by first running setup.

Source code in rl4co/models/rl/reinforce/reinforce.py
@classmethod\ndef load_from_checkpoint(\n    cls,\n    checkpoint_path: Union[_PATH, IO],\n    map_location: _MAP_LOCATION_TYPE = None,\n    hparams_file: Optional[_PATH] = None,\n    strict: bool = False,\n    load_baseline: bool = True,\n    **kwargs: Any,\n) -> Self:\n    \"\"\"Load model from checkpoint/\n\n    Note:\n        This is a modified version of `load_from_checkpoint` from `pytorch_lightning.core.saving`.\n        It deals with matching keys for the baseline by first running setup\n    \"\"\"\n\n    if strict:\n        log.warning(\"Setting strict=False for loading model from checkpoint.\")\n        strict = False\n\n    # Do not use strict\n    loaded = _load_from_checkpoint(\n        cls,\n        checkpoint_path,\n        map_location,\n        hparams_file,\n        strict,\n        **kwargs,\n    )\n\n    # Load baseline state dict\n    if load_baseline:\n        # setup baseline first\n        loaded.setup()\n        loaded.post_setup_hook()\n        # load baseline state dict\n        state_dict = torch.load(checkpoint_path, map_location=map_location)[\"state_dict\"]\n        # get only baseline parameters\n        state_dict = {k: v for k, v in state_dict.items() if \"baseline\" in k}\n        state_dict = {k.replace(\"baseline.\", \"\", 1): v for k, v in state_dict.items()}\n        loaded.baseline.load_state_dict(state_dict)\n\n    return cast(Self, loaded)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.REINFORCEBaseline","title":"REINFORCEBaseline","text":"
REINFORCEBaseline(*args, **kw)\n

Bases: Module

Base class for REINFORCE baselines

Methods:

  • wrap_dataset \u2013

    Wrap dataset with baseline-specific functionality

  • eval \u2013

    Evaluate baseline

  • epoch_callback \u2013

    Callback at the end of each epoch

  • setup \u2013

    To be called before training during setup phase

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, *args, **kw):\n    super().__init__()\n    pass\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.REINFORCEBaseline.wrap_dataset","title":"wrap_dataset","text":"
wrap_dataset(dataset: Dataset, *args, **kw)\n

Wrap dataset with baseline-specific functionality

Source code in rl4co/models/rl/reinforce/baselines.py
def wrap_dataset(self, dataset: Dataset, *args, **kw):\n    \"\"\"Wrap dataset with baseline-specific functionality\"\"\"\n    return dataset\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.REINFORCEBaseline.eval","title":"eval abstractmethod","text":"
eval(\n    td: TensorDict,\n    reward: Tensor,\n    env: RL4COEnvBase = None,\n    **kwargs\n)\n

Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
@abc.abstractmethod\ndef eval(\n    self, td: TensorDict, reward: torch.Tensor, env: RL4COEnvBase = None, **kwargs\n):\n    \"\"\"Evaluate baseline\"\"\"\n    raise NotImplementedError\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.REINFORCEBaseline.epoch_callback","title":"epoch_callback","text":"
epoch_callback(*args, **kw)\n

Callback at the end of each epoch. For example, update baseline parameters and obtain baseline values.

Source code in rl4co/models/rl/reinforce/baselines.py
def epoch_callback(self, *args, **kw):\n    \"\"\"Callback at the end of each epoch\n    For example, update baseline parameters and obtain baseline values\n    \"\"\"\n    pass\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.REINFORCEBaseline.setup","title":"setup","text":"
setup(*args, **kw)\n

To be called before training, during the setup phase. This follows PyTorch Lightning's setup() convention.

Source code in rl4co/models/rl/reinforce/baselines.py
def setup(self, *args, **kw):\n    \"\"\"To be called before training during setup phase\n    This follow PyTorch Lightning's setup() convention\n    \"\"\"\n    pass\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.NoBaseline","title":"NoBaseline","text":"
NoBaseline(*args, **kw)\n

Bases: REINFORCEBaseline

No baseline: return 0 for baseline and neg_loss

Methods:

  • eval \u2013

    Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, *args, **kw):\n    super().__init__()\n    pass\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.NoBaseline.eval","title":"eval","text":"
eval(td, reward, env=None)\n

Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def eval(self, td, reward, env=None):\n    return 0, 0  # No baseline, no neg_los\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.SharedBaseline","title":"SharedBaseline","text":"
SharedBaseline(*args, **kw)\n

Bases: REINFORCEBaseline

Shared baseline: return mean of reward as baseline

Methods:

  • eval \u2013

    Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, *args, **kw):\n    super().__init__()\n    pass\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.SharedBaseline.eval","title":"eval","text":"
eval(td, reward, env=None, on_dim=1)\n

Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def eval(self, td, reward, env=None, on_dim=1):  # e.g. [batch, pomo, ...]\n    return reward.mean(dim=on_dim, keepdims=True), 0\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.ExponentialBaseline","title":"ExponentialBaseline","text":"
ExponentialBaseline(beta=0.8, **kw)\n

Bases: REINFORCEBaseline

Exponential baseline: return exponential moving average of reward as baseline

Parameters:

  • beta \u2013

    Beta value for the exponential moving average

Methods:

  • eval \u2013

    Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, beta=0.8, **kw):\n    super(REINFORCEBaseline, self).__init__()\n\n    self.beta = beta\n    self.v = None\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.ExponentialBaseline.eval","title":"eval","text":"
eval(td, reward, env=None)\n

Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def eval(self, td, reward, env=None):\n    if self.v is None:\n        v = reward.mean()\n    else:\n        v = self.beta * self.v + (1.0 - self.beta) * reward.mean()\n    self.v = v.detach()  # Detach since we never want to backprop\n    return self.v, 0  # No loss\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.MeanBaseline","title":"MeanBaseline","text":"
MeanBaseline(*args, **kw)\n

Bases: REINFORCEBaseline

Mean baseline: return mean of reward as baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, *args, **kw):\n    super().__init__()\n    pass\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.WarmupBaseline","title":"WarmupBaseline","text":"
WarmupBaseline(\n    baseline, n_epochs=1, warmup_exp_beta=0.8, **kw\n)\n

Bases: REINFORCEBaseline

Warmup baseline: return convex combination of baseline and exponential baseline

Parameters:

  • baseline \u2013

    Baseline to use after warmup

  • n_epochs \u2013

    Number of epochs to warmup

  • warmup_exp_beta \u2013

    Beta value for the exponential baseline during warmup

Methods:

  • wrap_dataset \u2013

    Wrap dataset with baseline-specific functionality

  • setup \u2013

    To be called before training during setup phase

  • eval \u2013

    Evaluate baseline

  • epoch_callback \u2013

    Callback at the end of each epoch

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, baseline, n_epochs=1, warmup_exp_beta=0.8, **kw):\n    super(REINFORCEBaseline, self).__init__()\n\n    self.baseline = baseline\n    assert n_epochs > 0, \"n_epochs to warmup must be positive\"\n    self.warmup_baseline = ExponentialBaseline(warmup_exp_beta)\n    self.alpha = 0\n    self.n_epochs = n_epochs\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.WarmupBaseline.wrap_dataset","title":"wrap_dataset","text":"
wrap_dataset(dataset, *args, **kw)\n

Wrap dataset with baseline-specific functionality

Source code in rl4co/models/rl/reinforce/baselines.py
def wrap_dataset(self, dataset, *args, **kw):\n    if self.alpha > 0:\n        return self.baseline.wrap_dataset(dataset, *args, **kw)\n    return self.warmup_baseline.wrap_dataset(dataset, *args, **kw)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.WarmupBaseline.setup","title":"setup","text":"
setup(*args, **kw)\n

To be called before training, during the setup phase. This follows PyTorch Lightning's setup() convention.

Source code in rl4co/models/rl/reinforce/baselines.py
def setup(self, *args, **kw):\n    self.baseline.setup(*args, **kw)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.WarmupBaseline.eval","title":"eval","text":"
eval(td, reward, env=None)\n

Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def eval(self, td, reward, env=None):\n    if self.alpha == 1:\n        return self.baseline.eval(td, reward, env)\n    if self.alpha == 0:\n        return self.warmup_baseline.eval(td, reward, env)\n    v_b, l_b = self.baseline.eval(td, reward, env)\n    v_wb, l_wb = self.warmup_baseline.eval(td, reward, env)\n    # Return convex combination of baseline and of loss\n    return (\n        self.alpha * v_b + (1 - self.alpha) * v_wb,\n        self.alpha * l_b + (1 - self.alpha) * l_wb,\n    )\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.WarmupBaseline.epoch_callback","title":"epoch_callback","text":"
epoch_callback(*args, **kw)\n

Callback at the end of each epoch. For example, update baseline parameters and obtain baseline values.

Source code in rl4co/models/rl/reinforce/baselines.py
def epoch_callback(self, *args, **kw):\n    # Need to call epoch callback of inner policy (also after first epoch if we have not used it)\n    self.baseline.epoch_callback(*args, **kw)\n    if kw[\"epoch\"] < self.n_epochs:\n        self.alpha = (kw[\"epoch\"] + 1) / float(self.n_epochs)\n        log.info(\"Set warmup alpha = {}\".format(self.alpha))\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.CriticBaseline","title":"CriticBaseline","text":"
CriticBaseline(critic: CriticNetwork = None, **unused_kw)\n

Bases: REINFORCEBaseline

Critic baseline: use critic network as baseline

Parameters:

  • critic (CriticNetwork, default: None ) \u2013

    Critic network to use as baseline. If None, create a new critic network based on the environment

Methods:

  • setup \u2013

    To be called before training during setup phase

  • eval \u2013

    Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, critic: CriticNetwork = None, **unused_kw):\n    super(CriticBaseline, self).__init__()\n    self.critic = critic\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.CriticBaseline.setup","title":"setup","text":"
setup(policy, env, **kwargs)\n

To be called before training, during the setup phase. This follows PyTorch Lightning's setup() convention.

Source code in rl4co/models/rl/reinforce/baselines.py
def setup(self, policy, env, **kwargs):\n    if self.critic is None:\n        log.info(\"Critic not found. Creating critic network for {}\".format(env.name))\n        self.critic = create_critic_from_actor(policy)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.CriticBaseline.eval","title":"eval","text":"
eval(x, c, env=None)\n

Evaluate baseline

Source code in rl4co/models/rl/reinforce/baselines.py
def eval(self, x, c, env=None):\n    v = self.critic(x).squeeze(-1)\n    # detach v since actor should not backprop through baseline, only for loss\n    return v.detach(), F.mse_loss(v, c.detach())\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.RolloutBaseline","title":"RolloutBaseline","text":"
RolloutBaseline(bl_alpha=0.05, **kw)\n

Bases: REINFORCEBaseline

Rollout baseline: use greedy rollout as baseline

Parameters:

  • bl_alpha \u2013

    Alpha value for the baseline T-test

Methods:

  • setup \u2013

    To be called before training during setup phase

  • eval \u2013

    Evaluate rollout baseline

  • epoch_callback \u2013

    Challenges the current baseline with the policy and replaces the baseline policy if it is improved

  • rollout \u2013

    Rollout the policy on the given dataset

  • wrap_dataset \u2013

    Wrap the dataset in a baseline dataset

Source code in rl4co/models/rl/reinforce/baselines.py
def __init__(self, bl_alpha=0.05, **kw):\n    super(RolloutBaseline, self).__init__()\n    self.bl_alpha = bl_alpha\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.RolloutBaseline.setup","title":"setup","text":"
setup(*args, **kw)\n

To be called before training, during the setup phase. This follows PyTorch Lightning's setup() convention.

Source code in rl4co/models/rl/reinforce/baselines.py
def setup(self, *args, **kw):\n    self._update_policy(*args, **kw)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.RolloutBaseline.eval","title":"eval","text":"
eval(td, reward, env)\n

Evaluate rollout baseline

Warning

This is not differentiable and should only be used for evaluation. Also, it is recommended to use the rollout method directly instead of this method.

Source code in rl4co/models/rl/reinforce/baselines.py
def eval(self, td, reward, env):\n    \"\"\"Evaluate rollout baseline\n\n    Warning:\n        This is not differentiable and should only be used for evaluation.\n        Also, it is recommended to use the `rollout` method directly instead of this method.\n    \"\"\"\n    with torch.inference_mode():\n        reward = self.policy(td, env)[\"reward\"]\n    return reward, 0\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.RolloutBaseline.epoch_callback","title":"epoch_callback","text":"
epoch_callback(\n    policy,\n    env,\n    batch_size=64,\n    device=\"cpu\",\n    epoch=None,\n    dataset_size=None,\n)\n

Challenges the current baseline with the policy and replaces the baseline policy if it is improved

Source code in rl4co/models/rl/reinforce/baselines.py
def epoch_callback(\n    self, policy, env, batch_size=64, device=\"cpu\", epoch=None, dataset_size=None\n):\n    \"\"\"Challenges the current baseline with the policy and replaces the baseline policy if it is improved\"\"\"\n    log.info(\"Evaluating candidate policy on evaluation dataset\")\n    candidate_vals = self.rollout(policy, env, batch_size, device).cpu().numpy()\n    candidate_mean = candidate_vals.mean()\n\n    log.info(\n        \"Candidate mean: {:.3f}, Baseline mean: {:.3f}\".format(\n            candidate_mean, self.mean\n        )\n    )\n    if candidate_mean - self.mean > 0:\n        # Calc p value with inverse logic (costs)\n        t, p = ttest_rel(-candidate_vals, -self.bl_vals)\n\n        p_val = p / 2  # one-sided\n        assert t < 0, \"T-statistic should be negative\"\n        log.info(\"p-value: {:.3f}\".format(p_val))\n        if p_val < self.bl_alpha:\n            log.info(\"Updating baseline\")\n            self._update_policy(policy, env, batch_size, device, dataset_size)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.RolloutBaseline.rollout","title":"rollout","text":"
rollout(\n    policy, env, batch_size=64, device=\"cpu\", dataset=None\n)\n

Rollout the policy on the given dataset

Source code in rl4co/models/rl/reinforce/baselines.py
def rollout(self, policy, env, batch_size=64, device=\"cpu\", dataset=None):\n    \"\"\"Rollout the policy on the given dataset\"\"\"\n\n    # if dataset is None, use the dataset of the baseline\n    dataset = self.dataset if dataset is None else dataset\n\n    policy.eval()\n    policy = policy.to(device)\n\n    def eval_policy(batch):\n        with torch.inference_mode():\n            batch = env.reset(batch.to(device))\n            return policy(batch, env, decode_type=\"greedy\")[\"reward\"]\n\n    dl = DataLoader(dataset, batch_size=batch_size, collate_fn=dataset.collate_fn)\n\n    rewards = torch.cat([eval_policy(batch) for batch in dl], 0)\n    return rewards\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.RolloutBaseline.wrap_dataset","title":"wrap_dataset","text":"
wrap_dataset(\n    dataset, env, batch_size=64, device=\"cpu\", **kw\n)\n

Wrap the dataset in a baseline dataset

Note

This is an alternative to eval that does not require the policy to be passed at every call, but just once. Values are added to the dataset. This also allows for larger batch sizes since we evaluate the policy without gradients.

Source code in rl4co/models/rl/reinforce/baselines.py
def wrap_dataset(self, dataset, env, batch_size=64, device=\"cpu\", **kw):\n    \"\"\"Wrap the dataset in a baseline dataset\n\n    Note:\n        This is an alternative to `eval` that does not require the policy to be passed\n        at every call but just once. Values are added to the dataset. This also allows for\n        larger batch sizes since we evauate the policy without gradients.\n    \"\"\"\n    rewards = (\n        self.rollout(self.policy, env, batch_size, device, dataset=dataset)\n        .detach()\n        .cpu()\n    )\n    return dataset.add_key(\"extra\", rewards)\n
"},{"location":"docs/content/api/rl/reinforce/#models.rl.reinforce.baselines.get_reinforce_baseline","title":"get_reinforce_baseline","text":"
get_reinforce_baseline(name, **kw)\n

Get a REINFORCE baseline by name. The rollout baseline defaults to a warmup baseline: one epoch of exponential baseline, then the greedy rollout baseline.

Source code in rl4co/models/rl/reinforce/baselines.py
def get_reinforce_baseline(name, **kw):\n    \"\"\"Get a REINFORCE baseline by name\n    The rollout baseline default to warmup baseline with one epoch of\n    exponential baseline and the greedy rollout\n    \"\"\"\n    if name == \"warmup\":\n        inner_baseline = kw.get(\"baseline\", \"rollout\")\n        if not isinstance(inner_baseline, REINFORCEBaseline):\n            inner_baseline = get_reinforce_baseline(inner_baseline, **kw)\n        return WarmupBaseline(inner_baseline, **kw)\n    elif name == \"rollout\":\n        warmup_epochs = kw.get(\"n_epochs\", 1)\n        warmup_exp_beta = kw.get(\"exp_beta\", 0.8)\n        bl_alpha = kw.get(\"bl_alpha\", 0.05)\n        return WarmupBaseline(\n            RolloutBaseline(bl_alpha=bl_alpha), warmup_epochs, warmup_exp_beta\n        )\n\n    if name is None:\n        name = \"no\"  # default to no baseline\n    baseline_cls = REINFORCE_BASELINES_REGISTRY.get(name, None)\n    if baseline_cls is None:\n        raise ValueError(\n            f\"Unknown baseline {baseline_cls}. Available baselines: {REINFORCE_BASELINES_REGISTRY.keys()}\"\n        )\n    return baseline_cls(**kw)\n
"},{"location":"docs/content/api/zoo/constructive_ar/","title":"Constructive Autoregressive Methods","text":""},{"location":"docs/content/api/zoo/constructive_ar/#attention-model-am","title":"Attention Model (AM)","text":"

Classes:

  • AttentionModel \u2013

    Attention Model based on REINFORCE: https://arxiv.org/abs/1803.08475.

Classes:

  • AttentionModelPolicy \u2013

    Attention Model Policy based on Kool et al. (2019): https://arxiv.org/abs/1803.08475.

"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.am.model.AttentionModel","title":"AttentionModel","text":"
AttentionModel(\n    env: RL4COEnvBase,\n    policy: AttentionModelPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs\n)\n

Bases: REINFORCE

Attention Model based on REINFORCE: https://arxiv.org/abs/1803.08475. Check :class:REINFORCE and :class:rl4co.models.RL4COLitModule for more details such as additional parameters including batch size.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (AttentionModelPolicy, default: None ) \u2013

    Policy to use for the algorithm

  • baseline (Union[REINFORCEBaseline, str], default: 'rollout' ) \u2013

    REINFORCE baseline. Defaults to rollout (1 epoch of exponential, then greedy rollout baseline)

  • policy_kwargs \u2013

    Keyword arguments for policy

  • baseline_kwargs \u2013

    Keyword arguments for baseline

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Source code in rl4co/models/zoo/am/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: AttentionModelPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs,\n):\n    if policy is None:\n        policy = AttentionModelPolicy(env_name=env.name, **policy_kwargs)\n\n    super().__init__(env, policy, baseline, baseline_kwargs, **kwargs)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.am.policy.AttentionModelPolicy","title":"AttentionModelPolicy","text":"
AttentionModelPolicy(\n    encoder: Module = None,\n    decoder: Module = None,\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    feedforward_hidden: int = 512,\n    env_name: str = \"tsp\",\n    encoder_network: Module = None,\n    init_embedding: Module = None,\n    context_embedding: Module = None,\n    dynamic_embedding: Module = None,\n    use_graph_context: bool = True,\n    linear_bias_decoder: bool = False,\n    sdpa_fn: Callable = None,\n    sdpa_fn_encoder: Callable = None,\n    sdpa_fn_decoder: Callable = None,\n    mask_inner: bool = True,\n    out_bias_pointer_attn: bool = False,\n    check_nan: bool = True,\n    temperature: float = 1.0,\n    tanh_clipping: float = 10.0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    moe_kwargs: dict = {\"encoder\": None, \"decoder\": None},\n    **unused_kwargs\n)\n

Bases: AutoregressivePolicy

Attention Model Policy based on Kool et al. (2019): https://arxiv.org/abs/1803.08475. This model first encodes the input graph using a Graph Attention Network (GAT) (:class:AttentionModelEncoder) and then decodes the solution using a pointer network (:class:AttentionModelDecoder). Cache is used to store the embeddings of the nodes to be used by the decoder to save computation. See :class:rl4co.models.common.constructive.autoregressive.policy.AutoregressivePolicy for more details on the inference process.

Parameters:

  • encoder (Module, default: None ) \u2013

    Encoder module, defaults to :class:AttentionModelEncoder

  • decoder (Module, default: None ) \u2013

    Decoder module, defaults to :class:AttentionModelDecoder

  • embed_dim (int, default: 128 ) \u2013

    Dimension of the node embeddings

  • num_encoder_layers (int, default: 3 ) \u2013

    Number of layers in the encoder

  • num_heads (int, default: 8 ) \u2013

    Number of heads in the attention layers

  • normalization (str, default: 'batch' ) \u2013

    Normalization type in the attention layers

  • feedforward_hidden (int, default: 512 ) \u2013

    Dimension of the hidden layer in the feedforward network

  • env_name (str, default: 'tsp' ) \u2013

    Name of the environment used to initialize embeddings

  • encoder_network (Module, default: None ) \u2013

    Network to use for the encoder

  • init_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the embeddings

  • context_embedding (Module, default: None ) \u2013

    Module to use for the context embedding

  • dynamic_embedding (Module, default: None ) \u2013

    Module to use for the dynamic embedding

  • use_graph_context (bool, default: True ) \u2013

    Whether to use the graph context

  • linear_bias_decoder (bool, default: False ) \u2013

    Whether to use a bias in the linear layer of the decoder

  • sdpa_fn_encoder (Callable, default: None ) \u2013

    Function to use for the scaled dot product attention in the encoder

  • sdpa_fn_decoder (Callable, default: None ) \u2013

    Function to use for the scaled dot product attention in the decoder

  • sdpa_fn (Callable, default: None ) \u2013

    (deprecated) Function to use for the scaled dot product attention

  • mask_inner (bool, default: True ) \u2013

    Whether to mask the inner product

  • out_bias_pointer_attn (bool, default: False ) \u2013

    Whether to use a bias in the pointer attention

  • check_nan (bool, default: True ) \u2013

    Whether to check for nan values during decoding

  • temperature (float, default: 1.0 ) \u2013

    Temperature for the softmax

  • tanh_clipping (float, default: 10.0 ) \u2013

    Tanh clipping value (see Bello et al., 2016)

  • mask_logits (bool, default: True ) \u2013

    Whether to mask the logits during decoding

  • train_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during training

  • val_decode_type (str, default: 'greedy' ) \u2013

    Type of decoding to use during validation

  • test_decode_type (str, default: 'greedy' ) \u2013

    Type of decoding to use during testing

  • moe_kwargs (dict, default: {'encoder': None, 'decoder': None} ) \u2013

    Keyword arguments for MoE, e.g., {\"encoder\": {\"hidden_act\": \"ReLU\", \"num_experts\": 4, \"k\": 2, \"noisy_gating\": True}, \"decoder\": {\"light_version\": True, ...}}

Source code in rl4co/models/zoo/am/policy.py
def __init__(\n    self,\n    encoder: nn.Module = None,\n    decoder: nn.Module = None,\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    feedforward_hidden: int = 512,\n    env_name: str = \"tsp\",\n    encoder_network: nn.Module = None,\n    init_embedding: nn.Module = None,\n    context_embedding: nn.Module = None,\n    dynamic_embedding: nn.Module = None,\n    use_graph_context: bool = True,\n    linear_bias_decoder: bool = False,\n    sdpa_fn: Callable = None,\n    sdpa_fn_encoder: Callable = None,\n    sdpa_fn_decoder: Callable = None,\n    mask_inner: bool = True,\n    out_bias_pointer_attn: bool = False,\n    check_nan: bool = True,\n    temperature: float = 1.0,\n    tanh_clipping: float = 10.0,\n    mask_logits: bool = True,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"greedy\",\n    test_decode_type: str = \"greedy\",\n    moe_kwargs: dict = {\"encoder\": None, \"decoder\": None},\n    **unused_kwargs,\n):\n    if encoder is None:\n        encoder = AttentionModelEncoder(\n            embed_dim=embed_dim,\n            num_heads=num_heads,\n            num_layers=num_encoder_layers,\n            env_name=env_name,\n            normalization=normalization,\n            feedforward_hidden=feedforward_hidden,\n            net=encoder_network,\n            init_embedding=init_embedding,\n            sdpa_fn=sdpa_fn if sdpa_fn_encoder is None else sdpa_fn_encoder,\n            moe_kwargs=moe_kwargs[\"encoder\"],\n        )\n\n    if decoder is None:\n        decoder = AttentionModelDecoder(\n            embed_dim=embed_dim,\n            num_heads=num_heads,\n            env_name=env_name,\n            context_embedding=context_embedding,\n            dynamic_embedding=dynamic_embedding,\n            sdpa_fn=sdpa_fn if sdpa_fn_decoder is None else sdpa_fn_decoder,\n            mask_inner=mask_inner,\n            
out_bias_pointer_attn=out_bias_pointer_attn,\n            linear_bias=linear_bias_decoder,\n            use_graph_context=use_graph_context,\n            check_nan=check_nan,\n            moe_kwargs=moe_kwargs[\"decoder\"],\n        )\n\n    super(AttentionModelPolicy, self).__init__(\n        encoder=encoder,\n        decoder=decoder,\n        env_name=env_name,\n        temperature=temperature,\n        tanh_clipping=tanh_clipping,\n        mask_logits=mask_logits,\n        train_decode_type=train_decode_type,\n        val_decode_type=val_decode_type,\n        test_decode_type=test_decode_type,\n        **unused_kwargs,\n    )\n
"},{"location":"docs/content/api/zoo/constructive_ar/#attention-model-ppo-am-ppo","title":"Attention Model - PPO (AM-PPO)","text":"

Classes:

  • AMPPO \u2013

    PPO Model based on Proximal Policy Optimization (PPO) with an attention model policy.

"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.amppo.model.AMPPO","title":"AMPPO","text":"
AMPPO(\n    env: RL4COEnvBase,\n    policy: Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs\n)\n

Bases: PPO

PPO Model based on Proximal Policy Optimization (PPO) with an attention model policy. We default to the attention model policy and the Attention Critic Network.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (Module, default: None ) \u2013

    Policy to use for the algorithm

  • critic (CriticNetwork, default: None ) \u2013

    Critic to use for the algorithm

  • policy_kwargs (dict, default: {} ) \u2013

    Keyword arguments for policy

  • critic_kwargs (dict, default: {} ) \u2013

    Keyword arguments for critic

Source code in rl4co/models/zoo/amppo/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs,\n):\n    if policy is None:\n        policy = AttentionModelPolicy(env_name=env.name, **policy_kwargs)\n\n    if critic is None:\n        log.info(\"Creating critic network for {}\".format(env.name))\n        # we reuse the parameters of the model\n        encoder = getattr(policy, \"encoder\", None)\n        if encoder is None:\n            raise ValueError(\"Critic network requires an encoder\")\n        critic = CriticNetwork(\n            copy.deepcopy(encoder).to(next(encoder.parameters()).device),\n            **critic_kwargs,\n        )\n\n    super().__init__(env, policy, critic, **kwargs)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#heterogeneous-attention-model-ham","title":"Heterogeneous Attention Model (HAM)","text":"

Classes:

  • HeterogeneousAttentionModel \u2013

    Heterogeneous Attention Model for solving the Pickup and Delivery Problem based on REINFORCE: https://arxiv.org/abs/2110.02634.

Classes:

  • HeterogeneousAttentionModelPolicy \u2013

    Heterogeneous Attention Model Policy based on https://ieeexplore.ieee.org/document/9352489.

Classes:

  • HeterogenousMHA \u2013
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ham.model.HeterogeneousAttentionModel","title":"HeterogeneousAttentionModel","text":"
HeterogeneousAttentionModel(\n    env: RL4COEnvBase,\n    policy: HeterogeneousAttentionModelPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs\n)\n

Bases: REINFORCE

Heterogeneous Attention Model for solving the Pickup and Delivery Problem based on REINFORCE: https://arxiv.org/abs/2110.02634.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (HeterogeneousAttentionModelPolicy, default: None ) \u2013

    Policy to use for the algorithm

  • baseline (Union[REINFORCEBaseline, str], default: 'rollout' ) \u2013

    REINFORCE baseline. Defaults to rollout (1 epoch of exponential, then greedy rollout baseline)

  • policy_kwargs \u2013

    Keyword arguments for policy

  • baseline_kwargs \u2013

    Keyword arguments for baseline

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Source code in rl4co/models/zoo/ham/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: HeterogeneousAttentionModelPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs,\n):\n    assert (\n        env.name == \"pdp\"\n    ), \"HeterogeneousAttentionModel only works for PDP (Pickup and Delivery Problem)\"\n    if policy is None:\n        policy = HeterogeneousAttentionModelPolicy(env_name=env.name, **policy_kwargs)\n\n    super().__init__(env, policy, baseline, baseline_kwargs, **kwargs)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ham.policy.HeterogeneousAttentionModelPolicy","title":"HeterogeneousAttentionModelPolicy","text":"
HeterogeneousAttentionModelPolicy(\n    encoder: Module = None,\n    env_name: str = \"pdp\",\n    init_embedding: Module = None,\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    feedforward_hidden: int = 512,\n    sdpa_fn: Optional[Callable] = None,\n    **kwargs\n)\n

Bases: AttentionModelPolicy

Heterogeneous Attention Model Policy based on https://ieeexplore.ieee.org/document/9352489. We re-declare the most important arguments here for convenience as in the paper. See :class:rl4co.models.zoo.am.AttentionModelPolicy for more details.

Parameters:

  • encoder (Module, default: None ) \u2013

    Encoder module. Can be passed by sub-classes

  • env_name (str, default: 'pdp' ) \u2013

    Name of the environment used to initialize embeddings

  • init_embedding (Module, default: None ) \u2013

    Model to use for the initial embedding. If None, use the default embedding for the environment

  • embed_dim (int, default: 128 ) \u2013

    Dimension of the embeddings

  • num_encoder_layers (int, default: 3 ) \u2013

    Number of layers in the encoder

  • num_heads (int, default: 8 ) \u2013

    Number of heads for the attention in encoder

  • normalization (str, default: 'batch' ) \u2013

    Normalization to use for the attention layers

  • feedforward_hidden (int, default: 512 ) \u2013

    Dimension of the hidden layer in the feedforward network

  • sdpa_fn (Optional[Callable], default: None ) \u2013

    Function to use for the scaled dot product attention

  • **kwargs \u2013

    keyword arguments passed to the :class:rl4co.models.zoo.am.AttentionModelPolicy

Source code in rl4co/models/zoo/ham/policy.py
def __init__(\n    self,\n    encoder: nn.Module = None,\n    env_name: str = \"pdp\",\n    init_embedding: nn.Module = None,\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    feedforward_hidden: int = 512,\n    sdpa_fn: Optional[Callable] = None,\n    **kwargs,\n):\n    if encoder is None:\n        encoder = GraphHeterogeneousAttentionEncoder(\n            init_embedding=init_embedding,\n            num_heads=num_heads,\n            embed_dim=embed_dim,\n            num_encoder_layers=num_encoder_layers,\n            env_name=env_name,\n            normalization=normalization,\n            feedforward_hidden=feedforward_hidden,\n            sdpa_fn=sdpa_fn,\n        )\n    else:\n        encoder = encoder\n\n    super(HeterogeneousAttentionModelPolicy, self).__init__(\n        env_name=env_name,\n        encoder=encoder,\n        embed_dim=embed_dim,\n        num_encoder_layers=num_encoder_layers,\n        num_heads=num_heads,\n        normalization=normalization,\n        **kwargs,\n    )\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ham.attention.HeterogenousMHA","title":"HeterogenousMHA","text":"
HeterogenousMHA(\n    num_heads,\n    input_dim,\n    embed_dim=None,\n    val_dim=None,\n    key_dim=None,\n)\n

Bases: Module

Methods:

  • forward \u2013

    Forward pass of the heterogeneous multi-head attention (see parameters below).

Source code in rl4co/models/zoo/ham/attention.py
def __init__(self, num_heads, input_dim, embed_dim=None, val_dim=None, key_dim=None):\n    \"\"\"\n    Heterogenous Multi-Head Attention for Pickup and Delivery problems\n    https://arxiv.org/abs/2110.02634\n    \"\"\"\n    super(HeterogenousMHA, self).__init__()\n\n    if val_dim is None:\n        assert embed_dim is not None, \"Provide either embed_dim or val_dim\"\n        val_dim = embed_dim // num_heads\n    if key_dim is None:\n        key_dim = val_dim\n\n    self.num_heads = num_heads\n    self.input_dim = input_dim\n    self.embed_dim = embed_dim\n    self.val_dim = val_dim\n    self.key_dim = key_dim\n\n    self.norm_factor = 1 / math.sqrt(key_dim)  # See Attention is all you need\n\n    self.W_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n    self.W_key = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n    self.W_val = nn.Parameter(torch.Tensor(num_heads, input_dim, val_dim))\n\n    # Pickup weights\n    self.W1_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n    self.W2_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n    self.W3_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n\n    # Delivery weights\n    self.W4_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n    self.W5_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n    self.W6_query = nn.Parameter(torch.Tensor(num_heads, input_dim, key_dim))\n\n    if embed_dim is not None:\n        self.W_out = nn.Parameter(torch.Tensor(num_heads, key_dim, embed_dim))\n\n    self.init_parameters()\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ham.attention.HeterogenousMHA.forward","title":"forward","text":"
forward(q, h=None, mask=None)\n

Parameters:

  • q \u2013

    queries (batch_size, n_query, input_dim)

  • h \u2013

    data (batch_size, graph_size, input_dim)

  • mask \u2013

    mask (batch_size, n_query, graph_size) or viewable as that (i.e. can be 2 dim if n_query == 1)

Mask should contain 1 if attention is not possible (i.e. mask is negative adjacency)

Source code in rl4co/models/zoo/ham/attention.py
def forward(self, q, h=None, mask=None):\n    \"\"\"\n    Args:\n        q: queries (batch_size, n_query, input_dim)\n        h: data (batch_size, graph_size, input_dim)\n        mask: mask (batch_size, n_query, graph_size) or viewable as that (i.e. can be 2 dim if n_query == 1)\n\n    Mask should contain 1 if attention is not possible (i.e. mask is negative adjacency)\n    \"\"\"\n    if h is None:\n        h = q  # compute self-attention\n\n    # h should be (batch_size, graph_size, input_dim)\n    batch_size, graph_size, input_dim = h.size()\n\n    # Check if graph size is odd number\n    assert (\n        graph_size % 2 == 1\n    ), \"Graph size should have odd number of nodes due to pickup-delivery problem  \\\n                                 (n/2 pickup, n/2 delivery, 1 depot)\"\n\n    n_query = q.size(1)\n    assert q.size(0) == batch_size\n    assert q.size(2) == input_dim\n    assert input_dim == self.input_dim, \"Wrong embedding dimension of input\"\n\n    hflat = h.contiguous().view(-1, input_dim)  # [batch_size * graph_size, embed_dim]\n    qflat = q.contiguous().view(-1, input_dim)  # [batch_size * n_query, embed_dim]\n\n    # last dimension can be different for keys and values\n    shp = (self.num_heads, batch_size, graph_size, -1)\n    shp_q = (self.num_heads, batch_size, n_query, -1)\n\n    # pickup -> its delivery attention\n    n_pick = (graph_size - 1) // 2\n    shp_delivery = (self.num_heads, batch_size, n_pick, -1)\n    shp_q_pick = (self.num_heads, batch_size, n_pick, -1)\n\n    # pickup -> all pickups attention\n    shp_allpick = (self.num_heads, batch_size, n_pick, -1)\n    shp_q_allpick = (self.num_heads, batch_size, n_pick, -1)\n\n    # pickup -> all pickups attention\n    shp_alldelivery = (self.num_heads, batch_size, n_pick, -1)\n    shp_q_alldelivery = (self.num_heads, batch_size, n_pick, -1)\n\n    # Calculate queries, (num_heads, n_query, graph_size, key/val_size)\n    Q = torch.matmul(qflat, self.W_query).view(shp_q)\n    # 
Calculate keys and values (num_heads, batch_size, graph_size, key/val_size)\n    K = torch.matmul(hflat, self.W_key).view(shp)\n    V = torch.matmul(hflat, self.W_val).view(shp)\n\n    # pickup -> its delivery\n    pick_flat = (\n        h[:, 1 : n_pick + 1, :].contiguous().view(-1, input_dim)\n    )  # [batch_size * n_pick, embed_dim]\n    delivery_flat = (\n        h[:, n_pick + 1 :, :].contiguous().view(-1, input_dim)\n    )  # [batch_size * n_pick, embed_dim]\n\n    # pickup -> its delivery attention\n    Q_pick = torch.matmul(pick_flat, self.W1_query).view(\n        shp_q_pick\n    )  # (self.num_heads, batch_size, n_pick, key_size)\n    K_delivery = torch.matmul(delivery_flat, self.W_key).view(\n        shp_delivery\n    )  # (self.num_heads, batch_size, n_pick, -1)\n    V_delivery = torch.matmul(delivery_flat, self.W_val).view(\n        shp_delivery\n    )  # (num_heads, batch_size, n_pick, key/val_size)\n\n    # pickup -> all pickups attention\n    Q_pick_allpick = torch.matmul(pick_flat, self.W2_query).view(\n        shp_q_allpick\n    )  # (self.num_heads, batch_size, n_pick, -1)\n    K_allpick = torch.matmul(pick_flat, self.W_key).view(\n        shp_allpick\n    )  # [self.num_heads, batch_size, n_pick, key_size]\n    V_allpick = torch.matmul(pick_flat, self.W_val).view(\n        shp_allpick\n    )  # [self.num_heads, batch_size, n_pick, key_size]\n\n    # pickup -> all delivery\n    Q_pick_alldelivery = torch.matmul(pick_flat, self.W3_query).view(\n        shp_q_alldelivery\n    )  # (self.num_heads, batch_size, n_pick, key_size)\n    K_alldelivery = torch.matmul(delivery_flat, self.W_key).view(\n        shp_alldelivery\n    )  # (self.num_heads, batch_size, n_pick, -1)\n    V_alldelivery = torch.matmul(delivery_flat, self.W_val).view(\n        shp_alldelivery\n    )  # (num_heads, batch_size, n_pick, key/val_size)\n\n    # pickup -> its delivery\n    V_additional_delivery = torch.cat(\n        [  # [num_heads, batch_size, graph_size, key_size]\n        
    torch.zeros(\n                self.num_heads,\n                batch_size,\n                1,\n                self.input_dim // self.num_heads,\n                dtype=V.dtype,\n                device=V.device,\n            ),\n            V_delivery,  # [num_heads, batch_size, n_pick, key/val_size]\n            torch.zeros(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                self.input_dim // self.num_heads,\n                dtype=V.dtype,\n                device=V.device,\n            ),\n        ],\n        2,\n    )\n\n    # delivery -> its pickup attention\n    Q_delivery = torch.matmul(delivery_flat, self.W4_query).view(\n        shp_delivery\n    )  # (self.num_heads, batch_size, n_pick, key_size)\n    K_pick = torch.matmul(pick_flat, self.W_key).view(\n        shp_q_pick\n    )  # (self.num_heads, batch_size, n_pick, -1)\n    V_pick = torch.matmul(pick_flat, self.W_val).view(\n        shp_q_pick\n    )  # (num_heads, batch_size, n_pick, key/val_size)\n\n    # delivery -> all delivery attention\n    Q_delivery_alldelivery = torch.matmul(delivery_flat, self.W5_query).view(\n        shp_alldelivery\n    )  # (self.num_heads, batch_size, n_pick, -1)\n    K_alldelivery2 = torch.matmul(delivery_flat, self.W_key).view(\n        shp_alldelivery\n    )  # [self.num_heads, batch_size, n_pick, key_size]\n    V_alldelivery2 = torch.matmul(delivery_flat, self.W_val).view(\n        shp_alldelivery\n    )  # [self.num_heads, batch_size, n_pick, key_size]\n\n    # delivery -> all pickup\n    Q_delivery_allpickup = torch.matmul(delivery_flat, self.W6_query).view(\n        shp_alldelivery\n    )  # (self.num_heads, batch_size, n_pick, key_size)\n    K_allpickup2 = torch.matmul(pick_flat, self.W_key).view(\n        shp_q_alldelivery\n    )  # (self.num_heads, batch_size, n_pick, -1)\n    V_allpickup2 = torch.matmul(pick_flat, self.W_val).view(\n        shp_q_alldelivery\n    )  # (num_heads, batch_size, n_pick, 
key/val_size)\n\n    # delivery -> its pick up\n    V_additional_pick = torch.cat(\n        [  # [num_heads, batch_size, graph_size, key_size]\n            torch.zeros(\n                self.num_heads,\n                batch_size,\n                1,\n                self.input_dim // self.num_heads,\n                dtype=V.dtype,\n                device=V.device,\n            ),\n            torch.zeros(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                self.input_dim // self.num_heads,\n                dtype=V.dtype,\n                device=V.device,\n            ),\n            V_pick,  # [num_heads, batch_size, n_pick, key/val_size]\n        ],\n        2,\n    )\n\n    # Calculate compatibility (num_heads, batch_size, n_query, graph_size)\n    compatibility = self.norm_factor * torch.matmul(Q, K.transpose(2, 3))\n\n    ##Pick up pair attention\n    compatibility_pick_delivery = self.norm_factor * torch.sum(\n        Q_pick * K_delivery, -1\n    )  # element_wise, [num_heads, batch_size, n_pick]\n    # [num_heads, batch_size, n_pick, n_pick]\n    compatibility_pick_allpick = self.norm_factor * torch.matmul(\n        Q_pick_allpick, K_allpick.transpose(2, 3)\n    )  # [num_heads, batch_size, n_pick, n_pick]\n    compatibility_pick_alldelivery = self.norm_factor * torch.matmul(\n        Q_pick_alldelivery, K_alldelivery.transpose(2, 3)\n    )  # [num_heads, batch_size, n_pick, n_pick]\n\n    ##Delivery\n    compatibility_delivery_pick = self.norm_factor * torch.sum(\n        Q_delivery * K_pick, -1\n    )  # element_wise, [num_heads, batch_size, n_pick]\n    compatibility_delivery_alldelivery = self.norm_factor * torch.matmul(\n        Q_delivery_alldelivery, K_alldelivery2.transpose(2, 3)\n    )  # [num_heads, batch_size, n_pick, n_pick]\n    compatibility_delivery_allpick = self.norm_factor * torch.matmul(\n        Q_delivery_allpickup, K_allpickup2.transpose(2, 3)\n    )  # [num_heads, batch_size, n_pick, 
n_pick]\n\n    ##Pick up->\n    # compatibility_additional?pickup????delivery????attention(size 1),1:n_pick+1??attention,depot?delivery??\n    compatibility_additional_delivery = torch.cat(\n        [  # [num_heads, batch_size, graph_size, 1]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                1,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            compatibility_pick_delivery,  # [num_heads, batch_size, n_pick]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n        ],\n        -1,\n    ).view(self.num_heads, batch_size, graph_size, 1)\n\n    compatibility_additional_allpick = torch.cat(\n        [  # [num_heads, batch_size, graph_size, n_pick]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                1,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            compatibility_pick_allpick,  # [num_heads, batch_size, n_pick, n_pick]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n        ],\n        2,\n    ).view(self.num_heads, batch_size, graph_size, n_pick)\n\n    compatibility_additional_alldelivery = torch.cat(\n        [  # [num_heads, batch_size, graph_size, n_pick]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                1,\n                n_pick,\n      
          dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            compatibility_pick_alldelivery,  # [num_heads, batch_size, n_pick, n_pick]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n        ],\n        2,\n    ).view(self.num_heads, batch_size, graph_size, n_pick)\n    # [num_heads, batch_size, n_query, graph_size+1+n_pick+n_pick]\n\n    # Delivery\n    compatibility_additional_pick = torch.cat(\n        [  # [num_heads, batch_size, graph_size, 1]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                1,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            compatibility_delivery_pick,  # [num_heads, batch_size, n_pick]\n        ],\n        -1,\n    ).view(self.num_heads, batch_size, graph_size, 1)\n\n    compatibility_additional_alldelivery2 = torch.cat(\n        [  # [num_heads, batch_size, graph_size, n_pick]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                1,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                n_pick,\n                dtype=compatibility.dtype,\n                
device=compatibility.device,\n            ),\n            compatibility_delivery_alldelivery,  # [num_heads, batch_size, n_pick, n_pick]\n        ],\n        2,\n    ).view(self.num_heads, batch_size, graph_size, n_pick)\n\n    compatibility_additional_allpick2 = torch.cat(\n        [  # [num_heads, batch_size, graph_size, n_pick]\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                1,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            float(\"-inf\")\n            * torch.ones(\n                self.num_heads,\n                batch_size,\n                n_pick,\n                n_pick,\n                dtype=compatibility.dtype,\n                device=compatibility.device,\n            ),\n            compatibility_delivery_allpick,  # [num_heads, batch_size, n_pick, n_pick]\n        ],\n        2,\n    ).view(self.num_heads, batch_size, graph_size, n_pick)\n\n    compatibility = torch.cat(\n        [\n            compatibility,\n            compatibility_additional_delivery,\n            compatibility_additional_allpick,\n            compatibility_additional_alldelivery,\n            compatibility_additional_pick,\n            compatibility_additional_alldelivery2,\n            compatibility_additional_allpick2,\n        ],\n        dim=-1,\n    )\n\n    # Optionally apply mask to prevent attention\n    if mask is not None:\n        mask = mask.view(1, batch_size, n_query, graph_size).expand_as(compatibility)\n        compatibility[mask] = float(\"-inf\")\n\n    attn = torch.softmax(\n        compatibility, dim=-1\n    )  # [num_heads, batch_size, n_query, graph_size+1+n_pick*2] (graph_size include depot)\n\n    # If there are nodes with no neighbours then softmax returns nan so we fix them to 0\n    if mask is not None:\n        attnc = attn.clone()\n        attnc[mask] = 0\n        attn 
= attnc\n\n    # heads: [num_heads, batrch_size, n_query, val_size] pick -> its delivery\n    heads = torch.matmul(\n        attn[:, :, :, :graph_size], V\n    )  # V: (self.num_heads, batch_size, graph_size, val_size)\n    heads = (\n        heads\n        + attn[:, :, :, graph_size].view(self.num_heads, batch_size, graph_size, 1)\n        * V_additional_delivery\n    )  # V_addi:[num_heads, batch_size, graph_size, key_size]\n\n    # Heads pick -> otherpick, V_allpick: # [num_heads, batch_size, n_pick, key_size]\n    heads = heads + torch.matmul(\n        attn[:, :, :, graph_size + 1 : graph_size + 1 + n_pick].view(\n            self.num_heads, batch_size, graph_size, n_pick\n        ),\n        V_allpick,\n    )\n\n    # V_alldelivery: # (num_heads, batch_size, n_pick, key/val_size)\n    heads = heads + torch.matmul(\n        attn[:, :, :, graph_size + 1 + n_pick : graph_size + 1 + 2 * n_pick].view(\n            self.num_heads, batch_size, graph_size, n_pick\n        ),\n        V_alldelivery,\n    )\n\n    # Delivery\n    heads = (\n        heads\n        + attn[:, :, :, graph_size + 1 + 2 * n_pick].view(\n            self.num_heads, batch_size, graph_size, 1\n        )\n        * V_additional_pick\n    )\n    heads = heads + torch.matmul(\n        attn[\n            :,\n            :,\n            :,\n            graph_size + 1 + 2 * n_pick + 1 : graph_size + 1 + 3 * n_pick + 1,\n        ].view(self.num_heads, batch_size, graph_size, n_pick),\n        V_alldelivery2,\n    )\n    heads = heads + torch.matmul(\n        attn[:, :, :, graph_size + 1 + 3 * n_pick + 1 :].view(\n            self.num_heads, batch_size, graph_size, n_pick\n        ),\n        V_allpickup2,\n    )\n\n    out = torch.mm(\n        heads.permute(1, 2, 0, 3)\n        .contiguous()\n        .view(-1, self.num_heads * self.val_dim),\n        self.W_out.view(-1, self.embed_dim),\n    ).view(batch_size, n_query, self.embed_dim)\n\n    return out\n
"},{"location":"docs/content/api/zoo/constructive_ar/#matrix-encoding-network-matnet","title":"Matrix Encoding Network (MatNet)","text":"

Classes:

  • MatNetPolicy \u2013

    MatNet Policy from Kwon et al., 2021.

  • MultiStageFFSPPolicy \u2013

    Policy for solving the FFSP using a separate encoder and decoder for each

Classes:

  • MixedScoresSDPA \u2013
  • MatNetMHA \u2013
  • MatNetLayer \u2013

Classes:

  • MultiStageFFSPDecoder \u2013

    Decoder class for solving the FFSP using a separate MatNet decoder for each stage

"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.policy.MatNetPolicy","title":"MatNetPolicy","text":"
MatNetPolicy(\n    env_name: str = \"atsp\",\n    embed_dim: int = 256,\n    num_encoder_layers: int = 5,\n    num_heads: int = 16,\n    normalization: str = \"instance\",\n    init_embedding_kwargs: dict = {\"mode\": \"RandomOneHot\"},\n    use_graph_context: bool = False,\n    bias: bool = False,\n    **kwargs\n)\n

Bases: AutoregressivePolicy

MatNet Policy from Kwon et al., 2021. Reference: https://arxiv.org/abs/2106.11113

Warning

This implementation is under development and subject to change.

Parameters:

  • env_name (str, default: 'atsp' ) \u2013

    Name of the environment used to initialize embeddings

  • embed_dim (int, default: 256 ) \u2013

    Dimension of the node embeddings

  • num_encoder_layers (int, default: 5 ) \u2013

    Number of layers in the encoder

  • num_heads (int, default: 16 ) \u2013

    Number of heads in the attention layers

  • normalization (str, default: 'instance' ) \u2013

    Normalization type in the attention layers

  • **kwargs \u2013

    keyword arguments passed to the AutoregressivePolicy

Default parameters are adopted from the original implementation.

Source code in rl4co/models/zoo/matnet/policy.py
def __init__(\n    self,\n    env_name: str = \"atsp\",\n    embed_dim: int = 256,\n    num_encoder_layers: int = 5,\n    num_heads: int = 16,\n    normalization: str = \"instance\",\n    init_embedding_kwargs: dict = {\"mode\": \"RandomOneHot\"},\n    use_graph_context: bool = False,\n    bias: bool = False,\n    **kwargs,\n):\n    if env_name not in [\"atsp\", \"ffsp\"]:\n        log.error(f\"env_name {env_name} is not originally implemented in MatNet\")\n\n    if env_name == \"ffsp\":\n        decoder = MatNetFFSPDecoder(\n            embed_dim=embed_dim,\n            num_heads=num_heads,\n            use_graph_context=use_graph_context,\n            out_bias=True,\n        )\n\n    else:\n        decoder = MatNetDecoder(\n            env_name=env_name,\n            embed_dim=embed_dim,\n            num_heads=num_heads,\n            use_graph_context=use_graph_context,\n        )\n\n    super(MatNetPolicy, self).__init__(\n        env_name=env_name,\n        encoder=MatNetEncoder(\n            embed_dim=embed_dim,\n            num_heads=num_heads,\n            num_layers=num_encoder_layers,\n            normalization=normalization,\n            init_embedding_kwargs=init_embedding_kwargs,\n            bias=bias,\n        ),\n        decoder=decoder,\n        embed_dim=embed_dim,\n        num_encoder_layers=num_encoder_layers,\n        num_heads=num_heads,\n        normalization=normalization,\n        **kwargs,\n    )\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.policy.MultiStageFFSPPolicy","title":"MultiStageFFSPPolicy","text":"
MultiStageFFSPPolicy(\n    stage_cnt: int,\n    embed_dim: int = 512,\n    num_heads: int = 16,\n    num_encoder_layers: int = 5,\n    use_graph_context: bool = False,\n    normalization: str = \"instance\",\n    feedforward_hidden: int = 512,\n    bias: bool = False,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n)\n

Bases: Module

Policy for solving the FFSP using a separate encoder and decoder for each stage. This requires the 'while not td[\"done\"].all()'-loop to be on policy level (instead of decoder level).

Source code in rl4co/models/zoo/matnet/policy.py
def __init__(\n    self,\n    stage_cnt: int,\n    embed_dim: int = 512,\n    num_heads: int = 16,\n    num_encoder_layers: int = 5,\n    use_graph_context: bool = False,\n    normalization: str = \"instance\",\n    feedforward_hidden: int = 512,\n    bias: bool = False,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n):\n    super().__init__()\n    self.stage_cnt = stage_cnt\n\n    self.encoders: List[MatNetEncoder] = nn.ModuleList(\n        [\n            MatNetEncoder(\n                embed_dim=embed_dim,\n                num_heads=num_heads,\n                num_layers=num_encoder_layers,\n                normalization=normalization,\n                feedforward_hidden=feedforward_hidden,\n                bias=bias,\n                init_embedding_kwargs={\"mode\": \"RandomOneHot\"},\n            )\n            for _ in range(self.stage_cnt)\n        ]\n    )\n    self.decoders: List[MultiStageFFSPDecoder] = nn.ModuleList(\n        [\n            MultiStageFFSPDecoder(embed_dim, num_heads, use_graph_context)\n            for _ in range(self.stage_cnt)\n        ]\n    )\n\n    self.train_decode_type = train_decode_type\n    self.val_decode_type = val_decode_type\n    self.test_decode_type = test_decode_type\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.encoder.MixedScoresSDPA","title":"MixedScoresSDPA","text":"
MixedScoresSDPA(\n    num_heads: int,\n    num_scores: int = 1,\n    mixer_hidden_dim: int = 16,\n    mix1_init: float = (1 / 2) ** (1 / 2),\n    mix2_init: float = (1 / 16) ** (1 / 2),\n)\n

Bases: Module

Methods:

  • forward \u2013

    Scaled Dot-Product Attention with MatNet Scores Mixer

Source code in rl4co/models/zoo/matnet/encoder.py
def __init__(\n    self,\n    num_heads: int,\n    num_scores: int = 1,\n    mixer_hidden_dim: int = 16,\n    mix1_init: float = (1 / 2) ** (1 / 2),\n    mix2_init: float = (1 / 16) ** (1 / 2),\n):\n    super().__init__()\n    self.num_heads = num_heads\n    self.num_scores = num_scores\n    mix_W1 = torch.torch.distributions.Uniform(low=-mix1_init, high=mix1_init).sample(\n        (num_heads, self.num_scores + 1, mixer_hidden_dim)\n    )\n    mix_b1 = torch.torch.distributions.Uniform(low=-mix1_init, high=mix1_init).sample(\n        (num_heads, mixer_hidden_dim)\n    )\n    self.mix_W1 = nn.Parameter(mix_W1)\n    self.mix_b1 = nn.Parameter(mix_b1)\n\n    mix_W2 = torch.torch.distributions.Uniform(low=-mix2_init, high=mix2_init).sample(\n        (num_heads, mixer_hidden_dim, 1)\n    )\n    mix_b2 = torch.torch.distributions.Uniform(low=-mix2_init, high=mix2_init).sample(\n        (num_heads, 1)\n    )\n    self.mix_W2 = nn.Parameter(mix_W2)\n    self.mix_b2 = nn.Parameter(mix_b2)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.encoder.MixedScoresSDPA.forward","title":"forward","text":"
forward(q, k, v, attn_mask=None, dmat=None, dropout_p=0.0)\n

Scaled Dot-Product Attention with MatNet Scores Mixer

Source code in rl4co/models/zoo/matnet/encoder.py
def forward(self, q, k, v, attn_mask=None, dmat=None, dropout_p=0.0):\n    \"\"\"Scaled Dot-Product Attention with MatNet Scores Mixer\"\"\"\n    assert dmat is not None\n    b, m, n = dmat.shape[:3]\n    dmat = dmat.reshape(b, m, n, self.num_scores)\n\n    # Calculate scaled dot product\n    attn_scores = torch.matmul(q, k.transpose(-2, -1)) / (k.size(-1) ** 0.5)\n    # [b, h, m, n, num_scores+1]\n    mix_attn_scores = torch.cat(\n        [\n            attn_scores.unsqueeze(-1),\n            dmat[:, None, ...].expand(b, self.num_heads, m, n, self.num_scores),\n        ],\n        dim=-1,\n    )\n    # [b, h, m, n]\n    attn_scores = (\n        (\n            torch.matmul(\n                F.relu(\n                    torch.matmul(mix_attn_scores.transpose(1, 2), self.mix_W1)\n                    + self.mix_b1[None, None, :, None, :]\n                ),\n                self.mix_W2,\n            )\n            + self.mix_b2[None, None, :, None, :]\n        )\n        .transpose(1, 2)\n        .squeeze(-1)\n    )\n\n    # Apply the provided attention mask\n    if attn_mask is not None:\n        if attn_mask.dtype == torch.bool:\n            attn_mask[~attn_mask.any(-1)] = True\n            attn_scores.masked_fill_(~attn_mask, float(\"-inf\"))\n        else:\n            attn_scores += attn_mask\n\n    # Softmax to get attention weights\n    attn_weights = F.softmax(attn_scores, dim=-1)\n\n    # Apply dropout\n    if dropout_p > 0.0:\n        attn_weights = F.dropout(attn_weights, p=dropout_p)\n\n    # Compute the weighted sum of values\n    return torch.matmul(attn_weights, v)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.encoder.MatNetMHA","title":"MatNetMHA","text":"
MatNetMHA(\n    embed_dim: int, num_heads: int, bias: bool = False\n)\n

Bases: Module

Methods:

  • forward \u2013

    Args:

Source code in rl4co/models/zoo/matnet/encoder.py
def __init__(self, embed_dim: int, num_heads: int, bias: bool = False):\n    super().__init__()\n    self.row_encoding_block = MatNetCrossMHA(embed_dim, num_heads, bias)\n    self.col_encoding_block = MatNetCrossMHA(embed_dim, num_heads, bias)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.encoder.MatNetMHA.forward","title":"forward","text":"
forward(row_emb, col_emb, dmat, attn_mask=None)\n

Parameters:

  • row_emb (Tensor) \u2013

    [b, m, d]

  • col_emb (Tensor) \u2013

    [b, n, d]

  • dmat (Tensor) \u2013

    [b, m, n]

Returns:

  • \u2013

    Updated row_emb (Tensor): [b, m, d]

  • \u2013

    Updated col_emb (Tensor): [b, n, d]

Source code in rl4co/models/zoo/matnet/encoder.py
def forward(self, row_emb, col_emb, dmat, attn_mask=None):\n    \"\"\"\n    Args:\n        row_emb (Tensor): [b, m, d]\n        col_emb (Tensor): [b, n, d]\n        dmat (Tensor): [b, m, n]\n\n    Returns:\n        Updated row_emb (Tensor): [b, m, d]\n        Updated col_emb (Tensor): [b, n, d]\n    \"\"\"\n    updated_row_emb = self.row_encoding_block(\n        row_emb, col_emb, dmat=dmat, cross_attn_mask=attn_mask\n    )\n    attn_mask_t = attn_mask.transpose(-2, -1) if attn_mask is not None else None\n    updated_col_emb = self.col_encoding_block(\n        col_emb,\n        row_emb,\n        dmat=dmat.transpose(-2, -1),\n        cross_attn_mask=attn_mask_t,\n    )\n    return updated_row_emb, updated_col_emb\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.encoder.MatNetLayer","title":"MatNetLayer","text":"
MatNetLayer(\n    embed_dim: int,\n    num_heads: int,\n    bias: bool = False,\n    feedforward_hidden: int = 512,\n    normalization: Optional[str] = \"instance\",\n)\n

Bases: Module

Methods:

  • forward \u2013

    Args:

Source code in rl4co/models/zoo/matnet/encoder.py
def __init__(\n    self,\n    embed_dim: int,\n    num_heads: int,\n    bias: bool = False,\n    feedforward_hidden: int = 512,\n    normalization: Optional[str] = \"instance\",\n):\n    super().__init__()\n    self.MHA = MatNetMHA(embed_dim, num_heads, bias)\n    self.F_a = TransformerFFN(embed_dim, feedforward_hidden, normalization)\n    self.F_b = TransformerFFN(embed_dim, feedforward_hidden, normalization)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.encoder.MatNetLayer.forward","title":"forward","text":"
forward(row_emb, col_emb, dmat, attn_mask=None)\n

Parameters:

  • row_emb (Tensor) \u2013

    [b, m, d]

  • col_emb (Tensor) \u2013

    [b, n, d]

  • dmat (Tensor) \u2013

    [b, m, n]

Returns:

  • \u2013

    Updated row_emb (Tensor): [b, m, d]

  • \u2013

    Updated col_emb (Tensor): [b, n, d]

Source code in rl4co/models/zoo/matnet/encoder.py
def forward(self, row_emb, col_emb, dmat, attn_mask=None):\n    \"\"\"\n    Args:\n        row_emb (Tensor): [b, m, d]\n        col_emb (Tensor): [b, n, d]\n        dmat (Tensor): [b, m, n]\n\n    Returns:\n        Updated row_emb (Tensor): [b, m, d]\n        Updated col_emb (Tensor): [b, n, d]\n    \"\"\"\n\n    row_emb_out, col_emb_out = self.MHA(row_emb, col_emb, dmat, attn_mask)\n    row_emb_out = self.F_a(row_emb_out, row_emb)\n    col_emb_out = self.F_b(col_emb_out, col_emb)\n    return row_emb_out, col_emb_out\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.matnet.decoder.MultiStageFFSPDecoder","title":"MultiStageFFSPDecoder","text":"
MultiStageFFSPDecoder(\n    embed_dim: int,\n    num_heads: int,\n    use_graph_context: bool = True,\n    tanh_clipping: float = 10,\n    **kwargs\n)\n

Bases: MatNetFFSPDecoder

Decoder class for solving the FFSP using a separate MatNet decoder for each stage as originally implemented by Kwon et al. (2021)

Source code in rl4co/models/zoo/matnet/decoder.py
def __init__(\n    self,\n    embed_dim: int,\n    num_heads: int,\n    use_graph_context: bool = True,\n    tanh_clipping: float = 10,\n    **kwargs,\n):\n    super().__init__(\n        embed_dim=embed_dim,\n        num_heads=num_heads,\n        use_graph_context=use_graph_context,\n        **kwargs,\n    )\n    self.cached_embs: PrecomputedCache = None\n    self.tanh_clipping = tanh_clipping\n
"},{"location":"docs/content/api/zoo/constructive_ar/#multi-decoder-attention-model-mdam","title":"Multi-Decoder Attention Model (MDAM)","text":"

Classes:

  • MDAM \u2013

    Multi-Decoder Attention Model (MDAM) is a model

Functions:

  • rollout \u2013

    In this case the reward from the model is [batch, num_paths]

Classes:

  • MDAMPolicy \u2013

    Multi-Decoder Attention Model (MDAM) policy.

Classes:

  • MDAMGraphAttentionEncoder \u2013
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.mdam.model.MDAM","title":"MDAM","text":"
MDAM(\n    env: RL4COEnvBase,\n    policy: MDAMPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs\n)\n

Bases: REINFORCE

Multi-Decoder Attention Model (MDAM) is a model to train multiple diverse policies, which effectively increases the chance of finding good solutions compared with existing methods that train only one policy. Reference link: https://arxiv.org/abs/2012.10638; Implementation reference: https://github.com/liangxinedu/MDAM.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (MDAMPolicy, default: None ) \u2013

    Policy to use for the algorithm

  • baseline (Union[REINFORCEBaseline, str], default: 'rollout' ) \u2013

    REINFORCE baseline. Defaults to rollout (1 epoch of exponential, then greedy rollout baseline)

  • policy_kwargs \u2013

    Keyword arguments for policy

  • baseline_kwargs \u2013

    Keyword arguments for baseline

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Methods:

  • calculate_loss \u2013

    Calculate loss for REINFORCE algorithm.

Source code in rl4co/models/zoo/mdam/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: MDAMPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs,\n):\n    if policy is None:\n        policy = MDAMPolicy(env_name=env.name, **policy_kwargs)\n\n    super().__init__(env, policy, baseline, baseline_kwargs, **kwargs)\n\n    # Change rollout of baseline to the rollout function\n    if isinstance(self.baseline, WarmupBaseline):\n        if isinstance(self.baseline.baseline, RolloutBaseline):\n            self.baseline.baseline.rollout = partial(rollout, self.baseline.baseline)\n    elif isinstance(self.baseline, RolloutBaseline):\n        self.baseline.rollout = partial(rollout, self.baseline)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.mdam.model.MDAM.calculate_loss","title":"calculate_loss","text":"
calculate_loss(\n    td, batch, policy_out, reward=None, log_likelihood=None\n)\n

Calculate loss for REINFORCE algorithm. Same as in the REINFORCE class, except that bl_val is simply unsqueezed to match the reward shape (i.e., [batch, num_paths]).

Parameters:

  • td \u2013

    TensorDict containing the current state of the environment

  • batch \u2013

    Batch of data. This is used to get the extra loss terms, e.g., REINFORCE baseline

  • policy_out \u2013

    Output of the policy network

  • reward \u2013

    Reward tensor. If None, it is taken from policy_out

  • log_likelihood \u2013

    Log-likelihood tensor. If None, it is taken from policy_out

Source code in rl4co/models/zoo/mdam/model.py
def calculate_loss(\n    self,\n    td,\n    batch,\n    policy_out,\n    reward=None,\n    log_likelihood=None,\n):\n    \"\"\"Calculate loss for REINFORCE algorithm.\n    Same as in :class:`REINFORCE`, but the bl_val is calculated is simply unsqueezed to match\n    the reward shape (i.e., [batch, num_paths])\n\n    Args:\n        td: TensorDict containing the current state of the environment\n        batch: Batch of data. This is used to get the extra loss terms, e.g., REINFORCE baseline\n        policy_out: Output of the policy network\n        reward: Reward tensor. If None, it is taken from `policy_out`\n        log_likelihood: Log-likelihood tensor. If None, it is taken from `policy_out`\n    \"\"\"\n    # Extra: this is used for additional loss terms, e.g., REINFORCE baseline\n    extra = batch.get(\"extra\", None)\n    reward = reward if reward is not None else policy_out[\"reward\"]\n    log_likelihood = (\n        log_likelihood if log_likelihood is not None else policy_out[\"log_likelihood\"]\n    )\n\n    # REINFORCE baseline\n    bl_val, bl_loss = (\n        self.baseline.eval(td, reward, self.env) if extra is None else (extra, 0)\n    )\n\n    # Main loss function\n    # reward: [batch, num_paths]. Note that the baseline value is the max reward\n    # if bl_val is a tensor, unsqueeze it to match the reward shape\n    if isinstance(bl_val, torch.Tensor):\n        if len(bl_val.shape) > 0:\n            bl_val = bl_val.unsqueeze(1)\n    advantage = reward - bl_val  # advantage = reward - baseline\n    reinforce_loss = -(advantage * log_likelihood).mean()\n    loss = reinforce_loss + bl_loss\n    policy_out.update(\n        {\n            \"loss\": loss,\n            \"reinforce_loss\": reinforce_loss,\n            \"bl_loss\": bl_loss,\n            \"bl_val\": bl_val,\n        }\n    )\n    return policy_out\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.mdam.model.rollout","title":"rollout","text":"
rollout(\n    self,\n    model,\n    env,\n    batch_size=64,\n    device=\"cpu\",\n    dataset=None,\n)\n

In this case the reward from the model is [batch, num_paths] and the baseline takes the maximum reward from the model as the baseline. https://github.com/liangxinedu/MDAM/blob/19b0bf813fb2dbec2fcde9e22eb50e04675400cd/train.py#L38C29-L38C33

Source code in rl4co/models/zoo/mdam/model.py
def rollout(self, model, env, batch_size=64, device=\"cpu\", dataset=None):\n    \"\"\"In this case the reward from the model is [batch, num_paths]\n    and the baseline takes the maximum reward from the model as the baseline.\n    https://github.com/liangxinedu/MDAM/blob/19b0bf813fb2dbec2fcde9e22eb50e04675400cd/train.py#L38C29-L38C33\n    \"\"\"\n    # if dataset is None, use the dataset of the baseline\n    dataset = self.dataset if dataset is None else dataset\n\n    model.eval()\n    model = model.to(device)\n\n    def eval_model(batch):\n        with torch.inference_mode():\n            batch = env.reset(batch.to(device))\n            return model(batch, env, decode_type=\"greedy\")[\"reward\"].max(1).values\n\n    dl = DataLoader(dataset, batch_size=batch_size, collate_fn=dataset.collate_fn)\n\n    rewards = torch.cat([eval_model(batch) for batch in dl], 0)\n    return rewards\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.mdam.policy.MDAMPolicy","title":"MDAMPolicy","text":"
MDAMPolicy(\n    encoder: MDAMGraphAttentionEncoder = None,\n    decoder: MDAMDecoder = None,\n    embed_dim: int = 128,\n    env_name: str = \"tsp\",\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    **decoder_kwargs\n)\n

Bases: AutoregressivePolicy

Multi-Decoder Attention Model (MDAM) policy.

Source code in rl4co/models/zoo/mdam/policy.py
def __init__(\n    self,\n    encoder: MDAMGraphAttentionEncoder = None,\n    decoder: MDAMDecoder = None,\n    embed_dim: int = 128,\n    env_name: str = \"tsp\",\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    **decoder_kwargs,\n):\n    encoder = (\n        MDAMGraphAttentionEncoder(\n            num_heads=num_heads,\n            embed_dim=embed_dim,\n            num_layers=num_encoder_layers,\n            normalization=normalization,\n        )\n        if encoder is None\n        else encoder\n    )\n\n    decoder = (\n        MDAMDecoder(\n            env_name=env_name,\n            embed_dim=embed_dim,\n            num_heads=num_heads,\n            **decoder_kwargs,\n        )\n        if decoder is None\n        else decoder\n    )\n\n    super(MDAMPolicy, self).__init__(\n        env_name=env_name, encoder=encoder, decoder=decoder\n    )\n\n    self.init_embedding = env_init_embedding(env_name, {\"embed_dim\": embed_dim})\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.mdam.encoder.MDAMGraphAttentionEncoder","title":"MDAMGraphAttentionEncoder","text":"
MDAMGraphAttentionEncoder(\n    num_heads,\n    embed_dim,\n    num_layers,\n    node_dim=None,\n    normalization=\"batch\",\n    feedforward_hidden=512,\n    sdpa_fn: Optional[Callable] = None,\n)\n

Bases: Module

Methods:

  • forward \u2013

    Returns:

Source code in rl4co/models/zoo/mdam/encoder.py
def __init__(\n    self,\n    num_heads,\n    embed_dim,\n    num_layers,\n    node_dim=None,\n    normalization=\"batch\",\n    feedforward_hidden=512,\n    sdpa_fn: Optional[Callable] = None,\n):\n    super(MDAMGraphAttentionEncoder, self).__init__()\n\n    # To map input to embedding space\n    self.init_embed = nn.Linear(node_dim, embed_dim) if node_dim is not None else None\n\n    self.layers = nn.Sequential(\n        *(\n            MultiHeadAttentionLayer(\n                embed_dim,\n                num_heads,\n                feedforward_hidden,\n                normalization,\n                sdpa_fn=sdpa_fn,\n            )\n            for _ in range(num_layers - 1)  # because last layer is different\n        )\n    )\n    self.attention_layer = MultiHeadAttentionMDAM(\n        embed_dim, num_heads, sdpa_fn=sdpa_fn, last_one=True\n    )\n    self.BN1 = Normalization(embed_dim, normalization)\n    self.projection = SkipConnection(\n        nn.Sequential(\n            nn.Linear(embed_dim, feedforward_hidden),\n            nn.ReLU(),\n            nn.Linear(feedforward_hidden, embed_dim),\n        )\n        if feedforward_hidden > 0\n        else nn.Linear(embed_dim, embed_dim)\n    )\n    self.BN2 = Normalization(embed_dim, normalization)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.mdam.encoder.MDAMGraphAttentionEncoder.forward","title":"forward","text":"
forward(x, mask=None, return_transform_loss=False)\n

Returns:

  • \u2013
    • h [batch_size, graph_size, embed_dim]
  • \u2013
    • attn [num_head, batch_size, graph_size, graph_size]
  • \u2013
    • V [num_head, batch_size, graph_size, key_dim]
  • \u2013
    • h_old [batch_size, graph_size, embed_dim]
Source code in rl4co/models/zoo/mdam/encoder.py
def forward(self, x, mask=None, return_transform_loss=False):\n    \"\"\"\n    Returns:\n        - h [batch_size, graph_size, embed_dim]\n        - attn [num_head, batch_size, graph_size, graph_size]\n        - V [num_head, batch_size, graph_size, key_dim]\n        - h_old [batch_size, graph_size, embed_dim]\n    \"\"\"\n    assert mask is None, \"TODO mask not yet supported!\"\n\n    h_embeded = x\n    h_old = self.layers(h_embeded)\n    h_new, attn, V = self.attention_layer(h_old)\n    h = h_new + h_old\n    h = self.BN1(h)\n    h = self.projection(h)\n    h = self.BN2(h)\n\n    return (h, h.mean(dim=1), attn, V, h_old)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#pomo","title":"POMO","text":"

Classes:

  • POMO \u2013

    POMO Model for neural combinatorial optimization based on REINFORCE

"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.pomo.model.POMO","title":"POMO","text":"
POMO(\n    env: RL4COEnvBase,\n    policy: Module = None,\n    policy_kwargs={},\n    baseline: str = \"shared\",\n    num_augment: int = 8,\n    augment_fn: Union[str, callable] = \"dihedral8\",\n    first_aug_identity: bool = True,\n    feats: list = None,\n    num_starts: int = None,\n    **kwargs\n)\n

Bases: REINFORCE

POMO Model for neural combinatorial optimization based on REINFORCE. Based on Kwon et al. (2020) http://arxiv.org/abs/2010.16011.

Note

If no policy is passed, we build an Attention Model policy whose default arguments differ from the base class as follows (any policy_kwargs passed override these defaults):

  • num_encoder_layers=6 (instead of 3)
  • normalization=\"instance\" (instead of \"batch\")
  • use_graph_context=False (instead of True). The latter is due to the fact that the paper does not use the graph context in the policy, which seems to be helpful in overfitting to the training graph size.

Parameters:

  • env (RL4COEnvBase) \u2013

    TorchRL Environment

  • policy (Module, default: None ) \u2013

    Policy to use for the algorithm

  • policy_kwargs \u2013

    Keyword arguments for policy

  • baseline (str, default: 'shared' ) \u2013

    Baseline to use for the algorithm. Note that POMO only supports shared baseline, so we will throw an error if anything else is passed.

  • num_augment (int, default: 8 ) \u2013

    Number of augmentations (used only for validation and test)

  • augment_fn (Union[str, callable], default: 'dihedral8' ) \u2013

    Function to use for augmentation, defaulting to dihedral8

  • first_aug_identity (bool, default: True ) \u2013

    Whether to include the identity augmentation in the first position

  • feats (list, default: None ) \u2013

    List of features to augment

  • num_starts (int, default: None ) \u2013

    Number of starts for multi-start. If None, use the number of available actions

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Source code in rl4co/models/zoo/pomo/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module = None,\n    policy_kwargs={},\n    baseline: str = \"shared\",\n    num_augment: int = 8,\n    augment_fn: Union[str, callable] = \"dihedral8\",\n    first_aug_identity: bool = True,\n    feats: list = None,\n    num_starts: int = None,\n    **kwargs,\n):\n    self.save_hyperparameters(logger=False)\n\n    if policy is None:\n        policy_kwargs_with_defaults = {\n            \"num_encoder_layers\": 6,\n            \"normalization\": \"instance\",\n            \"use_graph_context\": False,\n        }\n        policy_kwargs_with_defaults.update(policy_kwargs)\n        policy = AttentionModelPolicy(\n            env_name=env.name, **policy_kwargs_with_defaults\n        )\n\n    assert baseline == \"shared\", \"POMO only supports shared baseline\"\n\n    # Initialize with the shared baseline\n    super(POMO, self).__init__(env, policy, baseline, **kwargs)\n\n    self.num_starts = num_starts\n    self.num_augment = num_augment\n    if self.num_augment > 1:\n        self.augment = StateAugmentation(\n            num_augment=self.num_augment,\n            augment_fn=augment_fn,\n            first_aug_identity=first_aug_identity,\n            feats=feats,\n        )\n    else:\n        self.augment = None\n\n    # Add `_multistart` to decode type for train, val and test in policy\n    for phase in [\"train\", \"val\", \"test\"]:\n        self.set_decode_type_multistart(phase)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#pointer-network-ptrnet","title":"Pointer Network (PtrNet)","text":"

Classes:

  • PointerNetwork \u2013

    Pointer Network for neural combinatorial optimization based on REINFORCE

Classes:

  • Encoder \u2013

    Maps a graph represented as an input sequence

Classes:

  • SimpleAttention \u2013

    A generic attention module for a decoder in seq2seq

  • Decoder \u2013

Classes:

  • CriticNetworkLSTM \u2013

    Useful as a baseline in REINFORCE updates

"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.model.PointerNetwork","title":"PointerNetwork","text":"
PointerNetwork(\n    env: RL4COEnvBase,\n    policy: PointerNetworkPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs\n)\n

Bases: REINFORCE

Pointer Network for neural combinatorial optimization based on REINFORCE. Based on Vinyals et al. (2015) https://arxiv.org/abs/1506.03134; refactored from reference implementation: https://github.com/wouterkool/attention-learn-to-route

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (PointerNetworkPolicy, default: None ) \u2013

    Policy to use for the algorithm

  • baseline (Union[REINFORCEBaseline, str], default: 'rollout' ) \u2013

    REINFORCE baseline. Defaults to rollout (1 epoch of exponential, then greedy rollout baseline)

  • policy_kwargs \u2013

    Keyword arguments for policy

  • baseline_kwargs \u2013

    Keyword arguments for baseline

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Source code in rl4co/models/zoo/ptrnet/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: PointerNetworkPolicy = None,\n    baseline: Union[REINFORCEBaseline, str] = \"rollout\",\n    policy_kwargs={},\n    baseline_kwargs={},\n    **kwargs,\n):\n    policy = (\n        PointerNetworkPolicy(env=env, **policy_kwargs) if policy is None else policy\n    )\n    super().__init__(env, policy, baseline, baseline_kwargs, **kwargs)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.encoder.Encoder","title":"Encoder","text":"
Encoder(input_dim, hidden_dim)\n

Bases: Module

Maps a graph represented as an input sequence to a hidden vector

Methods:

  • init_hidden \u2013

    Trainable initial hidden state

Source code in rl4co/models/zoo/ptrnet/encoder.py
def __init__(self, input_dim, hidden_dim):\n    super(Encoder, self).__init__()\n    self.hidden_dim = hidden_dim\n    self.lstm = nn.LSTM(input_dim, hidden_dim)\n    self.init_hx, self.init_cx = self.init_hidden(hidden_dim)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.encoder.Encoder.init_hidden","title":"init_hidden","text":"
init_hidden(hidden_dim)\n

Trainable initial hidden state

Source code in rl4co/models/zoo/ptrnet/encoder.py
def init_hidden(self, hidden_dim):\n    \"\"\"Trainable initial hidden state\"\"\"\n    std = 1.0 / math.sqrt(hidden_dim)\n    enc_init_hx = nn.Parameter(torch.FloatTensor(hidden_dim))\n    enc_init_hx.data.uniform_(-std, std)\n\n    enc_init_cx = nn.Parameter(torch.FloatTensor(hidden_dim))\n    enc_init_cx.data.uniform_(-std, std)\n    return enc_init_hx, enc_init_cx\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.decoder.SimpleAttention","title":"SimpleAttention","text":"
SimpleAttention(dim, use_tanh=False, C=10)\n

Bases: Module

A generic attention module for a decoder in seq2seq

Methods:

  • forward \u2013

    Args:

Source code in rl4co/models/zoo/ptrnet/decoder.py
def __init__(self, dim, use_tanh=False, C=10):\n    super(SimpleAttention, self).__init__()\n    self.use_tanh = use_tanh\n    self.project_query = nn.Linear(dim, dim)\n    self.project_ref = nn.Conv1d(dim, dim, 1, 1)\n    self.C = C  # tanh exploration\n\n    self.v = nn.Parameter(torch.FloatTensor(dim))\n    self.v.data.uniform_(-(1.0 / math.sqrt(dim)), 1.0 / math.sqrt(dim))\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.decoder.SimpleAttention.forward","title":"forward","text":"
forward(query, ref)\n

Parameters:

  • query \u2013

    is the hidden state of the decoder at the current time step. batch x dim

  • ref \u2013

    the set of hidden states from the encoder. sourceL x batch x hidden_dim

Source code in rl4co/models/zoo/ptrnet/decoder.py
def forward(self, query, ref):\n    \"\"\"\n    Args:\n        query: is the hidden state of the decoder at the current\n            time step. batch x dim\n        ref: the set of hidden states from the encoder.\n            sourceL x batch x hidden_dim\n    \"\"\"\n    # ref is now [batch_size x hidden_dim x sourceL]\n    ref = ref.permute(1, 2, 0)\n    q = self.project_query(query).unsqueeze(2)  # batch x dim x 1\n    e = self.project_ref(ref)  # batch_size x hidden_dim x sourceL\n    # expand the query by sourceL\n    # batch x dim x sourceL\n    expanded_q = q.repeat(1, 1, e.size(2))\n    # batch x 1 x hidden_dim\n    v_view = self.v.unsqueeze(0).expand(expanded_q.size(0), len(self.v)).unsqueeze(1)\n    # [batch_size x 1 x hidden_dim] * [batch_size x hidden_dim x sourceL]\n    u = torch.bmm(v_view, F.tanh(expanded_q + e)).squeeze(1)\n    if self.use_tanh:\n        logits = self.C * F.tanh(u)\n    else:\n        logits = u\n    return e, logits\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.decoder.Decoder","title":"Decoder","text":"
Decoder(\n    embed_dim: int = 128,\n    hidden_dim: int = 128,\n    tanh_exploration: float = 10.0,\n    use_tanh: bool = True,\n    num_glimpses=1,\n    mask_glimpses=True,\n    mask_logits=True,\n)\n

Bases: Module

Methods:

  • forward \u2013

    Args:

Source code in rl4co/models/zoo/ptrnet/decoder.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    hidden_dim: int = 128,\n    tanh_exploration: float = 10.0,\n    use_tanh: bool = True,\n    num_glimpses=1,\n    mask_glimpses=True,\n    mask_logits=True,\n):\n    super(Decoder, self).__init__()\n\n    self.embed_dim = embed_dim\n    self.hidden_dim = hidden_dim\n    self.num_glimpses = num_glimpses\n    self.mask_glimpses = mask_glimpses\n    self.mask_logits = mask_logits\n    self.use_tanh = use_tanh\n    self.tanh_exploration = tanh_exploration\n\n    self.lstm = nn.LSTMCell(embed_dim, hidden_dim)\n    self.pointer = SimpleAttention(hidden_dim, use_tanh=use_tanh, C=tanh_exploration)\n    self.glimpse = SimpleAttention(hidden_dim, use_tanh=False)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.decoder.Decoder.forward","title":"forward","text":"
forward(\n    decoder_input,\n    embedded_inputs,\n    hidden,\n    context,\n    decode_type=\"sampling\",\n    eval_tours=None,\n)\n

Parameters:

  • decoder_input \u2013

    The initial input to the decoder; size is [batch_size x embed_dim]. Trainable parameter.

  • embedded_inputs \u2013

    [sourceL x batch_size x embed_dim]

  • hidden \u2013

    the prev hidden state, size is [batch_size x hidden_dim]. Initially this is set to (enc_h[-1], enc_c[-1])

  • context \u2013

    encoder outputs, [sourceL x batch_size x hidden_dim]

Source code in rl4co/models/zoo/ptrnet/decoder.py
def forward(\n    self,\n    decoder_input,\n    embedded_inputs,\n    hidden,\n    context,\n    decode_type=\"sampling\",\n    eval_tours=None,\n):\n    \"\"\"\n    Args:\n        decoder_input: The initial input to the decoder\n            size is [batch_size x embed_dim]. Trainable parameter.\n        embedded_inputs: [sourceL x batch_size x embed_dim]\n        hidden: the prev hidden state, size is [batch_size x hidden_dim].\n            Initially this is set to (enc_h[-1], enc_c[-1])\n        context: encoder outputs, [sourceL x batch_size x hidden_dim]\n    \"\"\"\n\n    batch_size = context.size(1)\n    outputs = []\n    selections = []\n    steps = range(embedded_inputs.size(0))\n    idxs = None\n    mask = torch.ones(\n        embedded_inputs.size(1),\n        embedded_inputs.size(0),\n        dtype=torch.bool,\n        device=embedded_inputs.device,\n    )\n\n    for i in steps:\n        hidden, log_p, mask = self.recurrence(\n            decoder_input, hidden, mask, idxs, i, context\n        )\n        # select the next inputs for the decoder [batch_size x hidden_dim]\n        idxs = (\n            decode_logprobs(log_p, mask, decode_type=decode_type)\n            if eval_tours is None\n            else eval_tours[:, i]\n        )\n        # select logp of chosen action\n        log_p = gather_by_index(log_p, idxs, dim=1)\n\n        idxs = (\n            idxs.detach()\n        )  # Otherwise pytorch complains it want's a reward, todo implement this more properly?\n        # Gather input embedding of selected\n        decoder_input = torch.gather(\n            embedded_inputs,\n            0,\n            idxs.contiguous()\n            .view(1, batch_size, 1)\n            .expand(1, batch_size, *embedded_inputs.size()[2:]),\n        ).squeeze(0)\n\n        # use outs to point to next object\n        outputs.append(log_p)\n        selections.append(idxs)\n    return (torch.stack(outputs, 1), torch.stack(selections, 1)), hidden\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.critic.CriticNetworkLSTM","title":"CriticNetworkLSTM","text":"
CriticNetworkLSTM(\n    embed_dim,\n    hidden_dim,\n    n_process_block_iters,\n    tanh_exploration,\n    use_tanh,\n)\n

Bases: Module

Useful as a baseline in REINFORCE updates

Methods:

  • forward \u2013

    Args:

Source code in rl4co/models/zoo/ptrnet/critic.py
def __init__(\n    self,\n    embed_dim,\n    hidden_dim,\n    n_process_block_iters,\n    tanh_exploration,\n    use_tanh,\n):\n    super(CriticNetworkLSTM, self).__init__()\n\n    self.hidden_dim = hidden_dim\n    self.n_process_block_iters = n_process_block_iters\n\n    self.encoder = Encoder(embed_dim, hidden_dim)\n\n    self.process_block = SimpleAttention(\n        hidden_dim, use_tanh=use_tanh, C=tanh_exploration\n    )\n    self.sm = nn.Softmax(dim=1)\n    self.decoder = nn.Sequential(\n        nn.Linear(hidden_dim, hidden_dim), nn.ReLU(), nn.Linear(hidden_dim, 1)\n    )\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.ptrnet.critic.CriticNetworkLSTM.forward","title":"forward","text":"
forward(inputs)\n

Parameters:

  • inputs \u2013

    [embed_dim x batch_size x sourceL] of embedded inputs

Source code in rl4co/models/zoo/ptrnet/critic.py
def forward(self, inputs):\n    \"\"\"\n    Args:\n        inputs: [embed_dim x batch_size x sourceL] of embedded inputs\n    \"\"\"\n    inputs = inputs.transpose(0, 1).contiguous()\n\n    encoder_hx = (\n        self.encoder.init_hx.unsqueeze(0).repeat(inputs.size(1), 1).unsqueeze(0)\n    )\n    encoder_cx = (\n        self.encoder.init_cx.unsqueeze(0).repeat(inputs.size(1), 1).unsqueeze(0)\n    )\n\n    # encoder forward pass\n    enc_outputs, (enc_h_t, enc_c_t) = self.encoder(inputs, (encoder_hx, encoder_cx))\n\n    # grab the hidden state and process it via the process block\n    process_block_state = enc_h_t[-1]\n    for i in range(self.n_process_block_iters):\n        ref, logits = self.process_block(process_block_state, enc_outputs)\n        process_block_state = torch.bmm(ref, self.sm(logits).unsqueeze(2)).squeeze(2)\n    # produce the final scalar output\n    out = self.decoder(process_block_state)\n    return out\n
"},{"location":"docs/content/api/zoo/constructive_ar/#symnco","title":"SymNCO","text":"

Classes:

  • SymNCO \u2013

    SymNCO Model based on REINFORCE with shared baselines.

Classes:

  • SymNCOPolicy \u2013

    SymNCO Policy based on AutoregressivePolicy.

Functions:

  • problem_symmetricity_loss \u2013

    REINFORCE loss for problem symmetricity

  • solution_symmetricity_loss \u2013

    REINFORCE loss for solution symmetricity

  • invariance_loss \u2013

    Loss for invariant representation on projected nodes

"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.symnco.model.SymNCO","title":"SymNCO","text":"
SymNCO(\n    env: RL4COEnvBase,\n    policy: Union[Module, SymNCOPolicy] = None,\n    policy_kwargs: dict = {},\n    baseline: str = \"symnco\",\n    num_augment: int = 4,\n    augment_fn: Union[str, callable] = \"symmetric\",\n    feats: list = None,\n    alpha: float = 0.2,\n    beta: float = 1,\n    num_starts: int = 0,\n    **kwargs\n)\n

Bases: REINFORCE

SymNCO Model based on REINFORCE with shared baselines. Based on Kim et al. (2022) https://arxiv.org/abs/2205.13209.

Parameters:

  • env (RL4COEnvBase) \u2013

    TorchRL environment to use for the algorithm

  • policy (Union[Module, SymNCOPolicy], default: None ) \u2013

    Policy to use for the algorithm

  • policy_kwargs (dict, default: {} ) \u2013

    Keyword arguments for policy

  • num_augment (int, default: 4 ) \u2013

    Number of augmentations

  • augment_fn (Union[str, callable], default: 'symmetric' ) \u2013

    Function to use for augmentation, defaulting to symmetric

  • feats (list, default: None ) \u2013

    List of features to augment

  • alpha (float, default: 0.2 ) \u2013

    weight for invariance loss

  • beta (float, default: 1 ) \u2013

    weight for solution symmetricity loss

  • num_starts (int, default: 0 ) \u2013

    Number of starts for multi-start. If None, use the number of available actions

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Source code in rl4co/models/zoo/symnco/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: Union[nn.Module, SymNCOPolicy] = None,\n    policy_kwargs: dict = {},\n    baseline: str = \"symnco\",\n    num_augment: int = 4,\n    augment_fn: Union[str, callable] = \"symmetric\",\n    feats: list = None,\n    alpha: float = 0.2,\n    beta: float = 1,\n    num_starts: int = 0,\n    **kwargs,\n):\n    self.save_hyperparameters(logger=False)\n\n    if policy is None:\n        policy = SymNCOPolicy(env_name=env.name, **policy_kwargs)\n\n    assert baseline == \"symnco\", \"SymNCO only supports custom-symnco baseline\"\n    baseline = \"no\"  # Pass no baseline to superclass since there are multiple custom baselines\n\n    # Pass no baseline to superclass since there are multiple custom baselines\n    super().__init__(env, policy, baseline, **kwargs)\n\n    self.num_starts = num_starts\n    self.num_augment = num_augment\n    self.augment = StateAugmentation(\n        num_augment=self.num_augment, augment_fn=augment_fn, feats=feats\n    )\n    self.alpha = alpha  # weight for invariance loss\n    self.beta = beta  # weight for solution symmetricity loss\n\n    # Add `_multistart` to decode type for train, val and test in policy if num_starts > 1\n    if self.num_starts > 1:\n        for phase in [\"train\", \"val\", \"test\"]:\n            self.set_decode_type_multistart(phase)\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.symnco.policy.SymNCOPolicy","title":"SymNCOPolicy","text":"
SymNCOPolicy(\n    embed_dim: int = 128,\n    env_name: str = \"tsp\",\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    projection_head: Module = None,\n    use_projection_head: bool = True,\n    **kwargs\n)\n

Bases: AttentionModelPolicy

SymNCO Policy based on AutoregressivePolicy. This differs from the default AutoregressivePolicy in that it projects the initial embeddings to a lower dimension using a projection head and returns it. This is used in the SymNCO algorithm to compute the invariance loss. Based on Kim et al. (2022) https://arxiv.org/abs/2205.13209.

Parameters:

  • embed_dim (int, default: 128 ) \u2013

    Dimension of the embedding

  • env_name (str, default: 'tsp' ) \u2013

    Name of the environment

  • num_encoder_layers (int, default: 3 ) \u2013

    Number of layers in the encoder

  • num_heads (int, default: 8 ) \u2013

    Number of heads in the encoder

  • normalization (str, default: 'batch' ) \u2013

    Normalization to use in the encoder

  • projection_head (Module, default: None ) \u2013

    Projection head to use

  • use_projection_head (bool, default: True ) \u2013

    Whether to use projection head

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Source code in rl4co/models/zoo/symnco/policy.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    env_name: str = \"tsp\",\n    num_encoder_layers: int = 3,\n    num_heads: int = 8,\n    normalization: str = \"batch\",\n    projection_head: nn.Module = None,\n    use_projection_head: bool = True,\n    **kwargs,\n):\n    super(SymNCOPolicy, self).__init__(\n        env_name=env_name,\n        embed_dim=embed_dim,\n        num_encoder_layers=num_encoder_layers,\n        num_heads=num_heads,\n        normalization=normalization,\n        **kwargs,\n    )\n\n    self.use_projection_head = use_projection_head\n\n    if self.use_projection_head:\n        self.projection_head = (\n            MLP(embed_dim, embed_dim, 1, embed_dim, nn.ReLU)\n            if projection_head is None\n            else projection_head\n        )\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.symnco.losses.problem_symmetricity_loss","title":"problem_symmetricity_loss","text":"
problem_symmetricity_loss(reward, log_likelihood, dim=1)\n

REINFORCE loss for problem symmetricity. Baseline is the average reward for all augmented problems. Corresponds to L_ps in the SymNCO paper.

Source code in rl4co/models/zoo/symnco/losses.py
def problem_symmetricity_loss(reward, log_likelihood, dim=1):\n    \"\"\"REINFORCE loss for problem symmetricity\n    Baseline is the average reward for all augmented problems\n    Corresponds to `L_ps` in the SymNCO paper\n    \"\"\"\n    num_augment = reward.shape[dim]\n    if num_augment < 2:\n        return 0\n    advantage = reward - reward.mean(dim=dim, keepdim=True)\n    loss = -advantage * log_likelihood\n    return loss.mean()\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.symnco.losses.solution_symmetricity_loss","title":"solution_symmetricity_loss","text":"
solution_symmetricity_loss(reward, log_likelihood, dim=-1)\n

REINFORCE loss for solution symmetricity. Baseline is the average reward for all start nodes. Corresponds to L_ss in the SymNCO paper.

Source code in rl4co/models/zoo/symnco/losses.py
def solution_symmetricity_loss(reward, log_likelihood, dim=-1):\n    \"\"\"REINFORCE loss for solution symmetricity\n    Baseline is the average reward for all start nodes\n    Corresponds to `L_ss` in the SymNCO paper\n    \"\"\"\n    num_starts = reward.shape[dim]\n    if num_starts < 2:\n        return 0\n    advantage = reward - reward.mean(dim=dim, keepdim=True)\n    loss = -advantage * log_likelihood\n    return loss.mean()\n
"},{"location":"docs/content/api/zoo/constructive_ar/#models.zoo.symnco.losses.invariance_loss","title":"invariance_loss","text":"
invariance_loss(proj_embed, num_augment)\n

Loss for invariant representation on projected nodes. Corresponds to L_inv in the SymNCO paper.

Source code in rl4co/models/zoo/symnco/losses.py
def invariance_loss(proj_embed, num_augment):\n    \"\"\"Loss for invariant representation on projected nodes\n    Corresponds to `L_inv` in the SymNCO paper\n    \"\"\"\n    pe = rearrange(proj_embed, \"(b a) ... -> b a ...\", a=num_augment)\n    similarity = sum(\n        [cosine_similarity(pe[:, 0], pe[:, i], dim=-1) for i in range(1, num_augment)]\n    )\n    return similarity.mean()\n
"},{"location":"docs/content/api/zoo/constructive_nar/","title":"Constructive NonAutoregressive","text":""},{"location":"docs/content/api/zoo/constructive_nar/#deepaco","title":"DeepACO","text":"

Classes:

  • AntSystem \u2013

    Implements the Ant System algorithm: https://doi.org/10.1109/3477.484436.

Classes:

  • DeepACO \u2013

    Implements DeepACO: https://arxiv.org/abs/2309.14032.

Classes:

  • DeepACOPolicy \u2013

    Implements DeepACO policy based on :class:NonAutoregressivePolicy. Introduced by Ye et al. (2023): https://arxiv.org/abs/2309.14032.

"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.deepaco.antsystem.AntSystem","title":"AntSystem","text":"
AntSystem(\n    log_heuristic: Tensor,\n    n_ants: int = 20,\n    alpha: float = 1.0,\n    beta: float = 1.0,\n    decay: float = 0.95,\n    Q: Optional[float] = None,\n    temperature: float = 0.1,\n    pheromone: Optional[Tensor] = None,\n    require_logprobs: bool = False,\n    use_local_search: bool = False,\n    use_nls: bool = False,\n    n_perturbations: int = 5,\n    local_search_params: dict = {},\n    perturbation_params: dict = {},\n    start_node: Optional[int] = None,\n)\n

Implements the Ant System algorithm: https://doi.org/10.1109/3477.484436.

Parameters:

  • log_heuristic (Tensor) \u2013

    Logarithm of the heuristic matrix.

  • n_ants (int, default: 20 ) \u2013

    Number of ants to be used in the algorithm. Defaults to 20.

  • alpha (float, default: 1.0 ) \u2013

    Importance of pheromone in the decision-making process. Defaults to 1.0.

  • beta (float, default: 1.0 ) \u2013

    Importance of heuristic information in the decision-making process. Defaults to 1.0.

  • decay (float, default: 0.95 ) \u2013

    Rate at which pheromone evaporates. Should be between 0 and 1. Defaults to 0.95.

  • Q (Optional[float], default: None ) \u2013

    Rate at which pheromone deposits. Defaults to 1 / n_ants.

  • temperature (float, default: 0.1 ) \u2013

    Temperature for the softmax during decoding. Defaults to 0.1.

  • pheromone (Optional[Tensor], default: None ) \u2013

    Initial pheromone matrix. Defaults to a tensor with the same shape as log_heuristic, filled with 0.0005.

  • require_logprobs (bool, default: False ) \u2013

    Whether to require the log probability of actions. Defaults to False.

  • use_local_search (bool, default: False ) \u2013

    Whether to use local_search provided by the env. Defaults to False.

  • use_nls (bool, default: False ) \u2013

    Whether to use neural-guided local search provided by the env. Defaults to False.

  • n_perturbations (int, default: 5 ) \u2013

    Number of perturbations to be used for nls. Defaults to 5.

  • local_search_params (dict, default: {} ) \u2013

    Arguments to be passed to the local_search.

  • perturbation_params (dict, default: {} ) \u2013

    Arguments to be passed to the perturbation used for nls.

Methods:

  • run \u2013

    Run the Ant System algorithm for a specified number of iterations.

  • local_search \u2013

    Perform local search on the actions and reward obtained.

  • get_logp \u2013

    Get the log probability (logprobs) values recorded during the execution of the algorithm.

Source code in rl4co/models/zoo/deepaco/antsystem.py
def __init__(\n    self,\n    log_heuristic: Tensor,\n    n_ants: int = 20,\n    alpha: float = 1.0,\n    beta: float = 1.0,\n    decay: float = 0.95,\n    Q: Optional[float] = None,\n    temperature: float = 0.1,\n    pheromone: Optional[Tensor] = None,\n    require_logprobs: bool = False,\n    use_local_search: bool = False,\n    use_nls: bool = False,\n    n_perturbations: int = 5,\n    local_search_params: dict = {},\n    perturbation_params: dict = {},\n    start_node: Optional[int] = None,\n):\n    self.batch_size = log_heuristic.shape[0]\n    self.n_ants = n_ants\n    self.alpha = alpha\n    self.beta = beta\n    self.decay = decay\n    self.Q = 1 / self.n_ants if Q is None else Q\n    self.temperature = temperature\n\n    self.log_heuristic = log_heuristic / self.temperature\n\n    if pheromone is None:\n        self.pheromone = torch.ones_like(log_heuristic)\n        self.pheromone.fill_(0.0005)\n    else:\n        self.pheromone = pheromone\n\n    self.final_actions = self.final_reward = None\n    self.require_logprobs = require_logprobs\n    self.all_records = []\n\n    self.use_local_search = use_local_search\n    assert not (use_nls and not use_local_search), \"use_nls requires use_local_search\"\n    self.use_nls = use_nls\n    self.n_perturbations = n_perturbations\n    self.local_search_params = local_search_params\n    self.perturbation_params = perturbation_params\n    self.start_node = start_node\n\n    self._batchindex = torch.arange(self.batch_size, device=log_heuristic.device)\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.deepaco.antsystem.AntSystem.run","title":"run","text":"
run(\n    td_initial: TensorDict,\n    env: RL4COEnvBase,\n    n_iterations: int,\n) -> Tuple[TensorDict, Tensor, Tensor]\n

Run the Ant System algorithm for a specified number of iterations.

Parameters:

  • td_initial (TensorDict) \u2013

    Initial state of the problem.

  • env (RL4COEnvBase) \u2013

    Environment representing the problem.

  • n_iterations (int) \u2013

    Number of iterations to run the algorithm.

Returns:

  • td ( TensorDict ) \u2013

    The final state of the problem.

  • actions ( Tensor ) \u2013

    The final actions chosen by the algorithm.

  • reward ( Tensor ) \u2013

    The final reward achieved by the algorithm.

Source code in rl4co/models/zoo/deepaco/antsystem.py
def run(\n    self,\n    td_initial: TensorDict,\n    env: RL4COEnvBase,\n    n_iterations: int,\n) -> Tuple[TensorDict, Tensor, Tensor]:\n    \"\"\"Run the Ant System algorithm for a specified number of iterations.\n\n    Args:\n        td_initial: Initial state of the problem.\n        env: Environment representing the problem.\n        n_iterations: Number of iterations to run the algorithm.\n\n    Returns:\n        td: The final state of the problem.\n        actions: The final actions chosen by the algorithm.\n        reward: The final reward achieved by the algorithm.\n    \"\"\"\n    for _ in range(n_iterations):\n        # reset environment\n        td = td_initial.clone()\n        self._one_step(td, env)\n\n    action_matrix = self._convert_final_action_to_matrix()\n    assert action_matrix is not None and self.final_reward is not None\n    td, env = self._recreate_final_routes(td_initial, env, action_matrix)\n\n    return td, action_matrix, self.final_reward\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.deepaco.antsystem.AntSystem.local_search","title":"local_search","text":"
local_search(\n    td: TensorDict, env: RL4COEnvBase, actions: Tensor\n) -> Tuple[Tensor, Tensor]\n

Perform local search on the actions and reward obtained.

Parameters:

  • td (TensorDict) \u2013

    Current state of the problem.

  • env (RL4COEnvBase) \u2013

    Environment representing the problem.

  • actions (Tensor) \u2013

    Actions chosen by the algorithm.

Returns:

  • actions ( Tensor ) \u2013

    The modified actions

  • reward ( Tensor ) \u2013

    The modified reward

Source code in rl4co/models/zoo/deepaco/antsystem.py
def local_search(\n    self, td: TensorDict, env: RL4COEnvBase, actions: Tensor\n) -> Tuple[Tensor, Tensor]:\n    \"\"\"Perform local search on the actions and reward obtained.\n\n    Args:\n        td: Current state of the problem.\n        env: Environment representing the problem.\n        actions: Actions chosen by the algorithm.\n\n    Returns:\n        actions: The modified actions\n        reward: The modified reward\n    \"\"\"\n    td_cpu = td.detach().cpu()  # Convert to CPU in advance to minimize the overhead from device transfer\n    td_cpu[\"distances\"] = get_distance_matrix(td_cpu[\"locs\"])\n    # TODO: avoid or generalize this, e.g., pre-compute for local search in each env\n    actions = actions.detach().cpu()\n    best_actions = env.local_search(td=td_cpu, actions=actions, **self.local_search_params)\n    best_rewards = env.get_reward(td_cpu, best_actions)\n\n    if self.use_nls:\n        td_cpu_perturb = td_cpu.clone()\n        td_cpu_perturb[\"distances\"] = torch.tile(self.heuristic_dist, (self.n_ants, 1, 1))\n        new_actions = best_actions.clone()\n\n        for _ in range(self.n_perturbations):\n            perturbed_actions = env.local_search(\n                td=td_cpu_perturb, actions=new_actions, **self.perturbation_params\n            )\n            new_actions = env.local_search(td=td_cpu, actions=perturbed_actions, **self.local_search_params)\n            new_rewards = env.get_reward(td_cpu, new_actions)\n\n            improved_indices = new_rewards > best_rewards\n            best_actions = env.replace_selected_actions(best_actions, new_actions, improved_indices)\n            best_rewards[improved_indices] = new_rewards[improved_indices]\n\n    best_actions = best_actions.to(td.device)\n    best_rewards = best_rewards.to(td.device)\n\n    return best_actions, best_rewards\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.deepaco.antsystem.AntSystem.get_logp","title":"get_logp","text":"
get_logp()\n

Get the log probability (logprobs) values recorded during the execution of the algorithm.

Returns:

  • results \u2013

    Tuple containing the log probability values, actions chosen, rewards obtained, and mask values (if available).

Raises:

  • AssertionError \u2013

    If require_logprobs is not enabled.

Source code in rl4co/models/zoo/deepaco/antsystem.py
def get_logp(self):\n    \"\"\"Get the log probability (logprobs) values recorded during the execution of the algorithm.\n\n    Returns:\n        results: Tuple containing the log probability values,\n            actions chosen, rewards obtained, and mask values (if available).\n\n    Raises:\n        AssertionError: If `require_logp` is not enabled.\n    \"\"\"\n\n    assert (\n        self.require_logprobs\n    ), \"Please enable `require_logp` to record logprobs values\"\n\n    logprobs_list, actions_list, reward_list, mask_list = [], [], [], []\n\n    for logprobs, actions, reward, mask in self.all_records:\n        logprobs_list.append(logprobs)\n        actions_list.append(actions)\n        reward_list.append(reward)\n        mask_list.append(mask)\n\n    if mask_list[0] is None:\n        mask_list = None\n    else:\n        mask_list = torch.stack(mask_list, 0)\n\n    # reset records\n    self.all_records = []\n\n    return (\n        torch.stack(logprobs_list, 0),\n        torch.stack(actions_list, 0),\n        torch.stack(reward_list, 0),\n        mask_list,\n    )\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.deepaco.model.DeepACO","title":"DeepACO","text":"
DeepACO(\n    env: RL4COEnvBase,\n    policy: Optional[DeepACOPolicy] = None,\n    baseline: Union[REINFORCEBaseline, str] = \"no\",\n    policy_kwargs: dict = {},\n    baseline_kwargs: dict = {},\n    **kwargs\n)\n

Bases: REINFORCE

Implements DeepACO: https://arxiv.org/abs/2309.14032.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (Optional[DeepACOPolicy], default: None ) \u2013

    Policy to use for the algorithm

  • baseline (Union[REINFORCEBaseline, str], default: 'no' ) \u2013

    REINFORCE baseline. Defaults to 'no' (no baseline).

  • policy_kwargs (dict, default: {} ) \u2013

    Keyword arguments for policy

  • baseline_kwargs (dict, default: {} ) \u2013

    Keyword arguments for baseline

  • **kwargs \u2013

    Keyword arguments passed to the superclass

Source code in rl4co/models/zoo/deepaco/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: Optional[DeepACOPolicy] = None,\n    baseline: Union[REINFORCEBaseline, str] = \"no\",\n    policy_kwargs: dict = {},\n    baseline_kwargs: dict = {},\n    **kwargs,\n):\n    if policy is None:\n        policy = DeepACOPolicy(env_name=env.name, **policy_kwargs)\n\n    super().__init__(env, policy, baseline, baseline_kwargs, **kwargs)\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.deepaco.policy.DeepACOPolicy","title":"DeepACOPolicy","text":"
DeepACOPolicy(\n    encoder: Optional[NonAutoregressiveEncoder] = None,\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    aco_class: Optional[Type[AntSystem]] = None,\n    aco_kwargs: dict = {},\n    train_with_local_search: bool = True,\n    n_ants: Optional[Union[int, dict]] = None,\n    n_iterations: Optional[Union[int, dict]] = None,\n    ls_reward_aug_W: float = 0.95,\n    **encoder_kwargs\n)\n

Bases: NonAutoregressivePolicy

Implements DeepACO policy based on :class:NonAutoregressivePolicy. Introduced by Ye et al. (2023): https://arxiv.org/abs/2309.14032. This policy uses a Non-Autoregressive Graph Neural Network to generate heatmaps, which are then used to run Ant Colony Optimization (ACO) to construct solutions.

Parameters:

  • encoder (Optional[NonAutoregressiveEncoder], default: None ) \u2013

    Encoder module. Can be passed by sub-classes

  • env_name (str, default: 'tsp' ) \u2013

    Name of the environment used to initialize embeddings

  • temperature (float, default: 1.0 ) \u2013

    Temperature for the softmax during decoding. Defaults to 1.0.

  • aco_class (Optional[Type[AntSystem]], default: None ) \u2013

    Class representing the ACO algorithm to be used. Defaults to :class:AntSystem.

  • aco_kwargs (dict, default: {} ) \u2013

    Additional arguments to be passed to the ACO algorithm.

  • n_ants (Optional[Union[int, dict]], default: None ) \u2013

    Number of ants to be used in the ACO algorithm. Can be an integer or dictionary. Defaults to dict(train=30, val=48, test=48).

  • n_iterations (Optional[Union[int, dict]], default: None ) \u2013

    Number of iterations to run the ACO algorithm. Can be an integer or dictionary. Defaults to dict(train=1, val=5, test=10).

  • ls_reward_aug_W (float, default: 0.95 ) \u2013

    Coefficient to be used for the reward augmentation with the local search. Defaults to 0.95.

  • encoder_kwargs \u2013

    Additional arguments to be passed to the encoder.

Methods:

  • forward \u2013

    Forward method. During validation and testing, the policy runs the ACO algorithm to construct solutions.

Source code in rl4co/models/zoo/deepaco/policy.py
def __init__(\n    self,\n    encoder: Optional[NonAutoregressiveEncoder] = None,\n    env_name: str = \"tsp\",\n    temperature: float = 1.0,\n    aco_class: Optional[Type[AntSystem]] = None,\n    aco_kwargs: dict = {},\n    train_with_local_search: bool = True,\n    n_ants: Optional[Union[int, dict]] = None,\n    n_iterations: Optional[Union[int, dict]] = None,\n    ls_reward_aug_W: float = 0.95,\n    **encoder_kwargs,\n):\n    if encoder is None:\n        encoder = NARGNNEncoder(**encoder_kwargs)\n\n    super(DeepACOPolicy, self).__init__(\n        encoder=encoder,\n        env_name=env_name,\n        temperature=temperature,\n        train_decode_type=\"multistart_sampling\",\n        val_decode_type=\"multistart_sampling\",\n        test_decode_type=\"multistart_sampling\",\n    )\n\n    self.aco_class = AntSystem if aco_class is None else aco_class\n    self.aco_kwargs = aco_kwargs\n    self.train_with_local_search = train_with_local_search\n    self.n_ants = merge_with_defaults(n_ants, train=30, val=48, test=48)\n    self.n_iterations = merge_with_defaults(n_iterations, train=1, val=5, test=10)\n    self.ls_reward_aug_W = ls_reward_aug_W\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.deepaco.policy.DeepACOPolicy.forward","title":"forward","text":"
forward(\n    td_initial: TensorDict,\n    env: Optional[Union[str, RL4COEnvBase]] = None,\n    calc_reward: bool = True,\n    phase: str = \"train\",\n    actions=None,\n    return_actions: bool = True,\n    return_hidden: bool = True,\n    **kwargs\n)\n

Forward method. During validation and testing, the policy runs the ACO algorithm to construct solutions. See :class:NonAutoregressivePolicy for more details during the training phase.

Source code in rl4co/models/zoo/deepaco/policy.py
def forward(\n    self,\n    td_initial: TensorDict,\n    env: Optional[Union[str, RL4COEnvBase]] = None,\n    calc_reward: bool = True,\n    phase: str = \"train\",\n    actions=None,\n    return_actions: bool = True,\n    return_hidden: bool = True,\n    **kwargs,\n):\n    \"\"\"\n    Forward method. During validation and testing, the policy runs the ACO algorithm to construct solutions.\n    See :class:`NonAutoregressivePolicy` for more details during the training phase.\n    \"\"\"\n    n_ants = self.n_ants[phase]\n    # Instantiate environment if needed\n    if (phase != \"train\" or self.ls_reward_aug_W > 0) and (env is None or isinstance(env, str)):\n        env_name = self.env_name if env is None else env\n        env = get_env(env_name)\n\n    if phase == \"train\":\n        select_start_nodes_fn = partial(\n            self.aco_class.select_start_node_fn, start_node=self.aco_kwargs.get(\"start_node\", None)\n        )\n        kwargs.update({\"select_start_nodes_fn\": select_start_nodes_fn})\n        #  we just use the constructive policy\n        outdict = super().forward(\n            td_initial,\n            env,\n            phase=phase,\n            decode_type=\"multistart_sampling\",\n            calc_reward=calc_reward,\n            num_starts=n_ants,\n            actions=actions,\n            return_actions=return_actions,\n            return_hidden=return_hidden,\n            **kwargs,\n        )\n\n        # manually compute the advantage\n        reward = unbatchify(outdict[\"reward\"], n_ants)\n        advantage = reward - reward.mean(dim=1, keepdim=True)\n\n        if self.ls_reward_aug_W > 0 and self.train_with_local_search:\n            heatmap_logits = outdict[\"hidden\"]\n            aco = self.aco_class(\n                heatmap_logits,\n                n_ants=n_ants,\n                temperature=self.aco_kwargs.get(\"temperature\", self.temperature),\n                **self.aco_kwargs,\n            )\n\n            actions = 
outdict[\"actions\"]\n            _, ls_reward = aco.local_search(batchify(td_initial, n_ants), env, actions)\n\n            ls_reward = unbatchify(ls_reward, n_ants)\n            ls_advantage = ls_reward - ls_reward.mean(dim=1, keepdim=True)\n            advantage = advantage * (1 - self.ls_reward_aug_W) + ls_advantage * self.ls_reward_aug_W\n\n        outdict[\"advantage\"] = advantage\n        outdict[\"log_likelihood\"] = unbatchify(outdict[\"log_likelihood\"], n_ants)\n\n        return outdict\n\n    heatmap_logits, _ = self.encoder(td_initial)\n\n    aco = self.aco_class(\n        heatmap_logits,\n        n_ants=self.n_ants[phase],\n        temperature=self.aco_kwargs.get(\"temperature\", self.temperature),\n        **self.aco_kwargs,\n    )\n    td, actions, reward = aco.run(td_initial, env, self.n_iterations[phase])\n\n    out = {}\n    if calc_reward:\n        out[\"reward\"] = reward\n    if return_actions:\n        out[\"actions\"] = actions\n\n    return out\n
"},{"location":"docs/content/api/zoo/constructive_nar/#nar-gnn","title":"NAR-GNN","text":"

Classes:

  • NARGNNPolicy \u2013

    Base Non-autoregressive policy for NCO construction methods.

Classes:

  • EdgeHeatmapGenerator \u2013

    MLP for converting edge embeddings to heatmaps.

  • NARGNNEncoder \u2013

    Anisotropic Graph Neural Network encoder with edge-gating mechanism as in Joshi et al. (2022), and used in DeepACO (Ye et al., 2023).

  • NARGNNNodeEncoder \u2013

    In this case, we just use the node embeddings from the graph

"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.nargnn.policy.NARGNNPolicy","title":"NARGNNPolicy","text":"
NARGNNPolicy(\n    encoder: Optional[NonAutoregressiveEncoder] = None,\n    decoder: Optional[NonAutoregressiveDecoder] = None,\n    embed_dim: int = 64,\n    env_name: str = \"tsp\",\n    init_embedding: Optional[Module] = None,\n    edge_embedding: Optional[Module] = None,\n    graph_network: Optional[Module] = None,\n    heatmap_generator: Optional[Module] = None,\n    num_layers_heatmap_generator: int = 5,\n    num_layers_graph_encoder: int = 15,\n    act_fn=\"silu\",\n    agg_fn=\"mean\",\n    linear_bias: bool = True,\n    train_decode_type: str = \"multistart_sampling\",\n    val_decode_type: str = \"multistart_greedy\",\n    test_decode_type: str = \"multistart_greedy\",\n    **constructive_policy_kw\n)\n

Bases: NonAutoregressivePolicy

Base Non-autoregressive policy for NCO construction methods. This creates a heatmap of NxN for N nodes (i.e., heuristic) that models the probability to go from one node to another for all nodes.

The policy performs the following steps
  1. Encode the environment initial state into node embeddings
  2. Decode (non-autoregressively) to construct the solution to the NCO problem
Warning

The effectiveness of the non-autoregressive approach can vary significantly across different problem types and configurations. It may require careful tuning of the model architecture and decoding strategy to achieve competitive results.

Parameters:

  • encoder (Optional[NonAutoregressiveEncoder], default: None ) \u2013

    Encoder module. Can be passed by sub-classes

  • decoder (Optional[NonAutoregressiveDecoder], default: None ) \u2013

    Decoder module. Note that this module defaults to the non-autoregressive decoder

  • embed_dim (int, default: 64 ) \u2013

    Dimension of the embeddings

  • env_name (str, default: 'tsp' ) \u2013

    Name of the environment used to initialize embeddings

  • init_embedding (Optional[Module], default: None ) \u2013

    Model to use for the initial embedding. If None, use the default embedding for the environment

  • edge_embedding (Optional[Module], default: None ) \u2013

    Model to use for the edge embedding. If None, use the default embedding for the environment

  • graph_network (Optional[Module], default: None ) \u2013

    Model to use for the graph network. If None, use the default network for the environment

  • heatmap_generator (Optional[Module], default: None ) \u2013

    Model to use for the heatmap generator. If None, use the default network for the environment

  • num_layers_heatmap_generator (int, default: 5 ) \u2013

    Number of layers in the heatmap generator

  • num_layers_graph_encoder (int, default: 15 ) \u2013

    Number of layers in the graph encoder

  • act_fn \u2013

    Activation function to use in the encoder

  • agg_fn \u2013

    Aggregation function to use in the encoder

  • linear_bias (bool, default: True ) \u2013

    Whether to use bias in the encoder

  • train_decode_type (str, default: 'multistart_sampling' ) \u2013

    Type of decoding during training

  • val_decode_type (str, default: 'multistart_greedy' ) \u2013

    Type of decoding during validation

  • test_decode_type (str, default: 'multistart_greedy' ) \u2013

    Type of decoding during testing

  • **constructive_policy_kw \u2013

    Unused keyword arguments

Source code in rl4co/models/zoo/nargnn/policy.py
def __init__(\n    self,\n    encoder: Optional[NonAutoregressiveEncoder] = None,\n    decoder: Optional[NonAutoregressiveDecoder] = None,\n    embed_dim: int = 64,\n    env_name: str = \"tsp\",\n    init_embedding: Optional[nn.Module] = None,\n    edge_embedding: Optional[nn.Module] = None,\n    graph_network: Optional[nn.Module] = None,\n    heatmap_generator: Optional[nn.Module] = None,\n    num_layers_heatmap_generator: int = 5,\n    num_layers_graph_encoder: int = 15,\n    act_fn=\"silu\",\n    agg_fn=\"mean\",\n    linear_bias: bool = True,\n    train_decode_type: str = \"multistart_sampling\",\n    val_decode_type: str = \"multistart_greedy\",\n    test_decode_type: str = \"multistart_greedy\",\n    **constructive_policy_kw,\n):\n    if len(constructive_policy_kw) > 0:\n        log.warn(f\"Unused kwargs: {constructive_policy_kw}\")\n\n    if encoder is None:\n        encoder = NARGNNEncoder(\n            embed_dim=embed_dim,\n            env_name=env_name,\n            init_embedding=init_embedding,\n            edge_embedding=edge_embedding,\n            graph_network=graph_network,\n            heatmap_generator=heatmap_generator,\n            num_layers_heatmap_generator=num_layers_heatmap_generator,\n            num_layers_graph_encoder=num_layers_graph_encoder,\n            act_fn=act_fn,\n            agg_fn=agg_fn,\n            linear_bias=linear_bias,\n        )\n\n    # The decoder generates logits given the current td and heatmap\n    if decoder is None:\n        decoder = NonAutoregressiveDecoder()\n    else:\n        # check if the decoder has trainable parameters\n        if any(p.requires_grad for p in decoder.parameters()):\n            log.error(\n                \"The decoder contains trainable parameters. 
This should not happen in a non-autoregressive policy.\"\n            )\n\n    # Pass to constructive policy\n    super(NARGNNPolicy, self).__init__(\n        encoder=encoder,\n        decoder=decoder,\n        env_name=env_name,\n        train_decode_type=train_decode_type,\n        val_decode_type=val_decode_type,\n        test_decode_type=test_decode_type,\n        **constructive_policy_kw,\n    )\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.nargnn.encoder.EdgeHeatmapGenerator","title":"EdgeHeatmapGenerator","text":"
EdgeHeatmapGenerator(\n    embed_dim: int,\n    num_layers: int,\n    act_fn: Union[str, Callable] = \"silu\",\n    linear_bias: bool = True,\n    undirected_graph: bool = True,\n)\n

Bases: Module

MLP for converting edge embeddings to heatmaps.

Parameters:

  • embed_dim (int) \u2013

    Dimension of the embeddings

  • num_layers (int) \u2013

    The number of linear layers in the network.

  • act_fn (Union[str, Callable], default: 'silu' ) \u2013

    Activation function. Defaults to \"silu\".

  • linear_bias (bool, default: True ) \u2013

    Use bias in linear layers. Defaults to True.

  • undirected_graph (bool, default: True ) \u2013

    Whether the graph is undirected. Defaults to True.

Source code in rl4co/models/zoo/nargnn/encoder.py
def __init__(\n    self,\n    embed_dim: int,\n    num_layers: int,\n    act_fn: Union[str, Callable] = \"silu\",\n    linear_bias: bool = True,\n    undirected_graph: bool = True,\n) -> None:\n    super(EdgeHeatmapGenerator, self).__init__()\n\n    self.linears = nn.ModuleList(\n        [\n            nn.Linear(embed_dim, embed_dim, bias=linear_bias)\n            for _ in range(num_layers - 1)\n        ]\n    )\n    self.output = nn.Linear(embed_dim, 1, bias=linear_bias)\n\n    self.act = getattr(nn.functional, act_fn) if isinstance(act_fn, str) else act_fn\n\n    self.undirected_graph = undirected_graph\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.nargnn.encoder.NARGNNEncoder","title":"NARGNNEncoder","text":"
NARGNNEncoder(\n    embed_dim: int = 64,\n    env_name: str = \"tsp\",\n    init_embedding: Optional[Module] = None,\n    edge_embedding: Optional[Module] = None,\n    graph_network: Optional[Module] = None,\n    heatmap_generator: Optional[Module] = None,\n    num_layers_heatmap_generator: int = 5,\n    num_layers_graph_encoder: int = 15,\n    act_fn=\"silu\",\n    agg_fn=\"mean\",\n    linear_bias: bool = True,\n    k_sparse: Optional[int] = None,\n)\n

Bases: NonAutoregressiveEncoder

Anisotropic Graph Neural Network encoder with edge-gating mechanism as in Joshi et al. (2022), and used in DeepACO (Ye et al., 2023). This creates a heatmap of NxN for N nodes (i.e., heuristic) that models the probability to go from one node to another for all nodes. This model utilizes a multi-layer perceptron (MLP) approach to predict edge attributes directly from the input graph features, which are then transformed into a heatmap representation to facilitate the decoding of the solution. The decoding process is managed by a specified strategy which could vary from simple greedy selection to more complex sampling methods.

Tip

This decoder's performance heavily relies on the ability of the MLP to capture the dependencies between different parts of the solution without the iterative refinement provided by autoregressive models. It is particularly useful in scenarios where the solution space can be effectively explored in a parallelized manner or when the solution components are largely independent.

Parameters:

  • embed_dim (int, default: 64 ) \u2013

    Dimension of the node embeddings

  • env_name (str, default: 'tsp' ) \u2013

    Name of the environment used to initialize embeddings

  • num_layers \u2013

    Number of layers in the encoder

  • init_embedding (Optional[Module], default: None ) \u2013

    Model to use for the initial embedding. If None, use the default embedding for the environment

  • edge_embedding (Optional[Module], default: None ) \u2013

    Model to use for the edge embedding. If None, use the default embedding for the environment

  • graph_network (Optional[Module], default: None ) \u2013

    Model to use for the graph network. If None, use the default network for the environment

  • heatmap_generator (Optional[Module], default: None ) \u2013

    Model to use for the heatmap generator. If None, use the default network for the environment

  • num_layers_heatmap_generator (int, default: 5 ) \u2013

    Number of layers in the heatmap generator

  • num_layers_graph_encoder (int, default: 15 ) \u2013

    Number of layers in the graph encoder

  • act_fn \u2013

    The activation function to use in each GNNLayer, see https://pytorch.org/docs/stable/nn.functional.html#non-linear-activation-functions for available options. Defaults to 'silu'.

  • agg_fn \u2013

    The aggregation function to use in each GNNLayer for pooling features. Options: 'add', 'mean', 'max'. Defaults to 'mean'.

  • linear_bias (bool, default: True ) \u2013

    Use bias in linear layers. Defaults to True.

  • k_sparse (Optional[int], default: None ) \u2013

    Number of edges to keep for each node. Defaults to None.

Methods:

  • forward \u2013

    Forward pass of the encoder.

Source code in rl4co/models/zoo/nargnn/encoder.py
def __init__(\n    self,\n    embed_dim: int = 64,\n    env_name: str = \"tsp\",\n    # TODO: pass network\n    init_embedding: Optional[nn.Module] = None,\n    edge_embedding: Optional[nn.Module] = None,\n    graph_network: Optional[nn.Module] = None,\n    heatmap_generator: Optional[nn.Module] = None,\n    num_layers_heatmap_generator: int = 5,\n    num_layers_graph_encoder: int = 15,\n    act_fn=\"silu\",\n    agg_fn=\"mean\",\n    linear_bias: bool = True,\n    k_sparse: Optional[int] = None,\n):\n    super(NonAutoregressiveEncoder, self).__init__()\n    self.env_name = env_name\n\n    self.init_embedding = (\n        env_init_embedding(self.env_name, {\"embed_dim\": embed_dim})\n        if init_embedding is None\n        else init_embedding\n    )\n\n    self.edge_embedding = (\n        env_edge_embedding(self.env_name, {\"embed_dim\": embed_dim, \"k_sparse\": k_sparse})\n        if edge_embedding is None\n        else edge_embedding\n    )\n\n    self.graph_network = (\n        GNNEncoder(\n            embed_dim=embed_dim,\n            num_layers=num_layers_graph_encoder,\n            act_fn=act_fn,\n            agg_fn=agg_fn,\n        )\n        if graph_network is None\n        else graph_network\n    )\n\n    self.heatmap_generator = (\n        EdgeHeatmapGenerator(\n            embed_dim=embed_dim,\n            num_layers=num_layers_heatmap_generator,\n            linear_bias=linear_bias,\n        )\n        if heatmap_generator is None\n        else heatmap_generator\n    )\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.nargnn.encoder.NARGNNEncoder.forward","title":"forward","text":"
forward(td: TensorDict)\n

Forward pass of the encoder. Transform the input TensorDict into the latent representation.

Source code in rl4co/models/zoo/nargnn/encoder.py
def forward(self, td: TensorDict):\n    \"\"\"Forward pass of the encoder.\n    Transform the input TensorDict into the latent representation.\n    \"\"\"\n    # Transfer to embedding space\n    node_embed = self.init_embedding(td)\n    graph = self.edge_embedding(td, node_embed)\n\n    # Process embedding into graph\n    # TODO: standardize?\n    graph.x, graph.edge_attr = self.graph_network(\n        graph.x, graph.edge_index, graph.edge_attr\n    )\n\n    # Generate heatmap logits\n    heatmap_logits = self.heatmap_generator(graph)\n\n    # Return latent representation (i.e. heatmap logits) and initial embeddings\n    return heatmap_logits, node_embed\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.nargnn.encoder.NARGNNNodeEncoder","title":"NARGNNNodeEncoder","text":"
NARGNNNodeEncoder(\n    embed_dim: int = 64,\n    env_name: str = \"tsp\",\n    init_embedding: Optional[Module] = None,\n    edge_embedding: Optional[Module] = None,\n    graph_network: Optional[Module] = None,\n    heatmap_generator: Optional[Module] = None,\n    num_layers_heatmap_generator: int = 5,\n    num_layers_graph_encoder: int = 15,\n    act_fn=\"silu\",\n    agg_fn=\"mean\",\n    linear_bias: bool = True,\n    k_sparse: Optional[int] = None,\n)\n

Bases: NARGNNEncoder

In this case, we just use the node embeddings from the graph without transforming them into a heatmap.

Methods:

  • forward \u2013

    Forward pass of the encoder.

Source code in rl4co/models/zoo/nargnn/encoder.py
def __init__(\n    self,\n    embed_dim: int = 64,\n    env_name: str = \"tsp\",\n    # TODO: pass network\n    init_embedding: Optional[nn.Module] = None,\n    edge_embedding: Optional[nn.Module] = None,\n    graph_network: Optional[nn.Module] = None,\n    heatmap_generator: Optional[nn.Module] = None,\n    num_layers_heatmap_generator: int = 5,\n    num_layers_graph_encoder: int = 15,\n    act_fn=\"silu\",\n    agg_fn=\"mean\",\n    linear_bias: bool = True,\n    k_sparse: Optional[int] = None,\n):\n    super(NonAutoregressiveEncoder, self).__init__()\n    self.env_name = env_name\n\n    self.init_embedding = (\n        env_init_embedding(self.env_name, {\"embed_dim\": embed_dim})\n        if init_embedding is None\n        else init_embedding\n    )\n\n    self.edge_embedding = (\n        env_edge_embedding(self.env_name, {\"embed_dim\": embed_dim, \"k_sparse\": k_sparse})\n        if edge_embedding is None\n        else edge_embedding\n    )\n\n    self.graph_network = (\n        GNNEncoder(\n            embed_dim=embed_dim,\n            num_layers=num_layers_graph_encoder,\n            act_fn=act_fn,\n            agg_fn=agg_fn,\n        )\n        if graph_network is None\n        else graph_network\n    )\n\n    self.heatmap_generator = (\n        EdgeHeatmapGenerator(\n            embed_dim=embed_dim,\n            num_layers=num_layers_heatmap_generator,\n            linear_bias=linear_bias,\n        )\n        if heatmap_generator is None\n        else heatmap_generator\n    )\n
"},{"location":"docs/content/api/zoo/constructive_nar/#models.zoo.nargnn.encoder.NARGNNNodeEncoder.forward","title":"forward","text":"
forward(td: TensorDict)\n

Forward pass of the encoder. Transform the input TensorDict into the latent representation.

Source code in rl4co/models/zoo/nargnn/encoder.py
def forward(self, td: TensorDict):\n    # Transfer to embedding space\n    node_embed = self.init_embedding(td)\n    graph = self.edge_embedding(td, node_embed)\n\n    # Process embedding into graph\n    # TODO: standardize?\n    graph.x, graph.edge_attr = self.graph_network(\n        graph.x, graph.edge_index, graph.edge_attr\n    )\n\n    proc_embeds = graph.x\n    batch_size = node_embed.shape[0]\n    # reshape proc_embeds from [bs*n, h] to [bs, n, h]\n    proc_embeds = proc_embeds.reshape(batch_size, -1, proc_embeds.shape[1])\n    return proc_embeds, node_embed\n
"},{"location":"docs/content/api/zoo/improvement/","title":"Improvement Methods","text":"

These methods are trained to improve existing solutions iteratively, akin to local search algorithms. They focus on refining existing solutions rather than generating them from scratch.

"},{"location":"docs/content/api/zoo/improvement/#dact","title":"DACT","text":"

Classes:

  • DACTEncoder \u2013

    Dual-Aspect Collaborative Transformer Encoder as in Ma et al. (2021)

Classes:

  • DACTDecoder \u2013

    DACT decoder based on Ma et al. (2021)

Classes:

  • DACTPolicy \u2013

    DACT Policy based on Ma et al. (2021)

Classes:

  • DACT \u2013

    DACT Model based on n_step Proximal Policy Optimization (PPO) with a DACT model policy.

"},{"location":"docs/content/api/zoo/improvement/#models.zoo.dact.encoder.DACTEncoder","title":"DACTEncoder","text":"
DACTEncoder(\n    embed_dim: int = 64,\n    init_embedding: Module = None,\n    pos_embedding: Module = None,\n    env_name: str = \"tsp_kopt\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 64,\n)\n

Bases: ImprovementEncoder

Dual-Aspect Collaborative Transformer Encoder as in Ma et al. (2021)

Parameters:

  • embed_dim (int, default: 64 ) \u2013

    Dimension of the embedding space

  • init_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the node embeddings

  • pos_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the positional embeddings

  • env_name (str, default: 'tsp_kopt' ) \u2013

    Name of the environment used to initialize embeddings

  • pos_type (str, default: 'CPE' ) \u2013

    Name of the used positional encoding method (CPE or APE)

  • num_heads (int, default: 4 ) \u2013

    Number of heads in the attention layers

  • num_layers (int, default: 3 ) \u2013

    Number of layers in the attention network

  • normalization (str, default: 'layer' ) \u2013

    Normalization type in the attention layers

  • feedforward_hidden (int, default: 64 ) \u2013

    Hidden dimension in the feedforward layers

Source code in rl4co/models/zoo/dact/encoder.py
def __init__(\n    self,\n    embed_dim: int = 64,\n    init_embedding: nn.Module = None,\n    pos_embedding: nn.Module = None,\n    env_name: str = \"tsp_kopt\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 64,\n):\n    super(DACTEncoder, self).__init__(\n        embed_dim=embed_dim,\n        env_name=env_name,\n        pos_type=pos_type,\n        num_heads=num_heads,\n        num_layers=num_layers,\n        normalization=normalization,\n        feedforward_hidden=feedforward_hidden,\n    )\n\n    assert self.env_name in [\"tsp_kopt\"], NotImplementedError()\n\n    self.net = AdaptiveSequential(\n        *(\n            DACTEncoderLayer(\n                num_heads,\n                embed_dim,\n                feedforward_hidden,\n                normalization,\n            )\n            for _ in range(num_layers)\n        )\n    )\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.dact.decoder.DACTDecoder","title":"DACTDecoder","text":"
DACTDecoder(embed_dim: int = 64, num_heads: int = 4)\n

Bases: ImprovementDecoder

DACT decoder based on Ma et al. (2021). Given the environment state and the dual sets of embeddings (PFE, NFE embeddings), compute the logits for selecting two nodes for the 2-opt local search from the current solution.

Parameters:

  • embed_dim (int, default: 64 ) \u2013

    Embedding dimension

  • num_heads (int, default: 4 ) \u2013

    Number of attention heads

Methods:

  • forward \u2013

    Compute the logits for removing a node pair from the current solution

Source code in rl4co/models/zoo/dact/decoder.py
def __init__(\n    self,\n    embed_dim: int = 64,\n    num_heads: int = 4,\n):\n    super().__init__()\n    self.embed_dim = embed_dim\n    self.n_heads = num_heads\n    self.hidden_dim = embed_dim\n\n    # for MHC sublayer (NFE aspect)\n    self.compater_node = MultiHeadCompat(\n        num_heads, embed_dim, embed_dim, embed_dim, embed_dim\n    )\n\n    # for MHC sublayer (PFE aspect)\n    self.compater_pos = MultiHeadCompat(\n        num_heads, embed_dim, embed_dim, embed_dim, embed_dim\n    )\n\n    self.norm_factor = 1 / math.sqrt(1 * self.hidden_dim)\n\n    # for Max-Pooling sublayer\n    self.project_graph_pos = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.project_graph_node = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.project_node_pos = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.project_node_node = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n\n    # for feed-forward aggregation (FFA)sublayer\n    self.value_head = MLP(\n        input_dim=2 * self.n_heads,\n        output_dim=1,\n        num_neurons=[32, 32],\n        dropout_probs=[0.05, 0.00],\n    )\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.dact.decoder.DACTDecoder.forward","title":"forward","text":"
forward(\n    td: TensorDict, final_h: Tensor, final_p: Tensor\n) -> Tensor\n

Compute the logits for removing a node pair from the current solution

Parameters:

  • td (TensorDict) \u2013

    TensorDict with the current environment state

  • final_h (Tensor) \u2013

    final NFE embeddings

  • final_p (Tensor) \u2013

    final PFE embeddings

Source code in rl4co/models/zoo/dact/decoder.py
def forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> Tensor:\n    \"\"\"Compute the logits of the removing a node pair from the current solution\n\n    Args:\n        td: TensorDict with the current environment state\n        final_h: final NFE embeddings\n        final_p: final pfe embeddings\n    \"\"\"\n\n    batch_size, graph_size, dim = final_h.size()\n\n    # Max-Pooling sublayer\n    h_node_refined = self.project_node_node(final_h) + self.project_graph_node(\n        final_h.max(1)[0]\n    )[:, None, :].expand(batch_size, graph_size, dim)\n    h_pos_refined = self.project_node_pos(final_p) + self.project_graph_pos(\n        final_p.max(1)[0]\n    )[:, None, :].expand(batch_size, graph_size, dim)\n\n    # MHC sublayer\n    compatibility = torch.zeros(\n        (batch_size, graph_size, graph_size, self.n_heads * 2),\n        device=h_node_refined.device,\n    )\n    compatibility[:, :, :, : self.n_heads] = self.compater_pos(h_pos_refined).permute(\n        1, 2, 3, 0\n    )\n    compatibility[:, :, :, self.n_heads :] = self.compater_node(\n        h_node_refined\n    ).permute(1, 2, 3, 0)\n\n    # FFA sublater\n    return self.value_head(self.norm_factor * compatibility).squeeze(-1)\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.dact.policy.DACTPolicy","title":"DACTPolicy","text":"
DACTPolicy(\n    embed_dim: int = 64,\n    num_encoder_layers: int = 3,\n    num_heads: int = 4,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 64,\n    env_name: str = \"tsp_kopt\",\n    pos_type: str = \"CPE\",\n    init_embedding: Module = None,\n    pos_embedding: Module = None,\n    temperature: float = 1.0,\n    tanh_clipping: float = 6.0,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n)\n

Bases: ImprovementPolicy

DACT Policy based on Ma et al. (2021). This model first encodes the input graph and current solution using a DACT encoder (:class:DACTEncoder) and then decodes the 2-opt action (:class:DACTDecoder).

Parameters:

  • embed_dim (int, default: 64 ) \u2013

    Dimension of the node embeddings

  • num_encoder_layers (int, default: 3 ) \u2013

    Number of layers in the encoder

  • num_heads (int, default: 4 ) \u2013

    Number of heads in the attention layers

  • normalization (str, default: 'layer' ) \u2013

    Normalization type in the attention layers

  • feedforward_hidden (int, default: 64 ) \u2013

    Dimension of the hidden layer in the feedforward network

  • env_name (str, default: 'tsp_kopt' ) \u2013

    Name of the environment used to initialize embeddings

  • pos_type (str, default: 'CPE' ) \u2013

    Name of the used positional encoding method (CPE or APE)

  • init_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the embeddings

  • pos_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the positional embeddings

  • temperature (float, default: 1.0 ) \u2013

    Temperature for the softmax

  • tanh_clipping (float, default: 6.0 ) \u2013

    Tanh clipping value (see Bello et al., 2016)

  • train_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during training

  • val_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during validation

  • test_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during testing

Methods:

  • forward \u2013

    Forward pass of the policy.

Source code in rl4co/models/zoo/dact/policy.py
def __init__(\n    self,\n    embed_dim: int = 64,\n    num_encoder_layers: int = 3,\n    num_heads: int = 4,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 64,\n    env_name: str = \"tsp_kopt\",\n    pos_type: str = \"CPE\",\n    init_embedding: nn.Module = None,\n    pos_embedding: nn.Module = None,\n    temperature: float = 1.0,\n    tanh_clipping: float = 6.0,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n):\n    super(DACTPolicy, self).__init__()\n\n    self.env_name = env_name\n\n    # Encoder and decoder\n    self.encoder = DACTEncoder(\n        embed_dim=embed_dim,\n        init_embedding=init_embedding,\n        pos_embedding=pos_embedding,\n        env_name=env_name,\n        pos_type=pos_type,\n        num_heads=num_heads,\n        num_layers=num_encoder_layers,\n        normalization=normalization,\n        feedforward_hidden=feedforward_hidden,\n    )\n\n    self.decoder = DACTDecoder(embed_dim=embed_dim, num_heads=num_heads)\n\n    # Decoding strategies\n    self.temperature = temperature\n    self.tanh_clipping = tanh_clipping\n    self.train_decode_type = train_decode_type\n    self.val_decode_type = val_decode_type\n    self.test_decode_type = test_decode_type\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.dact.policy.DACTPolicy.forward","title":"forward","text":"
forward(\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_embeds: bool = False,\n    only_return_embed: bool = False,\n    actions=None,\n    **decoding_kwargs\n) -> dict\n

Forward pass of the policy.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the environment state

  • env (Union[str, RL4COEnvBase], default: None ) \u2013

    Environment to use for decoding. If None, the environment is instantiated from env_name. Note that it is more efficient to pass an already instantiated environment each time for fine-grained control

  • phase (str, default: 'train' ) \u2013

    Phase of the algorithm (train, val, test)

  • return_actions (bool, default: True ) \u2013

    Whether to return the actions

  • actions \u2013

    Actions to use for evaluating the policy. If passed, use these actions instead of sampling from the policy to calculate log likelihood

  • decoding_kwargs \u2013

    Keyword arguments for the decoding strategy. See :class:rl4co.utils.decoding.DecodingStrategy for more information.

Returns:

  • out ( dict ) \u2013

    Dictionary containing the reward, log likelihood, and optionally the actions and entropy

Source code in rl4co/models/zoo/dact/policy.py
def forward(\n    self,\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_embeds: bool = False,\n    only_return_embed: bool = False,\n    actions=None,\n    **decoding_kwargs,\n) -> dict:\n    \"\"\"Forward pass of the policy.\n\n    Args:\n        td: TensorDict containing the environment state\n        env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that\n            it is more efficient to pass an already instantiated environment each time for fine-grained control\n        phase: Phase of the algorithm (train, val, test)\n        return_actions: Whether to return the actions\n        actions: Actions to use for evaluating the policy.\n            If passed, use these actions instead of sampling from the policy to calculate log likelihood\n        decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.\n\n    Returns:\n        out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy\n    \"\"\"\n\n    # Encoder: get encoder output and initial embeddings from initial state\n    NFE, PFE = self.encoder(td)\n    h_featrues = torch.cat((NFE, PFE), -1)\n\n    if only_return_embed:\n        return {\"embeds\": h_featrues.detach()}\n\n    # Instantiate environment if needed\n    if isinstance(env, str) or env is None:\n        env_name = self.env_name if env is None else env\n        log.info(f\"Instantiated environment not provided; instantiating {env_name}\")\n        env = get_env(env_name)\n    assert env.two_opt_mode, \"DACT only support 2-opt\"\n\n    # Get decode type depending on phase and whether actions are passed for evaluation\n    decode_type = decoding_kwargs.pop(\"decode_type\", None)\n    if actions is not None:\n        decode_type = \"evaluate\"\n    elif decode_type is None:\n        decode_type = 
getattr(self, f\"{phase}_decode_type\")\n\n    # Setup decoding strategy\n    # we pop arguments that are not part of the decoding strategy\n    decode_strategy: DecodingStrategy = get_decoding_strategy(\n        decode_type,\n        temperature=decoding_kwargs.pop(\"temperature\", self.temperature),\n        tanh_clipping=decoding_kwargs.pop(\"tanh_clipping\", self.tanh_clipping),\n        mask_logits=True,\n        improvement_method_mode=True,\n        **decoding_kwargs,\n    )\n\n    # Perform the decoding\n    batch_size, seq_length = td[\"rec_current\"].size()\n    logits = self.decoder(td, NFE, PFE).view(batch_size, -1)\n\n    # Get mask\n    mask = env.get_mask(td)\n    if \"action\" in td.keys():\n        mask[torch.arange(batch_size), td[\"action\"][:, 0], td[\"action\"][:, 1]] = False\n        mask[torch.arange(batch_size), td[\"action\"][:, 1], td[\"action\"][:, 0]] = False\n    mask = mask.view(batch_size, -1)\n\n    # Get action and log-likelihood\n    logprob, action_sampled = decode_strategy.step(\n        logits,\n        mask,\n        action=(\n            actions[:, 0] * seq_length + actions[:, 1]\n            if actions is not None\n            else None\n        ),\n    )\n    action_sampled = action_sampled.unsqueeze(-1)\n    if phase == \"train\":\n        log_likelihood = logprob.gather(1, action_sampled)\n    else:\n        log_likelihood = torch.zeros(batch_size, device=td.device)\n\n    ## return\n    DACT_action = torch.cat(\n        (\n            action_sampled // seq_length,\n            action_sampled % seq_length,\n        ),\n        -1,\n    )\n\n    outdict = {\"log_likelihood\": log_likelihood, \"cost_bsf\": td[\"cost_bsf\"]}\n    td.set(\"action\", DACT_action)\n\n    if return_embeds:\n        outdict[\"embeds\"] = h_featrues.detach()\n\n    if return_actions:\n        outdict[\"actions\"] = DACT_action\n\n    return outdict\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.dact.model.DACT","title":"DACT","text":"
DACT(\n    env: RL4COEnvBase,\n    policy: Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs\n)\n

Bases: n_step_PPO

DACT Model based on n_step Proximal Policy Optimization (PPO) with a DACT model policy. We default to the DACT model policy and the improvement Critic Network.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (Module, default: None ) \u2013

    Policy to use for the algorithm

  • critic (CriticNetwork, default: None ) \u2013

    Critic to use for the algorithm

  • policy_kwargs (dict, default: {} ) \u2013

    Keyword arguments for policy

  • critic_kwargs (dict, default: {} ) \u2013

    Keyword arguments for critic

Source code in rl4co/models/zoo/dact/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs,\n):\n    if policy is None:\n        policy = DACTPolicy(env_name=env.name, **policy_kwargs)\n\n    if critic is None:\n        embed_dim = (\n            policy_kwargs[\"embed_dim\"] * 2 if \"embed_dim\" in policy_kwargs else 128\n        )  # the critic's embed_dim must be as policy's\n\n        encoder = MultiHeadAttentionLayer(\n            embed_dim,\n            critic_kwargs[\"num_heads\"] if \"num_heads\" in critic_kwargs else 4,\n            critic_kwargs[\"feedforward_hidden\"] * 2\n            if \"feedforward_hidden\" in critic_kwargs\n            else 128,\n            critic_kwargs[\"normalization\"]\n            if \"normalization\" in critic_kwargs\n            else \"layer\",\n            bias=False,\n        )\n        value_head = CriticDecoder(embed_dim)\n\n        critic = CriticNetwork(\n            encoder=encoder,\n            value_head=value_head,\n            customized=True,\n        )\n\n    super().__init__(env, policy, critic, **kwargs)\n
"},{"location":"docs/content/api/zoo/improvement/#n2s","title":"N2S","text":"

Classes:

  • N2SEncoder \u2013

    Neural Neighborhood Search Encoder as in Ma et al. (2022)

Classes:

  • NodePairRemovalDecoder \u2013

    N2S Node-Pair Removal decoder based on Ma et al. (2022)

  • NodePairReinsertionDecoder \u2013

    N2S Node-Pair Reinsertion decoder based on Ma et al. (2022)

Classes:

  • N2SPolicy \u2013

    N2S Policy based on Ma et al. (2022)

Classes:

  • N2S \u2013

    N2S Model based on n_step Proximal Policy Optimization (PPO) with an N2S model policy.

"},{"location":"docs/content/api/zoo/improvement/#models.zoo.n2s.encoder.N2SEncoder","title":"N2SEncoder","text":"
N2SEncoder(\n    embed_dim: int = 128,\n    init_embedding: Module = None,\n    pos_embedding: Module = None,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n)\n

Bases: ImprovementEncoder

Neural Neighborhood Search Encoder as in Ma et al. (2022). First embed the input and then process it with a Graph Attention Network.

Parameters:

  • embed_dim (int, default: 128 ) \u2013

    Dimension of the embedding space

  • init_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the node embeddings

  • pos_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the positional embeddings

  • env_name (str, default: 'pdp_ruin_repair' ) \u2013

    Name of the environment used to initialize embeddings

  • pos_type (str, default: 'CPE' ) \u2013

    Name of the used positional encoding method (CPE or APE)

  • num_heads (int, default: 4 ) \u2013

    Number of heads in the attention layers

  • num_layers (int, default: 3 ) \u2013

    Number of layers in the attention network

  • normalization (str, default: 'layer' ) \u2013

    Normalization type in the attention layers

  • feedforward_hidden (int, default: 128 ) \u2013

    Hidden dimension in the feedforward layers

Source code in rl4co/models/zoo/n2s/encoder.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    init_embedding: nn.Module = None,\n    pos_embedding: nn.Module = None,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    num_heads: int = 4,\n    num_layers: int = 3,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n):\n    super(N2SEncoder, self).__init__(\n        embed_dim=embed_dim,\n        init_embedding=init_embedding,\n        pos_embedding=pos_embedding,\n        env_name=env_name,\n        pos_type=pos_type,\n        num_heads=num_heads,\n        num_layers=num_layers,\n        normalization=normalization,\n        feedforward_hidden=feedforward_hidden,\n    )\n\n    self.pos_net = MultiHeadCompat(num_heads, embed_dim, feedforward_hidden)\n\n    self.net = AdaptiveSequential(\n        *(\n            N2SEncoderLayer(\n                num_heads,\n                embed_dim,\n                feedforward_hidden,\n                normalization,\n            )\n            for _ in range(num_layers)\n        )\n    )\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.n2s.decoder.NodePairRemovalDecoder","title":"NodePairRemovalDecoder","text":"
NodePairRemovalDecoder(\n    embed_dim: int = 128, num_heads: int = 4\n)\n

Bases: ImprovementDecoder

N2S Node-Pair Removal decoder based on Ma et al. (2022). Given the environment state and the node embeddings (positional embeddings are discarded), compute the logits for selecting a pair of pickup and delivery nodes for node pair removal from the current solution.

Parameters:

  • embed_dim (int, default: 128 ) \u2013

    Embedding dimension

  • num_heads (int, default: 4 ) \u2013

    Number of attention heads

Methods:

  • forward \u2013

    Compute the logits for removing a node pair from the current solution

Source code in rl4co/models/zoo/n2s/decoder.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    num_heads: int = 4,\n):\n    super().__init__()\n    self.input_dim = embed_dim\n    self.n_heads = num_heads\n    self.hidden_dim = embed_dim\n\n    assert embed_dim % num_heads == 0\n\n    self.W_Q = nn.Parameter(\n        torch.Tensor(self.n_heads, self.input_dim, self.hidden_dim)\n    )\n    self.W_K = nn.Parameter(\n        torch.Tensor(self.n_heads, self.input_dim, self.hidden_dim)\n    )\n\n    self.agg = MLP(input_dim=2 * self.n_heads + 4, output_dim=1, num_neurons=[32, 32])\n\n    self.init_parameters()\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.n2s.decoder.NodePairRemovalDecoder.forward","title":"forward","text":"
forward(\n    td: TensorDict, final_h: Tensor, final_p: Tensor\n) -> Tensor\n

Compute the logits for removing a node pair from the current solution

Parameters:

  • td (TensorDict) \u2013

    TensorDict with the current environment state

  • final_h (Tensor) \u2013

    final node embeddings

  • final_p (Tensor) \u2013

    final positional embeddings

Source code in rl4co/models/zoo/n2s/decoder.py
def forward(self, td: TensorDict, final_h: Tensor, final_p: Tensor) -> Tensor:\n    \"\"\"Compute the logits of the removing a node pair from the current solution\n\n    Args:\n        td: TensorDict with the current environment state\n        final_h: final node embeddings\n        final_p: final positional embeddings\n    \"\"\"\n\n    selection_recent = torch.cat(\n        (td[\"action_record\"][:, -3:], td[\"action_record\"].mean(1, True)), 1\n    )\n    solution = td[\"rec_current\"]\n\n    pre = solution.argsort()  # pre=[1,2,0]\n    post = solution.gather(\n        1, solution\n    )  # post=[1,2,0] # the second neighbour works better\n    batch_size, graph_size_plus1, input_dim = final_h.size()\n\n    hflat = final_h.contiguous().view(-1, input_dim)  #################   reshape\n\n    shp = (self.n_heads, batch_size, graph_size_plus1, self.hidden_dim)\n\n    # Calculate queries, (n_heads, batch_size, graph_size+1, key_size)\n    hidden_Q = torch.matmul(hflat, self.W_Q).view(shp)\n    hidden_K = torch.matmul(hflat, self.W_K).view(shp)\n\n    Q_pre = hidden_Q.gather(\n        2, pre.view(1, batch_size, graph_size_plus1, 1).expand_as(hidden_Q)\n    )\n    K_post = hidden_K.gather(\n        2, post.view(1, batch_size, graph_size_plus1, 1).expand_as(hidden_Q)\n    )\n\n    compatibility = (\n        (Q_pre * hidden_K).sum(-1)\n        + (hidden_Q * K_post).sum(-1)\n        - (Q_pre * K_post).sum(-1)\n    )[\n        :, :, 1:\n    ]  # (n_heads, batch_size, graph_size) (12)\n\n    compatibility_pairing = torch.cat(\n        (\n            compatibility[:, :, : graph_size_plus1 // 2],\n            compatibility[:, :, graph_size_plus1 // 2 :],\n        ),\n        0,\n    )  # (n_heads*2, batch_size, graph_size/2)\n\n    compatibility_pairing = self.agg(\n        torch.cat(\n            (\n                compatibility_pairing.permute(1, 2, 0),\n                selection_recent.permute(0, 2, 1),\n            ),\n            -1,\n        )\n    ).squeeze()  # 
(batch_size, graph_size/2)\n\n    return compatibility_pairing\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.n2s.decoder.NodePairReinsertionDecoder","title":"NodePairReinsertionDecoder","text":"
NodePairReinsertionDecoder(\n    embed_dim: int = 128, num_heads: int = 4\n)\n

Bases: ImprovementDecoder

N2S Node-Pair Reinsertion decoder based on Ma et al. (2022). Given the environment state, the node embeddings (positional embeddings are discarded), and the removed node from the NodePairRemovalDecoder, compute the logits for finding places to re-insert the removed pair of pickup and delivery nodes to form a new solution.

Parameters:

  • embed_dim (int, default: 128 ) \u2013

    Embedding dimension

  • num_heads (int, default: 4 ) \u2013

    Number of attention heads

Source code in rl4co/models/zoo/n2s/decoder.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    num_heads: int = 4,\n):\n    super().__init__()\n    self.input_dim = embed_dim\n    self.n_heads = num_heads\n    self.hidden_dim = embed_dim\n\n    assert embed_dim % num_heads == 0\n\n    self.compater_insert1 = MultiHeadCompat(\n        num_heads, embed_dim, embed_dim, embed_dim, embed_dim\n    )\n\n    self.compater_insert2 = MultiHeadCompat(\n        num_heads, embed_dim, embed_dim, embed_dim, embed_dim\n    )\n\n    self.agg = MLP(input_dim=4 * self.n_heads, output_dim=1, num_neurons=[32, 32])\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.n2s.policy.N2SPolicy","title":"N2SPolicy","text":"
N2SPolicy(\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 4,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    init_embedding: Module = None,\n    pos_embedding: Module = None,\n    temperature: float = 1.0,\n    tanh_clipping: float = 6.0,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n)\n

Bases: ImprovementPolicy

N2S Policy based on Ma et al. (2022). This model first encodes the input graph and current solution using an N2S encoder (:class:N2SEncoder) and then decodes the node-pair removal and reinsertion action using the Node-Pair Removal (:class:NodePairRemovalDecoder) and Reinsertion (:class:NodePairReinsertionDecoder) decoders.

Parameters:

  • embed_dim (int, default: 128 ) \u2013

    Dimension of the node embeddings

  • num_encoder_layers (int, default: 3 ) \u2013

    Number of layers in the encoder

  • num_heads (int, default: 4 ) \u2013

    Number of heads in the attention layers

  • normalization (str, default: 'layer' ) \u2013

    Normalization type in the attention layers

  • feedforward_hidden (int, default: 128 ) \u2013

    Dimension of the hidden layer in the feedforward network

  • env_name (str, default: 'pdp_ruin_repair' ) \u2013

    Name of the environment used to initialize embeddings

  • pos_type (str, default: 'CPE' ) \u2013

    Name of the used positional encoding method (CPE or APE)

  • init_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the embeddings

  • pos_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the positional embeddings

  • temperature (float, default: 1.0 ) \u2013

    Temperature for the softmax

  • tanh_clipping (float, default: 6.0 ) \u2013

    Tanh clipping value (see Bello et al., 2016)

  • train_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during training

  • val_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during validation

  • test_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during testing

Methods:

  • forward \u2013

    Forward pass of the policy.

Source code in rl4co/models/zoo/n2s/policy.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 4,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    env_name: str = \"pdp_ruin_repair\",\n    pos_type: str = \"CPE\",\n    init_embedding: nn.Module = None,\n    pos_embedding: nn.Module = None,\n    temperature: float = 1.0,\n    tanh_clipping: float = 6.0,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n):\n    super(N2SPolicy, self).__init__()\n\n    self.env_name = env_name\n\n    # Encoder and decoder\n    self.encoder = N2SEncoder(\n        embed_dim=embed_dim,\n        init_embedding=init_embedding,\n        pos_embedding=pos_embedding,\n        env_name=env_name,\n        pos_type=pos_type,\n        num_heads=num_heads,\n        num_layers=num_encoder_layers,\n        normalization=normalization,\n        feedforward_hidden=feedforward_hidden,\n    )\n\n    self.removal_decoder = NodePairRemovalDecoder(\n        embed_dim=embed_dim, num_heads=num_heads\n    )\n\n    self.reinsertion_decoder = NodePairReinsertionDecoder(\n        embed_dim=embed_dim, num_heads=num_heads\n    )\n\n    self.project_graph = nn.Linear(embed_dim, embed_dim, bias=False)\n    self.project_node = nn.Linear(embed_dim, embed_dim, bias=False)\n\n    # Decoding strategies\n    self.temperature = temperature\n    self.tanh_clipping = tanh_clipping\n    self.train_decode_type = train_decode_type\n    self.val_decode_type = val_decode_type\n    self.test_decode_type = test_decode_type\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.n2s.policy.N2SPolicy.forward","title":"forward","text":"
forward(\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_embeds: bool = False,\n    only_return_embed: bool = False,\n    actions=None,\n    **decoding_kwargs\n) -> dict\n

Forward pass of the policy.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the environment state

  • env (Union[str, RL4COEnvBase], default: None ) \u2013

    Environment to use for decoding. If None, the environment is instantiated from env_name. Note that it is more efficient to pass an already instantiated environment each time for fine-grained control

  • phase (str, default: 'train' ) \u2013

    Phase of the algorithm (train, val, test)

  • return_actions (bool, default: True ) \u2013

    Whether to return the actions

  • actions \u2013

    Actions to use for evaluating the policy. If passed, use these actions instead of sampling from the policy to calculate log likelihood

  • decoding_kwargs \u2013

    Keyword arguments for the decoding strategy. See :class:rl4co.utils.decoding.DecodingStrategy for more information.

Returns:

  • out ( dict ) \u2013

    Dictionary containing the log likelihood (log_likelihood) and the cost_bsf entry of the TensorDict, and optionally the embeddings (embeds) and the actions

Source code in rl4co/models/zoo/n2s/policy.py
def forward(\n    self,\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_embeds: bool = False,\n    only_return_embed: bool = False,\n    actions=None,\n    **decoding_kwargs,\n) -> dict:\n    \"\"\"Forward pass of the policy.\n\n    Args:\n        td: TensorDict containing the environment state\n        env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that\n            it is more efficient to pass an already instantiated environment each time for fine-grained control\n        phase: Phase of the algorithm (train, val, test)\n        return_actions: Whether to return the actions\n        actions: Actions to use for evaluating the policy.\n            If passed, use these actions instead of sampling from the policy to calculate log likelihood\n        decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.\n\n    Returns:\n        out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy\n    \"\"\"\n\n    # Encoder: get encoder output and initial embeddings from initial state\n    h_wave, final_p = self.encoder(td)\n    if only_return_embed:\n        return {\"embeds\": h_wave.detach()}\n    final_h = (\n        self.project_node(h_wave) + self.project_graph(h_wave.max(1)[0])[:, None, :]\n    )\n\n    # Instantiate environment if needed\n    if isinstance(env, str) or env is None:\n        env_name = self.env_name if env is None else env\n        log.info(f\"Instantiated environment not provided; instantiating {env_name}\")\n        env = get_env(env_name)\n\n    # Get decode type depending on phase and whether actions are passed for evaluation\n    decode_type = decoding_kwargs.pop(\"decode_type\", None)\n    if actions is not None:\n        decode_type = \"evaluate\"\n    elif decode_type is None:\n        
decode_type = getattr(self, f\"{phase}_decode_type\")\n\n    # Setup decoding strategy\n    # we pop arguments that are not part of the decoding strategy\n    decode_strategy: DecodingStrategy = get_decoding_strategy(\n        decode_type,\n        temperature=decoding_kwargs.pop(\"temperature\", self.temperature),\n        tanh_clipping=decoding_kwargs.pop(\"tanh_clipping\", self.tanh_clipping),\n        mask_logits=True,\n        improvement_method_mode=True,\n        **decoding_kwargs,\n    )\n\n    ## action 1\n\n    # Perform the decoding\n    logits = self.removal_decoder(td, final_h, final_p)\n\n    # Get mask\n    mask = torch.ones_like(td[\"action_record\"][:, 0], device=td.device).bool()\n    if \"action\" in td.keys():\n        mask = mask.scatter(1, td[\"action\"][:, :1], 0)\n\n    # Get action and log-likelihood\n    logprob_removal, action_removal = decode_strategy.step(\n        logits,\n        mask,\n        action=actions[:, 0] if actions is not None else None,\n    )\n    action_removal = action_removal.unsqueeze(-1)\n    if phase == \"train\":\n        selected_log_ll_action1 = logprob_removal.gather(1, action_removal)\n\n    ## action 2\n    td.set(\"action\", action_removal)\n\n    # Perform the decoding\n    batch_size, seq_length = td[\"rec_current\"].size()\n    logits = self.reinsertion_decoder(td, final_h, final_p).view(batch_size, -1)\n\n    # Get mask\n    mask = env.get_mask(action_removal + 1, td).view(batch_size, -1)\n    # Get action and log-likelihood\n    logprob_reinsertion, action_reinsertion = decode_strategy.step(\n        logits,\n        mask,\n        action=(\n            actions[:, 1] * seq_length + actions[:, 2]\n            if actions is not None\n            else None\n        ),\n    )\n    action_reinsertion = action_reinsertion.unsqueeze(-1)\n    if phase == \"train\":\n        selected_log_ll_action2 = logprob_reinsertion.gather(1, action_reinsertion)\n\n    ## return\n    N2S_action = torch.cat(\n        (\n       
     action_removal.view(batch_size, -1),\n            action_reinsertion // seq_length,\n            action_reinsertion % seq_length,\n        ),\n        -1,\n    )\n    if phase == \"train\":\n        log_likelihood = selected_log_ll_action1 + selected_log_ll_action2\n    else:\n        log_likelihood = torch.zeros(batch_size, device=td.device)\n\n    outdict = {\"log_likelihood\": log_likelihood, \"cost_bsf\": td[\"cost_bsf\"]}\n    td.set(\"action\", N2S_action)\n\n    if return_embeds:\n        outdict[\"embeds\"] = h_wave.detach()\n\n    if return_actions:\n        outdict[\"actions\"] = N2S_action\n\n    return outdict\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.n2s.model.N2S","title":"N2S","text":"
N2S(\n    env: RL4COEnvBase,\n    policy: Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs\n)\n

Bases: n_step_PPO

N2S Model based on n_step Proximal Policy Optimization (PPO) with an N2S model policy. We default to the N2S model policy and the improvement Critic Network.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (Module, default: None ) \u2013

    Policy to use for the algorithm

  • critic (CriticNetwork, default: None ) \u2013

    Critic to use for the algorithm

  • policy_kwargs (dict, default: {} ) \u2013

    Keyword arguments for policy

  • critic_kwargs (dict, default: {} ) \u2013

    Keyword arguments for critic

Source code in rl4co/models/zoo/n2s/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs,\n):\n    if policy is None:\n        policy = N2SPolicy(env_name=env.name, **policy_kwargs)\n\n    if critic is None:\n        embed_dim = (\n            policy_kwargs[\"embed_dim\"] if \"embed_dim\" in policy_kwargs else 128\n        )  # the critic's embed_dim must be as policy's\n\n        encoder = MultiHeadAttentionLayer(\n            embed_dim,\n            critic_kwargs[\"num_heads\"] if \"num_heads\" in critic_kwargs else 4,\n            critic_kwargs[\"feedforward_hidden\"]\n            if \"feedforward_hidden\" in critic_kwargs\n            else 128,\n            critic_kwargs[\"normalization\"]\n            if \"normalization\" in critic_kwargs\n            else \"layer\",\n            bias=False,\n        )\n        value_head = CriticDecoder(embed_dim)\n\n        critic = CriticNetwork(\n            encoder=encoder,\n            value_head=value_head,\n            customized=True,\n        )\n\n    super().__init__(env, policy, critic, **kwargs)\n
"},{"location":"docs/content/api/zoo/improvement/#neuopt","title":"NeuOpt","text":"

Classes:

  • RDSDecoder \u2013

    RDS Decoder for flexible k-opt based on Ma et al. (2023)

Classes:

  • CustomizeTSPInitEmbedding \u2013

    Initial embedding for the Traveling Salesman Problems (TSP).

  • NeuOptPolicy \u2013

    NeuOpt Policy based on Ma et al. (2023)

Classes:

  • NeuOpt \u2013

    NeuOpt Model based on n_step Proximal Policy Optimization (PPO) with a NeuOpt model policy.

"},{"location":"docs/content/api/zoo/improvement/#models.zoo.neuopt.decoder.RDSDecoder","title":"RDSDecoder","text":"
RDSDecoder(embed_dim: int = 128)\n

Bases: ImprovementDecoder

RDS Decoder for flexible k-opt based on Ma et al. (2023). Given the environment state and the node embeddings (positional embeddings are discarded), compute the logits for selecting a k-opt exchange on basis moves (S-move, I-move, E-move) from the current solution.

Parameters:

  • embed_dim (int, default: 128 ) \u2013

    Embedding dimension

  • num_heads \u2013

    Number of attention heads (note: the constructor signature shown here accepts only embed_dim; num_heads is not a parameter)

Source code in rl4co/models/zoo/neuopt/decoder.py
def __init__(\n    self,\n    embed_dim: int = 128,\n):\n    super().__init__()\n    self.embed_dim = embed_dim\n\n    self.linear_K1 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.linear_K2 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.linear_K3 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.linear_K4 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n\n    self.linear_Q1 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.linear_Q2 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.linear_Q3 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n    self.linear_Q4 = nn.Linear(self.embed_dim, self.embed_dim, bias=False)\n\n    self.linear_V1 = nn.Parameter(torch.Tensor(self.embed_dim))\n    self.linear_V2 = nn.Parameter(torch.Tensor(self.embed_dim))\n\n    self.rnn1 = nn.GRUCell(self.embed_dim, self.embed_dim)\n    self.rnn2 = nn.GRUCell(self.embed_dim, self.embed_dim)\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.neuopt.policy.CustomizeTSPInitEmbedding","title":"CustomizeTSPInitEmbedding","text":"
CustomizeTSPInitEmbedding(embed_dim, linear_bias=True)\n

Bases: Module

Initial embedding for the Traveling Salesman Problems (TSP). Embed the following node features to the embedding space:

- locs: x, y coordinates of the cities\n
Source code in rl4co/models/zoo/neuopt/policy.py
def __init__(self, embed_dim, linear_bias=True):\n    super(CustomizeTSPInitEmbedding, self).__init__()\n    node_dim = 2  # x, y\n    self.init_embed = nn.Sequential(\n        nn.Linear(node_dim, embed_dim // 2, linear_bias),\n        nn.ReLU(inplace=True),\n        nn.Linear(embed_dim // 2, embed_dim, linear_bias),\n    )\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.neuopt.policy.NeuOptPolicy","title":"NeuOptPolicy","text":"
NeuOptPolicy(\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 4,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    env_name: str = \"tsp_kopt\",\n    pos_type: str = \"CPE\",\n    init_embedding: Module = None,\n    pos_embedding: Module = None,\n    temperature: float = 1.0,\n    tanh_clipping: float = 6.0,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n)\n

Bases: ImprovementPolicy

NeuOpt Policy based on Ma et al. (2023). This model first encodes the input graph and current solution using an N2S encoder (:class:N2SEncoder) and then decodes the k-opt action using the RDS decoder (:class:RDSDecoder).

Parameters:

  • embed_dim (int, default: 128 ) \u2013

    Dimension of the node embeddings

  • num_encoder_layers (int, default: 3 ) \u2013

    Number of layers in the encoder

  • num_heads (int, default: 4 ) \u2013

    Number of heads in the attention layers

  • normalization (str, default: 'layer' ) \u2013

    Normalization type in the attention layers

  • feedforward_hidden (int, default: 128 ) \u2013

    Dimension of the hidden layer in the feedforward network

  • env_name (str, default: 'tsp_kopt' ) \u2013

    Name of the environment used to initialize embeddings

  • pos_type (str, default: 'CPE' ) \u2013

    Name of the used positional encoding method (CPE or APE)

  • init_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the embeddings

  • pos_embedding (Module, default: None ) \u2013

    Module to use for the initialization of the positional embeddings

  • temperature (float, default: 1.0 ) \u2013

    Temperature for the softmax

  • tanh_clipping (float, default: 6.0 ) \u2013

    Tanh clipping value (see Bello et al., 2016)

  • train_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during training

  • val_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during validation

  • test_decode_type (str, default: 'sampling' ) \u2013

    Type of decoding to use during testing

Methods:

  • forward \u2013

    Forward pass of the policy.

Source code in rl4co/models/zoo/neuopt/policy.py
def __init__(\n    self,\n    embed_dim: int = 128,\n    num_encoder_layers: int = 3,\n    num_heads: int = 4,\n    normalization: str = \"layer\",\n    feedforward_hidden: int = 128,\n    env_name: str = \"tsp_kopt\",\n    pos_type: str = \"CPE\",\n    init_embedding: nn.Module = None,\n    pos_embedding: nn.Module = None,\n    temperature: float = 1.0,\n    tanh_clipping: float = 6.0,\n    train_decode_type: str = \"sampling\",\n    val_decode_type: str = \"sampling\",\n    test_decode_type: str = \"sampling\",\n):\n    super(NeuOptPolicy, self).__init__()\n\n    self.env_name = env_name\n    self.embed_dim = embed_dim\n\n    # Decoding strategies\n    self.temperature = temperature\n    self.tanh_clipping = tanh_clipping\n    self.train_decode_type = train_decode_type\n    self.val_decode_type = val_decode_type\n    self.test_decode_type = test_decode_type\n\n    # Encoder and decoder\n    if init_embedding is None:\n        init_embedding = CustomizeTSPInitEmbedding(self.embed_dim)\n\n    self.encoder = N2SEncoder(\n        embed_dim=embed_dim,\n        init_embedding=init_embedding,\n        pos_embedding=pos_embedding,\n        env_name=env_name,\n        pos_type=pos_type,\n        num_heads=num_heads,\n        num_layers=num_encoder_layers,\n        normalization=normalization,\n        feedforward_hidden=feedforward_hidden,\n    )\n\n    self.decoder = RDSDecoder(embed_dim=embed_dim)\n\n    self.init_hidden_W = nn.Linear(self.embed_dim, self.embed_dim)\n    self.init_query_learnable = nn.Parameter(torch.Tensor(self.embed_dim))\n\n    self.init_parameters()\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.neuopt.policy.NeuOptPolicy.forward","title":"forward","text":"
forward(\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_embeds: bool = False,\n    only_return_embed: bool = False,\n    actions=None,\n    **decoding_kwargs\n) -> dict\n

Forward pass of the policy.

Parameters:

  • td (TensorDict) \u2013

    TensorDict containing the environment state

  • env (Union[str, RL4COEnvBase], default: None ) \u2013

    Environment to use for decoding. If None, the environment is instantiated from env_name. Note that it is more efficient to pass an already instantiated environment each time for fine-grained control

  • phase (str, default: 'train' ) \u2013

    Phase of the algorithm (train, val, test)

  • return_actions (bool, default: True ) \u2013

    Whether to return the actions

  • actions \u2013

    Actions to use for evaluating the policy. If passed, use these actions instead of sampling from the policy to calculate log likelihood

  • decoding_kwargs \u2013

    Keyword arguments for the decoding strategy. See :class:rl4co.utils.decoding.DecodingStrategy for more information.

Returns:

  • out ( dict ) \u2013

    Dictionary containing the log likelihood (log_likelihood) and the cost_bsf entry of the TensorDict, and optionally the embeddings (embeds) and the actions

Source code in rl4co/models/zoo/neuopt/policy.py
def forward(\n    self,\n    td: TensorDict,\n    env: Union[str, RL4COEnvBase] = None,\n    phase: str = \"train\",\n    return_actions: bool = True,\n    return_embeds: bool = False,\n    only_return_embed: bool = False,\n    actions=None,\n    **decoding_kwargs,\n) -> dict:\n    \"\"\"Forward pass of the policy.\n\n    Args:\n        td: TensorDict containing the environment state\n        env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that\n            it is more efficient to pass an already instantiated environment each time for fine-grained control\n        phase: Phase of the algorithm (train, val, test)\n        return_actions: Whether to return the actions\n        actions: Actions to use for evaluating the policy.\n            If passed, use these actions instead of sampling from the policy to calculate log likelihood\n        decoding_kwargs: Keyword arguments for the decoding strategy. See :class:`rl4co.utils.decoding.DecodingStrategy` for more information.\n\n    Returns:\n        out: Dictionary containing the reward, log likelihood, and optionally the actions and entropy\n    \"\"\"\n\n    # Encoder: get encoder output and initial embeddings from initial state\n    nfe, _ = self.encoder(td)\n    if only_return_embed:\n        return {\"embeds\": nfe.detach()}\n\n    # Instantiate environment if needed\n    if isinstance(env, str) or env is None:\n        env_name = self.env_name if env is None else env\n        log.info(f\"Instantiated environment not provided; instantiating {env_name}\")\n        env = get_env(env_name)\n    assert not env.two_opt_mode, \"NeuOpt only support k-opt with k > 2\"\n\n    # Get decode type depending on phase and whether actions are passed for evaluation\n    decode_type = decoding_kwargs.pop(\"decode_type\", None)\n    if actions is not None:\n        decode_type = \"evaluate\"\n    elif decode_type is None:\n        decode_type = getattr(self, 
f\"{phase}_decode_type\")\n\n    # Setup decoding strategy\n    # we pop arguments that are not part of the decoding strategy\n    decode_strategy: DecodingStrategy = get_decoding_strategy(\n        decode_type,\n        temperature=decoding_kwargs.pop(\"temperature\", self.temperature),\n        tanh_clipping=decoding_kwargs.pop(\"tanh_clipping\", self.tanh_clipping),\n        mask_logits=True,\n        improvement_method_mode=True,\n        **decoding_kwargs,\n    )\n\n    # Perform the decoding\n    bs, gs, _, ll, action_sampled, rec, visited_time = (\n        *nfe.size(),\n        0.0,\n        None,\n        td[\"rec_current\"],\n        td[\"visited_time\"],\n    )\n    action_index = torch.zeros(bs, env.k_max, dtype=torch.long).to(rec.device)\n    k_action_left = torch.zeros(bs, env.k_max + 1, dtype=torch.long).to(rec.device)\n    k_action_right = torch.zeros(bs, env.k_max, dtype=torch.long).to(rec.device)\n    next_of_last_action = (\n        torch.zeros_like(rec[:, :1], dtype=torch.long).to(rec.device) - 1\n    )\n    mask = torch.zeros_like(rec, dtype=torch.bool).to(rec.device)\n    stopped = torch.ones(bs, dtype=torch.bool).to(rec.device)\n    zeros = torch.zeros((bs, 1), device=td.device)\n\n    # init queries\n    h_mean = nfe.mean(1)\n    init_query = self.init_query_learnable.repeat(bs, 1)\n    input_q1 = input_q2 = init_query.clone()\n    init_hidden = self.init_hidden_W(h_mean)\n    q1 = q2 = init_hidden.clone()\n\n    for i in range(env.k_max):\n        # Pass RDS decoder\n        logits, q1, q2 = self.decoder(nfe, q1, q2, input_q1, input_q2)\n\n        # Calc probs\n        if i == 0 and \"action\" in td.keys():\n            mask = mask.scatter(1, td[\"action\"][:, :1], 1)\n\n        logprob, action_sampled = decode_strategy.step(\n            logits,\n            ~mask.clone(),\n            action=actions[:, i : i + 1].squeeze() if actions is not None else None,\n        )\n        action_sampled = action_sampled.unsqueeze(-1)\n        if i > 
0:\n            action_sampled = torch.where(\n                stopped.unsqueeze(-1), action_index[:, :1], action_sampled\n            )\n        if phase == \"train\":\n            loss_now = logprob.gather(1, action_sampled)\n        else:\n            loss_now = zeros.clone()\n\n        # Record log_likelihood and Entropy\n        if i > 0:\n            ll = ll + torch.where(stopped.unsqueeze(-1), zeros * 0, loss_now)\n        else:\n            ll = ll + loss_now\n\n        # Store and Process actions\n        next_of_new_action = rec.gather(1, action_sampled)\n        action_index[:, i] = action_sampled.squeeze().clone()\n        k_action_left[stopped, i] = action_sampled[stopped].squeeze().clone()\n        k_action_right[~stopped, i - 1] = action_sampled[~stopped].squeeze().clone()\n        k_action_left[:, i + 1] = next_of_new_action.squeeze().clone()\n\n        # Prepare next RNN input\n        input_q1 = nfe.gather(\n            1, action_sampled.view(bs, 1, 1).expand(bs, 1, self.embed_dim)\n        ).squeeze(1)\n        input_q2 = torch.where(\n            stopped.view(bs, 1).expand(bs, self.embed_dim),\n            input_q1.clone(),\n            nfe.gather(\n                1,\n                (next_of_last_action % gs)\n                .view(bs, 1, 1)\n                .expand(bs, 1, self.embed_dim),\n            ).squeeze(1),\n        )\n\n        # Process if k-opt close\n        # assert (input_q1[stopped] == input_q2[stopped]).all()\n        if i > 0:\n            stopped = stopped | (action_sampled == next_of_last_action).squeeze()\n        else:\n            stopped = (action_sampled == next_of_last_action).squeeze()\n        # assert (input_q1[stopped] == input_q2[stopped]).all()\n\n        k_action_left[stopped, i] = k_action_left[stopped, i - 1]\n        k_action_right[stopped, i] = k_action_right[stopped, i - 1]\n\n        # Calc next basic masks\n        if i == 0:\n            visited_time_tag = (\n                visited_time - 
visited_time.gather(1, action_sampled)\n            ) % gs\n        mask &= False\n        mask[(visited_time_tag <= visited_time_tag.gather(1, action_sampled))] = True\n        if i == 0:\n            mask[visited_time_tag > (gs - 2)] = True\n        mask[stopped, action_sampled[stopped].squeeze()] = (\n            False  # allow next k-opt starts immediately\n        )\n        # if True:#i == env.k_max - 2: # allow special case: close k-opt at the first selected node\n        index_allow_first_node = (~stopped) & (\n            next_of_new_action.squeeze() == action_index[:, 0]\n        )\n        mask[index_allow_first_node, action_index[index_allow_first_node, 0]] = False\n\n        # Move to next\n        next_of_last_action = next_of_new_action\n        next_of_last_action[stopped] = -1\n\n    # Form final action\n    k_action_right[~stopped, -1] = k_action_left[~stopped, -1].clone()\n    k_action_left = k_action_left[:, : env.k_max]\n    action_all = torch.cat((action_index, k_action_left, k_action_right), -1)\n\n    outdict = {\"log_likelihood\": ll, \"cost_bsf\": td[\"cost_bsf\"]}\n    td.set(\"action\", action_all)\n\n    if return_embeds:\n        outdict[\"embeds\"] = nfe.detach()\n\n    if return_actions:\n        outdict[\"actions\"] = action_all\n\n    return outdict\n
"},{"location":"docs/content/api/zoo/improvement/#models.zoo.neuopt.model.NeuOpt","title":"NeuOpt","text":"
NeuOpt(\n    env: RL4COEnvBase,\n    policy: Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs\n)\n

Bases: n_step_PPO

NeuOpt Model based on n_step Proximal Policy Optimization (PPO) with a NeuOpt model policy. We default to the NeuOpt model policy and the improvement Critic Network.

Parameters:

  • env (RL4COEnvBase) \u2013

    Environment to use for the algorithm

  • policy (Module, default: None ) \u2013

    Policy to use for the algorithm

  • critic (CriticNetwork, default: None ) \u2013

    Critic to use for the algorithm

  • policy_kwargs (dict, default: {} ) \u2013

    Keyword arguments for policy

  • critic_kwargs (dict, default: {} ) \u2013

    Keyword arguments for critic

Source code in rl4co/models/zoo/neuopt/model.py
def __init__(\n    self,\n    env: RL4COEnvBase,\n    policy: nn.Module = None,\n    critic: CriticNetwork = None,\n    policy_kwargs: dict = {},\n    critic_kwargs: dict = {},\n    **kwargs,\n):\n    if policy is None:\n        policy = NeuOptPolicy(env_name=env.name, **policy_kwargs)\n\n    if critic is None:\n        embed_dim = (\n            policy_kwargs[\"embed_dim\"] if \"embed_dim\" in policy_kwargs else 128\n        )  # the critic's embed_dim must be as policy's\n\n        encoder = MultiHeadAttentionLayer(\n            embed_dim,\n            critic_kwargs[\"num_heads\"] if \"num_heads\" in critic_kwargs else 4,\n            critic_kwargs[\"feedforward_hidden\"]\n            if \"feedforward_hidden\" in critic_kwargs\n            else 128,\n            critic_kwargs[\"normalization\"]\n            if \"normalization\" in critic_kwargs\n            else \"layer\",\n            bias=False,\n        )\n        value_head = CriticDecoder(embed_dim, dropout_rate=0.001)\n\n        critic = CriticNetwork(\n            encoder=encoder,\n            value_head=value_head,\n            customized=True,\n        )\n\n    super().__init__(env, policy, critic, **kwargs)\n
"},{"location":"docs/content/api/zoo/transductive/","title":"Transductive Methods","text":""},{"location":"docs/content/api/zoo/transductive/#transductive-methods","title":"Transductive Methods","text":"

These methods update policy parameters during online testing to improve the solutions of a specific instance.

"},{"location":"docs/content/api/zoo/transductive/#active-search-as","title":"Active Search (AS)","text":"

Classes:

  • ActiveSearch \u2013

    Active Search for Neural Combinatorial Optimization from Bello et al. (2016).

"},{"location":"docs/content/api/zoo/transductive/#models.zoo.active_search.search.ActiveSearch","title":"ActiveSearch","text":"
ActiveSearch(\n    env,\n    policy,\n    dataset: Union[Dataset, str],\n    batch_size: int = 1,\n    max_iters: int = 200,\n    augment_size: int = 8,\n    augment_dihedral: bool = True,\n    num_parallel_runs: int = 1,\n    max_runtime: int = 86400,\n    save_path: str = None,\n    optimizer: Union[str, Optimizer, partial] = \"Adam\",\n    optimizer_kwargs: dict = {\n        \"lr\": 0.00026,\n        \"weight_decay\": 1e-06,\n    },\n    **kwargs\n)\n

Bases: TransductiveModel

Active Search for Neural Combinatorial Optimization from Bello et al. (2016). Fine-tunes the whole policy network (encoder + decoder) on a batch of instances. Reference: https://arxiv.org/abs/1611.09940

Parameters:

  • env \u2013

    RL4CO environment to be solved

  • policy \u2013

    policy network

  • dataset (Union[Dataset, str]) \u2013

    dataset to be used for training

  • batch_size (int, default: 1 ) \u2013

    batch size for training

  • max_iters (int, default: 200 ) \u2013

    maximum number of iterations

  • augment_size (int, default: 8 ) \u2013

    number of augmentations per state

  • augment_dihedral (bool, default: True ) \u2013

    whether to augment with dihedral rotations

  • num_parallel_runs (int, default: 1 ) \u2013

    number of parallel runs

  • max_runtime (int, default: 86400 ) \u2013

    maximum runtime in seconds

  • save_path (str, default: None ) \u2013

    path to save solution checkpoints

  • optimizer (Union[str, Optimizer, partial], default: 'Adam' ) \u2013

    optimizer to use for training

  • optimizer_kwargs (dict, default: {'lr': 0.00026, 'weight_decay': 1e-06} ) \u2013

    keyword arguments for optimizer

  • **kwargs \u2013

    additional keyword arguments

Methods:

  • setup \u2013

    Setup base class and instantiate:

  • on_train_batch_start \u2013

    Called before training (i.e. search) for a new batch begins.

  • training_step \u2013

    Main search loop. We use the training step to effectively adapt to a batch of instances.

  • on_train_batch_end \u2013

    We store the best solution and reward found.

  • on_train_epoch_end \u2013

    Called when the training ends.

Source code in rl4co/models/zoo/active_search/search.py
def __init__(\n    self,\n    env,\n    policy,\n    dataset: Union[Dataset, str],\n    batch_size: int = 1,\n    max_iters: int = 200,\n    augment_size: int = 8,\n    augment_dihedral: bool = True,\n    num_parallel_runs: int = 1,\n    max_runtime: int = 86_400,\n    save_path: str = None,\n    optimizer: Union[str, torch.optim.Optimizer, partial] = \"Adam\",\n    optimizer_kwargs: dict = {\"lr\": 2.6e-4, \"weight_decay\": 1e-6},\n    **kwargs,\n):\n    self.save_hyperparameters(logger=False)\n\n    assert batch_size == 1, \"Batch size must be 1 for active search\"\n\n    super(ActiveSearch, self).__init__(\n        env,\n        policy=policy,\n        dataset=dataset,\n        batch_size=batch_size,\n        max_iters=max_iters,\n        max_runtime=max_runtime,\n        save_path=save_path,\n        optimizer=optimizer,\n        optimizer_kwargs=optimizer_kwargs,\n        **kwargs,\n    )\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.active_search.search.ActiveSearch.setup","title":"setup","text":"
setup(stage='fit')\n

Setup base class and instantiate:

  • augmentation
  • instance solutions and rewards
  • original policy state dict
Source code in rl4co/models/zoo/active_search/search.py
def setup(self, stage=\"fit\"):\n    \"\"\"Setup base class and instantiate:\n    - augmentation\n    - instance solutions and rewards\n    - original policy state dict\n    \"\"\"\n    log.info(\"Setting up active search...\")\n    super(ActiveSearch, self).setup(stage)\n\n    # Instantiate augmentation\n    self.augmentation = StateAugmentation(\n        num_augment=self.hparams.augment_size,\n        augment_fn=\"dihedral8\" if self.hparams.augment_dihedral else \"symmetric\",\n    )\n\n    # Store original policy state dict\n    self.original_policy_state = self.policy.state_dict()\n\n    # Get dataset size and problem size\n    dataset_size = len(self.dataset)\n    _batch = next(iter(self.train_dataloader()))\n    self.problem_size = self.env.reset(_batch)[\"action_mask\"].shape[-1]\n    self.instance_solutions = torch.zeros(\n        dataset_size, self.problem_size * 2, dtype=int\n    )\n    self.instance_rewards = torch.zeros(dataset_size)\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.active_search.search.ActiveSearch.on_train_batch_start","title":"on_train_batch_start","text":"
on_train_batch_start(batch: Any, batch_idx: int)\n

Called before training (i.e. search) for a new batch begins. We re-load the original policy state dict and configure the optimizer.

Source code in rl4co/models/zoo/active_search/search.py
def on_train_batch_start(self, batch: Any, batch_idx: int):\n    \"\"\"Called before training (i.e. search) for a new batch begins.\n    We re-load the original policy state dict and configure the optimizer.\n    \"\"\"\n    self.policy.load_state_dict(self.original_policy_state)\n    self.configure_optimizers(self.policy.parameters())\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.active_search.search.ActiveSearch.training_step","title":"training_step","text":"
training_step(batch, batch_idx)\n

Main search loop. We use the training step to effectively adapt to a batch of instances.

Source code in rl4co/models/zoo/active_search/search.py
def training_step(self, batch, batch_idx):\n    \"\"\"Main search loop. We use the training step to effectively adapt to a `batch` of instances.\"\"\"\n    # Augment state\n    batch_size = batch.shape[0]\n    td_init = self.env.reset(batch)\n    n_aug, n_start, n_runs = (\n        self.augmentation.num_augment,\n        self.env.get_num_starts(td_init),\n        self.hparams.num_parallel_runs,\n    )\n    td_init = self.augmentation(td_init)\n    td_init = batchify(td_init, n_runs)\n\n    # Solution and reward buffer\n    max_reward = torch.full((batch_size,), -float(\"inf\"), device=batch.device)\n    best_solutions = torch.zeros(\n        batch_size, self.problem_size * 2, device=batch.device, dtype=int\n    )\n\n    # Init search\n    t_start = time.time()\n    for i in range(self.hparams.max_iters):\n        # Evaluate policy with sampling multistarts (as in POMO)\n        out = self.policy(\n            td_init.clone(),\n            env=self.env,\n            decode_type=\"multistart_sampling\",\n            num_starts=n_start,\n        )\n\n        if i == 0:\n            log.info(f\"Initial reward: {out['reward'].max():.2f}\")\n\n        # Update best solution and reward found\n        max_reward_iter = out[\"reward\"].max()\n        if max_reward_iter > max_reward:\n            max_reward_idx = out[\"reward\"].argmax()\n            best_solution_iter = out[\"actions\"][max_reward_idx]\n            max_reward = max_reward_iter\n            best_solutions[0, : best_solution_iter.shape[0]] = best_solution_iter\n\n        # Compute REINFORCE loss with shared baseline\n        reward = unbatchify(out[\"reward\"], (n_runs, n_aug, n_start))\n        ll = unbatchify(out[\"log_likelihood\"], (n_runs, n_aug, n_start))\n        advantage = reward - reward.mean(dim=-1, keepdim=True)\n        loss = -(advantage * ll).mean()\n\n        # Backpropagate loss\n        # perform manual optimization following the Lightning routine\n        # 
https://lightning.ai/docs/pytorch/stable/common/optimization.html\n        opt = self.optimizers()\n        opt.zero_grad()\n        self.manual_backward(loss)\n\n        self.log_dict(\n            {\n                \"loss\": loss,\n                \"max_reward\": max_reward,\n                \"step\": i,\n                \"time\": time.time() - t_start,\n            },\n            on_step=self.log_on_step,\n        )\n\n        # Stop if max runtime is exceeded\n        if time.time() - t_start > self.hparams.max_runtime:\n            break\n\n    return {\"max_reward\": max_reward, \"best_solutions\": best_solutions}\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.active_search.search.ActiveSearch.on_train_batch_end","title":"on_train_batch_end","text":"
on_train_batch_end(\n    outputs: STEP_OUTPUT, batch: Any, batch_idx: int\n) -> None\n

We store the best solution and reward found.

Source code in rl4co/models/zoo/active_search/search.py
def on_train_batch_end(\n    self, outputs: STEP_OUTPUT, batch: Any, batch_idx: int\n) -> None:\n    \"\"\"We store the best solution and reward found.\"\"\"\n    max_rewards, best_solutions = outputs[\"max_reward\"], outputs[\"best_solutions\"]\n    self.instance_rewards[batch_idx] = max_rewards\n    self.instance_solutions[batch_idx, :] = best_solutions.squeeze(\n        0\n    )  # only one instance\n    log.info(f\"Best reward: {max_rewards.mean():.2f}\")\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.active_search.search.ActiveSearch.on_train_epoch_end","title":"on_train_epoch_end","text":"
on_train_epoch_end() -> None\n

Called when the training ends. If the epoch ends, it means we have finished searching over the instances, thus the trainer should stop.

Source code in rl4co/models/zoo/active_search/search.py
def on_train_epoch_end(self) -> None:\n    \"\"\"Called when the training ends.\n    If the epoch ends, it means we have finished searching over the\n    instances, thus the trainer should stop.\n    \"\"\"\n    save_path = self.hparams.save_path\n    if save_path is not None:\n        log.info(f\"Saving solutions and rewards to {save_path}...\")\n        torch.save(\n            {\"solutions\": self.instance_solutions, \"rewards\": self.instance_rewards},\n            save_path,\n        )\n\n    # https://github.com/Lightning-AI/lightning/issues/1406\n    self.trainer.should_stop = True\n
"},{"location":"docs/content/api/zoo/transductive/#efficent-active-search-eas","title":"Efficent Active Search (EAS)","text":"

Classes:

  • EAS \u2013

    Efficient Active Search for Neural Combinatorial Optimization from Hottung et al. (2022).

  • EASEmb \u2013

    EAS with embedding adaptation

  • EASLay \u2013

    EAS with layer adaptation

Functions:

  • forward_pointer_attn_eas_lay \u2013

    Add layer to the forward pass of logit attention, i.e.

  • forward_eas \u2013

    Forward pass of the decoder

Classes:

  • EASLayerNet \u2013

    Instantiate weights and biases for the added layer.

"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EAS","title":"EAS","text":"
EAS(\n    env,\n    policy,\n    dataset: Union[Dataset, str],\n    use_eas_embedding: bool = True,\n    use_eas_layer: bool = False,\n    eas_emb_cache_keys: List[str] = [\"logit_key\"],\n    eas_lambda: float = 0.013,\n    batch_size: int = 2,\n    max_iters: int = 200,\n    augment_size: int = 8,\n    augment_dihedral: bool = True,\n    num_parallel_runs: int = 1,\n    baseline: str = \"multistart\",\n    max_runtime: int = 86400,\n    save_path: str = None,\n    optimizer: Union[str, Optimizer, partial] = \"Adam\",\n    optimizer_kwargs: dict = {\n        \"lr\": 0.0041,\n        \"weight_decay\": 1e-06,\n    },\n    verbose: bool = True,\n    **kwargs\n)\n

Bases: TransductiveModel

Efficient Active Search for Neural Combinatorial Optimization from Hottung et al. (2022). Fine-tunes a subset of parameters (such as node embeddings or newly added layers) thus avoiding expensive re-encoding of the problem. Reference: https://openreview.net/pdf?id=nO5caZwFwYu

Parameters:

  • env \u2013

    RL4CO environment to be solved

  • policy \u2013

    policy network

  • dataset (Union[Dataset, str]) \u2013

    dataset to be used for training

  • use_eas_embedding (bool, default: True ) \u2013

    whether to use EAS embedding (EASEmb)

  • use_eas_layer (bool, default: False ) \u2013

    whether to use EAS layer (EASLay)

  • eas_emb_cache_keys (List[str], default: ['logit_key'] ) \u2013

    keys to cache in the embedding

  • eas_lambda (float, default: 0.013 ) \u2013

    lambda parameter for IL loss

  • batch_size (int, default: 2 ) \u2013

    batch size for training

  • max_iters (int, default: 200 ) \u2013

    maximum number of iterations

  • augment_size (int, default: 8 ) \u2013

    number of augmentations per state

  • augment_dihedral (bool, default: True ) \u2013

    whether to augment with dihedral rotations

  • num_parallel_runs (int, default: 1 ) \u2013

    number of parallel runs

  • baseline (str, default: 'multistart' ) \u2013

    REINFORCE baseline type (multistart, symmetric, full)

  • max_runtime (int, default: 86400 ) \u2013

    maximum runtime in seconds

  • save_path (str, default: None ) \u2013

    path to save solution checkpoints

  • optimizer (Union[str, Optimizer, partial], default: 'Adam' ) \u2013

    optimizer to use for training

  • optimizer_kwargs (dict, default: {'lr': 0.0041, 'weight_decay': 1e-06} ) \u2013

    keyword arguments for optimizer

  • verbose (bool, default: True ) \u2013

    whether to print progress for each iteration

Methods:

  • setup \u2013

    Setup base class and instantiate:

  • on_train_batch_start \u2013

    Called before training (i.e. search) for a new batch begins.

  • training_step \u2013

    Main search loop. We use the training step to effectively adapt to a batch of instances.

  • on_train_batch_end \u2013

    We store the best solution and reward found.

  • on_train_epoch_end \u2013

    Called when the training ends.

Source code in rl4co/models/zoo/eas/search.py
def __init__(\n    self,\n    env,\n    policy,\n    dataset: Union[Dataset, str],\n    use_eas_embedding: bool = True,\n    use_eas_layer: bool = False,\n    eas_emb_cache_keys: List[str] = [\"logit_key\"],\n    eas_lambda: float = 0.013,\n    batch_size: int = 2,\n    max_iters: int = 200,\n    augment_size: int = 8,\n    augment_dihedral: bool = True,\n    num_parallel_runs: int = 1,\n    baseline: str = \"multistart\",\n    max_runtime: int = 86_400,\n    save_path: str = None,\n    optimizer: Union[str, torch.optim.Optimizer, partial] = \"Adam\",\n    optimizer_kwargs: dict = {\"lr\": 0.0041, \"weight_decay\": 1e-6},\n    verbose: bool = True,\n    **kwargs,\n):\n    self.save_hyperparameters(logger=False)\n\n    assert (\n        self.hparams.use_eas_embedding or self.hparams.use_eas_layer\n    ), \"At least one of `use_eas_embedding` or `use_eas_layer` must be True.\"\n\n    super(EAS, self).__init__(\n        env,\n        policy=policy,\n        dataset=dataset,\n        batch_size=batch_size,\n        max_iters=max_iters,\n        max_runtime=max_runtime,\n        save_path=save_path,\n        optimizer=optimizer,\n        optimizer_kwargs=optimizer_kwargs,\n        **kwargs,\n    )\n\n    assert self.hparams.baseline in [\n        \"multistart\",\n        \"symmetric\",\n        \"full\",\n    ], f\"Baseline {self.hparams.baseline} not supported.\"\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EAS.setup","title":"setup","text":"
setup(stage='fit')\n

Setup base class and instantiate:

  • augmentation
  • instance solutions and rewards
  • original policy state dict
Source code in rl4co/models/zoo/eas/search.py
def setup(self, stage=\"fit\"):\n    \"\"\"Setup base class and instantiate:\n    - augmentation\n    - instance solutions and rewards\n    - original policy state dict\n    \"\"\"\n    log.info(\n        f\"Setting up Efficient Active Search (EAS) with: \\n\"\n        f\"- EAS Embedding: {self.hparams.use_eas_embedding} \\n\"\n        f\"- EAS Layer: {self.hparams.use_eas_layer} \\n\"\n    )\n    super(EAS, self).setup(stage)\n\n    # Instantiate augmentation\n    self.augmentation = StateAugmentation(\n        num_augment=self.hparams.augment_size,\n        augment_fn=\"dihedral8\" if self.hparams.augment_dihedral else \"symmetric\",\n    )\n\n    # Store original policy state dict\n    self.original_policy_state = self.policy.state_dict()\n\n    # Get dataset size and problem size\n    len(self.dataset)\n    _batch = next(iter(self.train_dataloader()))\n    self.problem_size = self.env.reset(_batch)[\"action_mask\"].shape[-1]\n    self.instance_solutions = []\n    self.instance_rewards = []\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EAS.on_train_batch_start","title":"on_train_batch_start","text":"
on_train_batch_start(batch: Any, batch_idx: int)\n

Called before training (i.e. search) for a new batch begins. We re-load the original policy state dict and configure all parameters not to require gradients. We do the rest in the training step.

Source code in rl4co/models/zoo/eas/search.py
def on_train_batch_start(self, batch: Any, batch_idx: int):\n    \"\"\"Called before training (i.e. search) for a new batch begins.\n    We re-load the original policy state dict and configure all parameters not to require gradients.\n    We do the rest in the training step.\n    \"\"\"\n    self.policy.load_state_dict(self.original_policy_state)\n\n    # Set all policy parameters to not require gradients\n    for param in self.policy.parameters():\n        param.requires_grad = False\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EAS.training_step","title":"training_step","text":"
training_step(batch, batch_idx)\n

Main search loop. We use the training step to effectively adapt to a batch of instances.

Source code in rl4co/models/zoo/eas/search.py
def training_step(self, batch, batch_idx):\n    \"\"\"Main search loop. We use the training step to effectively adapt to a `batch` of instances.\"\"\"\n    # Augment state\n    batch_size = batch.shape[0]\n    td_init = self.env.reset(batch)\n    n_aug, n_start, n_runs = (\n        self.augmentation.num_augment,\n        self.env.get_num_starts(td_init),\n        self.hparams.num_parallel_runs,\n    )\n    td_init = self.augmentation(td_init)\n    td_init = batchify(td_init, n_runs)\n    num_instances = batch_size * n_aug * n_runs  # NOTE: no num_starts!\n    # batch_r = n_runs * batch_size # effective batch size\n    group_s = (\n        n_start + 1\n    )  # number of different rollouts per instance (+1 for incumbent solution construction)\n\n    # Get encoder and decoder for simplicity\n    encoder = self.policy.encoder\n    decoder = self.policy.decoder\n\n    # Precompute the cache of the embeddings (i.e. q,k,v and logit_key)\n    embeddings, _ = encoder(td_init)\n    cached_embeds = decoder._precompute_cache(embeddings)\n\n    # Collect optimizer parameters\n    opt_params = []\n    if self.hparams.use_eas_layer:\n        # EASLay: replace forward of logit attention computation. 
EASLayer\n        eas_layer = EASLayerNet(num_instances, decoder.embed_dim).to(batch.device)\n        decoder.pointer.eas_layer = partial(eas_layer, decoder.pointer)\n        decoder.pointer.forward = partial(\n            forward_pointer_attn_eas_lay, decoder.pointer\n        )\n        for param in eas_layer.parameters():\n            opt_params.append(param)\n    if self.hparams.use_eas_embedding:\n        # EASEmb: set gradient of emb_key to True\n        # for all the keys, wrap the embedding in a nn.Parameter\n        for key in self.hparams.eas_emb_cache_keys:\n            setattr(\n                cached_embeds, key, torch.nn.Parameter(getattr(cached_embeds, key))\n            )\n            opt_params.append(getattr(cached_embeds, key))\n    decoder.forward_eas = partial(forward_eas, decoder)\n\n    # We pass attributes saved in policy too\n    def set_attr_if_exists(attr):\n        if hasattr(self.policy, attr):\n            setattr(decoder, attr, getattr(self.policy, attr))\n\n    for attr in [\"temperature\", \"tanh_clipping\", \"mask_logits\"]:\n        set_attr_if_exists(attr)\n\n    self.configure_optimizers(opt_params)\n\n    # Solution and reward buffer\n    max_reward = torch.full((batch_size,), -float(\"inf\"), device=batch.device)\n    best_solutions = torch.zeros(\n        batch_size, self.problem_size * 2, device=batch.device, dtype=int\n    )  # i.e. 
incumbent solutions\n\n    # Init search\n    t_start = time.time()\n    for iter_count in range(self.hparams.max_iters):\n        # Evaluate policy with sampling multistarts passing the cached embeddings\n        best_solutions_expanded = best_solutions.repeat(n_aug, 1).repeat(n_runs, 1)\n        logprobs, actions, td_out, reward = decoder.forward_eas(\n            td_init.clone(),\n            cached_embeds=cached_embeds,\n            best_solutions=best_solutions_expanded,\n            iter_count=iter_count,\n            env=self.env,\n            decode_type=\"multistart_sampling\",\n            num_starts=n_start,\n        )\n\n        # Unbatchify to get correct dimensions\n        ll = get_log_likelihood(logprobs, actions, td_out.get(\"mask\", None))\n        ll = unbatchify(ll, (n_runs * batch_size, n_aug, group_s)).squeeze()\n        reward = unbatchify(reward, (n_runs * batch_size, n_aug, group_s)).squeeze()\n        actions = unbatchify(actions, (n_runs * batch_size, n_aug, group_s)).squeeze()\n\n        # Compute REINFORCE loss with shared baselines\n        # compared to original EAS, we also support symmetric and full baselines\n        group_reward = reward[..., :-1]  # exclude incumbent solution\n        if self.hparams.baseline == \"multistart\":\n            bl_val = group_reward.mean(dim=-1, keepdim=True)\n        elif self.hparams.baseline == \"symmetric\":\n            bl_val = group_reward.mean(dim=-2, keepdim=True)\n        elif self.hparams.baseline == \"full\":\n            bl_val = group_reward.mean(dim=-1, keepdim=True).mean(\n                dim=-2, keepdim=True\n            )\n        else:\n            raise ValueError(f\"Baseline {self.hparams.baseline} not supported.\")\n\n        # REINFORCE loss\n        advantage = group_reward - bl_val\n        loss_rl = -(advantage * ll[..., :-1]).mean()\n        # IL loss\n        loss_il = -ll[..., -1].mean()\n        # Total loss\n        loss = loss_rl + self.hparams.eas_lambda * loss_il\n\n 
       # Manual backpropagation\n        opt = self.optimizers()\n        opt.zero_grad()\n        self.manual_backward(loss)\n\n        # Save best solutions and rewards\n        # Get max reward for each group and instance\n        max_reward = reward.max(dim=2)[0].max(dim=1)[0]\n\n        # Reshape and rank rewards\n        reward_group = reward.reshape(n_runs * batch_size, -1)\n        _, top_indices = torch.topk(reward_group, k=1, dim=1)\n\n        # Obtain best solutions found so far\n        solutions = actions.reshape(n_runs * batch_size, n_aug * group_s, -1)\n        best_solutions_iter = gather_by_index(solutions, top_indices, dim=1)\n        best_solutions[:, : best_solutions_iter.shape[1]] = best_solutions_iter\n\n        self.log_dict(\n            {\n                \"loss\": loss,\n                \"max_reward\": max_reward.mean(),\n                \"step\": iter_count,\n                \"time\": time.time() - t_start,\n            },\n            on_step=self.log_on_step,\n        )\n\n        log.info(\n            f\"{iter_count}/{self.hparams.max_iters} | \"\n            f\" Reward: {max_reward.mean().item():.2f} \"\n        )\n\n        # Stop if max runtime is exceeded\n        if time.time() - t_start > self.hparams.max_runtime:\n            log.info(f\"Max runtime of {self.hparams.max_runtime} seconds exceeded.\")\n            break\n\n    return {\"max_reward\": max_reward, \"best_solutions\": best_solutions}\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EAS.on_train_batch_end","title":"on_train_batch_end","text":"
on_train_batch_end(\n    outputs: STEP_OUTPUT, batch: Any, batch_idx: int\n) -> None\n

We store the best solution and reward found.

Source code in rl4co/models/zoo/eas/search.py
def on_train_batch_end(\n    self, outputs: STEP_OUTPUT, batch: Any, batch_idx: int\n) -> None:\n    \"\"\"We store the best solution and reward found.\"\"\"\n    max_rewards, best_solutions = outputs[\"max_reward\"], outputs[\"best_solutions\"]\n    self.instance_solutions.append(best_solutions)\n    self.instance_rewards.append(max_rewards)\n    log.info(f\"Best reward: {max_rewards.mean():.2f}\")\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EAS.on_train_epoch_end","title":"on_train_epoch_end","text":"
on_train_epoch_end() -> None\n

Called when the training ends.

Source code in rl4co/models/zoo/eas/search.py
def on_train_epoch_end(self) -> None:\n    \"\"\"Called when the train ends.\"\"\"\n    save_path = self.hparams.save_path\n    # concatenate solutions and rewards\n    self.instance_solutions = pad_sequence(\n        self.instance_solutions, batch_first=True, padding_value=0\n    ).squeeze()\n    self.instance_rewards = torch.cat(self.instance_rewards, dim=0).squeeze()\n    if save_path is not None:\n        log.info(f\"Saving solutions and rewards to {save_path}...\")\n        torch.save(\n            {\"solutions\": self.instance_solutions, \"rewards\": self.instance_rewards},\n            save_path,\n        )\n\n    # https://github.com/Lightning-AI/lightning/issues/1406\n    self.trainer.should_stop = True\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EASEmb","title":"EASEmb","text":"
EASEmb(*args, **kwargs)\n

Bases: EAS

EAS with embedding adaptation

Source code in rl4co/models/zoo/eas/search.py
def __init__(\n    self,\n    *args,\n    **kwargs,\n):\n    if not kwargs.get(\"use_eas_embedding\", False) or kwargs.get(\n        \"use_eas_layer\", True\n    ):\n        log.warning(\n            \"Setting `use_eas_embedding` to True and `use_eas_layer` to False. Use EAS base class to override.\"\n        )\n    kwargs[\"use_eas_embedding\"] = True\n    kwargs[\"use_eas_layer\"] = False\n    super(EASEmb, self).__init__(*args, **kwargs)\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.search.EASLay","title":"EASLay","text":"
EASLay(*args, **kwargs)\n

Bases: EAS

EAS with layer adaptation

Source code in rl4co/models/zoo/eas/search.py
def __init__(\n    self,\n    *args,\n    **kwargs,\n):\n    if kwargs.get(\"use_eas_embedding\", False) or not kwargs.get(\n        \"use_eas_layer\", True\n    ):\n        log.warning(\n            \"Setting `use_eas_embedding` to True and `use_eas_layer` to False. Use EAS base class to override.\"\n        )\n    kwargs[\"use_eas_embedding\"] = False\n    kwargs[\"use_eas_layer\"] = True\n    super(EASLay, self).__init__(*args, **kwargs)\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.decoder.forward_pointer_attn_eas_lay","title":"forward_pointer_attn_eas_lay","text":"
forward_pointer_attn_eas_lay(\n    self, query, key, value, logit_key, mask\n)\n

Add layer to the forward pass of logit attention, i.e. Single-head attention.

Source code in rl4co/models/zoo/eas/decoder.py
def forward_pointer_attn_eas_lay(self, query, key, value, logit_key, mask):\n    \"\"\"Add layer to the forward pass of logit attention, i.e.\n    Single-head attention.\n    \"\"\"\n    # Compute inner multi-head attention with no projections.\n    heads = self._inner_mha(query, key, value, mask)\n\n    # Add residual for EAS layer if is set\n    if getattr(self, \"eas_layer\", None) is not None:\n        heads = heads + self.eas_layer(heads)\n\n    glimpse = self.project_out(heads)\n\n    # Batch matrix multiplication to compute logits (batch_size, num_steps, graph_size)\n    # bmm is slightly faster than einsum and matmul\n    logits = (\n        torch.bmm(glimpse, logit_key.squeeze(1).transpose(-2, -1))\n        / math.sqrt(glimpse.size(-1))\n    ).squeeze(1)\n\n    return logits\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.decoder.forward_eas","title":"forward_eas","text":"
forward_eas(\n    self,\n    td: TensorDict,\n    cached_embeds,\n    best_solutions,\n    iter_count: int = 0,\n    env: Union[str, RL4COEnvBase] = None,\n    decode_type: str = \"multistart_sampling\",\n    num_starts: int = None,\n    mask_logits: bool = True,\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    **decode_kwargs\n)\n

Forward pass of the decoder. Given the environment state and the pre-computed embeddings, compute the logits and sample actions.

Parameters:

  • td (TensorDict) \u2013

    Input TensorDict containing the environment state

  • cached_embeds \u2013

    Precomputed embeddings for the nodes. Can already be cached in the form of q, k, v and logit_key.

  • env (Union[str, RL4COEnvBase], default: None ) \u2013

    Environment to use for decoding. If None, the environment is instantiated from env_name. Note that it is more efficient to pass an already instantiated environment each time for fine-grained control

  • decode_type (str, default: 'multistart_sampling' ) \u2013

    Type of decoding to use. Can be one of:

    • \"sampling\": sample from the logits
    • \"greedy\": take the argmax of the logits
    • \"multistart_sampling\": sample as sampling, but with multi-start decoding
    • \"multistart_greedy\": sample as greedy, but with multi-start decoding
  • num_starts (int, default: None ) \u2013

    Number of multi-starts to use. If None, will be calculated from the action mask

  • calc_reward \u2013

    Whether to calculate the reward for the decoded sequence

Source code in rl4co/models/zoo/eas/decoder.py
def forward_eas(\n    self,\n    td: TensorDict,\n    cached_embeds,\n    best_solutions,\n    iter_count: int = 0,\n    env: Union[str, RL4COEnvBase] = None,\n    decode_type: str = \"multistart_sampling\",\n    num_starts: int = None,\n    mask_logits: bool = True,\n    temperature: float = 1.0,\n    tanh_clipping: float = 0,\n    **decode_kwargs,\n):\n    \"\"\"Forward pass of the decoder\n    Given the environment state and the pre-computed embeddings, compute the logits and sample actions\n\n    Args:\n        td: Input TensorDict containing the environment state\n        embeddings: Precomputed embeddings for the nodes. Can be already precomputed cached in form of q, k, v and\n        env: Environment to use for decoding. If None, the environment is instantiated from `env_name`. Note that\n            it is more efficient to pass an already instantiated environment each time for fine-grained control\n        decode_type: Type of decoding to use. Can be one of:\n            - \"sampling\": sample from the logits\n            - \"greedy\": take the argmax of the logits\n            - \"multistart_sampling\": sample as sampling, but with multi-start decoding\n            - \"multistart_greedy\": sample as greedy, but with multi-start decoding\n        num_starts: Number of multi-starts to use. 
If None, will be calculated from the action mask\n        calc_reward: Whether to calculate the reward for the decoded sequence\n    \"\"\"\n    # TODO: this could be refactored by decoding strategies\n\n    # Collect logprobs\n    logprobs = []\n    actions = []\n\n    decode_step = 0\n    # Multi-start decoding: first action is chosen by ad-hoc node selection\n    if num_starts > 1 or \"multistart\" in decode_type:\n        action = env.select_start_nodes(td, num_starts + 1) % num_starts\n        # Append incumbent solutions\n        if iter_count > 0:\n            action = unbatchify(action, num_starts + 1)\n            action[:, -1] = best_solutions[:, decode_step]\n            action = action.permute(1, 0).reshape(-1)\n\n        # Expand td to batch_size * (num_starts + 1)\n        td = batchify(td, num_starts + 1)\n\n        td.set(\"action\", action)\n        td = env.step(td)[\"next\"]\n        logp = torch.zeros_like(\n            td[\"action_mask\"], device=td.device\n        )  # first logprobs is 0, so p = logprobs.exp() = 1\n\n        logprobs.append(logp)\n        actions.append(action)\n\n    # Main decoding: loop until all sequences are done\n    while not td[\"done\"].all():\n        decode_step += 1\n        logits, mask = self.forward(td, cached_embeds, num_starts + 1)\n\n        logp = process_logits(\n            logits,\n            mask,\n            temperature=self.temperature if self.temperature is not None else temperature,\n            tanh_clipping=self.tanh_clipping\n            if self.tanh_clipping is not None\n            else tanh_clipping,\n            mask_logits=self.mask_logits if self.mask_logits is not None else mask_logits,\n        )\n\n        # Select the indices of the next nodes in the sequences, result (batch_size) long\n        action = decode_logprobs(logp, mask, decode_type=decode_type)\n\n        if iter_count > 0:  # append incumbent solutions\n            init_shp = action.shape\n            action = 
unbatchify(action, num_starts + 1)\n            action[:, -1] = best_solutions[:, decode_step]\n            action = action.permute(1, 0).reshape(init_shp)\n\n        td.set(\"action\", action)\n        td = env.step(td)[\"next\"]\n\n        # Collect output of step\n        logprobs.append(logp)\n        actions.append(action)\n\n    logprobs, actions = torch.stack(logprobs, 1), torch.stack(actions, 1)\n    rewards = env.get_reward(td, actions)\n    return logprobs, actions, td, rewards\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.nn.EASLayerNet","title":"EASLayerNet","text":"
EASLayerNet(num_instances: int, emb_dim: int)\n

Bases: Module

Instantiate weights and biases for the added layer. The layer is defined as: h = relu(emb * W1 + b1); out = h * W2 + b2. Wrapping in nn.Parameter makes the parameters trainable and sets gradient to True.

Parameters:

  • num_instances (int) \u2013

    Number of instances in the dataset

  • emb_dim (int) \u2013

    Dimension of the embedding

Methods:

  • forward \u2013

    emb: [num_instances, group_num, emb_dim]

Source code in rl4co/models/zoo/eas/nn.py
def __init__(self, num_instances: int, emb_dim: int):\n    super().__init__()\n    # W2 and b2 are initialized to zero so in the first iteration the layer is identity\n    self.W1 = nn.Parameter(torch.randn(num_instances, emb_dim, emb_dim))\n    self.b1 = nn.Parameter(torch.randn(num_instances, 1, emb_dim))\n    self.W2 = nn.Parameter(torch.zeros(num_instances, emb_dim, emb_dim))\n    self.b2 = nn.Parameter(torch.zeros(num_instances, 1, emb_dim))\n    torch.nn.init.xavier_uniform_(self.W1)\n    torch.nn.init.xavier_uniform_(self.b1)\n
"},{"location":"docs/content/api/zoo/transductive/#models.zoo.eas.nn.EASLayerNet.forward","title":"forward","text":"
forward(*args)\n

emb: [num_instances, group_num, emb_dim]

Source code in rl4co/models/zoo/eas/nn.py
def forward(self, *args):\n    \"\"\"emb: [num_instances, group_num, emb_dim]\"\"\"\n    # get tensor arg (from partial instantiation)\n    emb = [arg for arg in args if isinstance(arg, torch.Tensor)][0]\n    h = torch.relu(torch.matmul(emb, self.W1) + self.b1.expand_as(emb))\n    return torch.matmul(h, self.W2) + self.b2.expand_as(h)\n
"},{"location":"docs/content/general/ai4co/","title":"AI4CO Community","text":"

We invite you to join our AI4CO community, an open and inclusive research group in Artificial Intelligence (AI) for Combinatorial Optimization (CO)!

"},{"location":"docs/content/general/ai4co/#links","title":"Links","text":"
  • GitHub
  • Slack
  • Website (coming soon!)
"},{"location":"docs/content/general/contribute/","title":"Contributing to RL4CO","text":"

Have a suggestion, request, or found a bug? Feel free to open an issue or submit a pull request. If you would like to contribute, please check out our contribution guidelines here. We welcome and look forward to all contributions to RL4CO!

We are also on Slack if you have any questions or would like to discuss RL4CO with us. We are open to collaborations and would love to hear from you \ud83d\ude80

"},{"location":"docs/content/general/contribute/#contributors","title":"Contributors","text":""},{"location":"docs/content/general/faq/","title":"FAQ","text":"

You can submit your questions via GitHub Issues or Discussions.

You may search for your question in the existing issues or discussions before submitting a new one. If asked more than a few times, we will add it here!

"},{"location":"docs/content/general/faq/#i-ran-into-an-error-in-the-tutorials-what-should-i-do","title":"I ran into an error in the tutorials. What should I do?","text":"

We try our best to test the tutorials, but some edge cases may not be covered. If you encounter an issue, we first recommend installing the bleeding-edge version of the library from source, which may resolve it. You can do this by running the following command:

pip install -U git+https://github.com/ai4co/rl4co.git\n

If you still encounter an error, check the open issues on GitHub here and, if yours has not been reported yet, open a new one. Remember to report the versions of the library and the environment you are using with the following command:

python -c 'from rl4co.utils import show_versions; show_versions()'\n
"},{"location":"docs/content/general/licensing/","title":"License and Usage","text":"

Our library is released under the MIT License, which is an open and permissive license. This means:

  • You can use, modify, and distribute the code without any restrictions, even for commercial purposes.
  • Your projects will not inherit any additional limitations from our library, even if you modify or extend it.

All contributions to the library are covered by the MIT License, ensuring that everything is free to use under the same open terms. A copy of the license is available here.

"},{"location":"docs/content/general/paper/","title":"Paper and Citation","text":""},{"location":"docs/content/general/paper/#paper-reference","title":"Paper Reference","text":"

Our paper is available here for further details.

If you find RL4CO valuable for your research or applied projects, don't forget to cite us! \ud83d\ude80

@article{berto2024rl4co,\n    title={{RL4CO: an Extensive Reinforcement Learning for Combinatorial Optimization Benchmark}},\n    author={Federico Berto and Chuanbo Hua and Junyoung Park and Laurin Luttmann and Yining Ma and Fanchen Bu and Jiarui Wang and Haoran Ye and Minsu Kim and Sanghyeok Choi and Nayeli Gast Zepeda and Andr\\'e Hottung and Jianan Zhou and Jieyi Bi and Yu Hu and Fei Liu and Hyeonah Kim and Jiwoo Son and Haeyeon Kim and Davide Angioni and Wouter Kool and Zhiguang Cao and Jie Zhang and Kijung Shin and Cathy Wu and Sungsoo Ahn and Guojie Song and Changhyun Kwon and Lin Xie and Jinkyoo Park},\n    year={2024},\n    journal={arXiv preprint arXiv:2306.17100},\n    note={\\url{https://github.com/ai4co/rl4co}}\n}\n
"},{"location":"docs/content/intro/environments/","title":"Environments","text":""},{"location":"docs/content/intro/environments/#definition","title":"Definition","text":"

Given a CO problem instance \\(\\mathbf{x}\\), we formulate the solution-generating procedure as a Markov Decision Process (MDP) characterized by a tuple \\((\\mathcal{S}, \\mathcal{A}, \\mathcal{T}, \\mathcal{R}, \\gamma)\\) as follows:

  • State \\(\\mathcal{S}\\) is the space of states that represent the given problem \\(\\mathbf{x}\\) and the current partial solution being updated in the MDP.
  • Action \\(\\mathcal{A}\\) is the action space, which includes all feasible actions \\(a_t\\) that can be taken at each step \\(t\\).
  • State Transition \\(\\mathcal{T}\\) is the deterministic state transition function \\(s_{t+1} = \\mathcal{T}(s_t, a_t)\\) that updates a state \\(s_t\\) to the next state \\(s_{t+1}\\).
  • Reward \\(\\mathcal{R}\\) is the reward function \\(\\mathcal{R}(s_t, a_t)\\) representing the immediate reward received after taking action \\(a_t\\) in state \\(s_t\\).
  • Discount Factor \\(\\gamma \\in [0, 1]\\) determines the importance of future rewards. Often, \\(\\gamma = 1\\) is used for CO problems, i.e., no discounting.

Since the state transition is deterministic, we represent the solution for a problem \\(\\mathbf{x}\\) as a sequence of \\(T\\) actions \\(\\mathbf{a} = (a_1, \\ldots, a_T)\\). Then the total return \\(\\sum_{t=1}^T \\mathcal{R}(s_t, a_t)\\) translates to the negative cost function of the CO problem.

In the following, we define the above MDP for the main CO problem types we consider in our library.

"},{"location":"docs/content/intro/environments/#routing-problems","title":"Routing Problems","text":"

Routing problems are perhaps the best-known class of CO problems. They are problems of great practical importance, not only for logistics, where they are more commonly framed, but also for industry, engineering, science, and medicine. The typical objective of routing problems is to minimize the total length of the paths needed to visit some (or all) of the nodes in a graph \\(G = (V, E)\\), where \\(V\\) is the set of nodes, \\(E\\) is the set of edges, and \\(i, j \\in V\\) are nodes in the graph.

"},{"location":"docs/content/intro/environments/#mdp","title":"MDP","text":"

For routing problems, in RL4CO we consider two types of MDPs: Construction MDP and Improvement MDP.

"},{"location":"docs/content/intro/environments/#construction-mdp","title":"Construction MDP","text":"

The Construction MDP describes a process of iteratively building a solution from scratch:

  • State \\(s_t \\in \\mathcal{S}\\): Reflects (1) node-level information for each customer node (e.g., coordinates, demand), (2) global-level information about the route construction (e.g., remaining vehicle capacity), and (3) the current partial solution \\(\\{a_1, \\ldots, a_{t-1}\\}\\) where \\(a_i\\) is the previously selected node (action) at time \\(i\\). The initial state at \\(t = 0\\) has an empty partial solution.
  • Action \\(a_t \\in \\mathcal{A}\\): Choosing a valid node from set \\(V\\). The action space is state-dependent, with infeasible actions masked to ensure all constraints are satisfied.
  • Transition \\(\\mathcal{T}\\): Deterministic transition that adds the selected action \\(a_t\\) to the partial solution, updating it from \\(\\{a_1, \\ldots, a_{t-1}\\}\\) to \\(\\{a_1, \\ldots, a_{t-1}, a_t\\}\\), and updates the node-level and global-level information accordingly.
  • Reward \\(\\mathcal{R}\\): Typically set to the negative value of the increase in tour length, ensuring that maximizing cumulative rewards is equivalent to minimizing the tour length objective.
  • Policy \\(\\pi\\): Usually parameterized by a deep neural network, it decides on an action \\(a_t\\) given the input state \\(s_t\\). The policy is typically stochastic, learning an action distribution for selecting each node.
"},{"location":"docs/content/intro/environments/#improvement-mdp","title":"Improvement MDP","text":"

The Improvement MDP describes a search process similar to neighborhood search, starting from a sub-optimal solution \\(\\mathbf{a}^{0}=(a_{0}^{0},\\ldots, a_{T-1}^{0})\\) and finding another one potentially with higher quality:

  • State \\(s_t \\in \\mathcal{S}\\): Reflects (1) node-level information for each customer node, (2) global-level information about the search (e.g., historical visited solutions and their costs), and (3) the current solution \\(\\mathbf{a}^{t}\\). The initial state \\(s_0\\) contains a randomly generated feasible solution \\(\\mathbf{a}^{0}\\).
  • Action \\(a_t \\in \\mathcal{A}\\): A specific operation that changes the current solution \\(\\mathbf{a}^{t}\\) into a new one \\(\\mathbf{a}^{t+1}\\). For example, specifying two nodes \\((i, j)\\) in \\(V\\) to perform a pairwise local search operation.
  • Transition \\(\\mathcal{T}\\): Usually deterministic, accepting the proposed solution \\(\\mathbf{a}^{t+1}\\) as the solution for the next state and updating node-level and global-level information accordingly.
  • Reward \\(\\mathcal{R}\\): Typically set to the immediate reduced objective value of the current best-so-far solution after taking the local search action.
  • Policy \\(\\pi\\): Usually stochastic and parameterized by a deep model. The time horizon can be user-specified based on the available time budget, often requiring a discount factor \\(\\gamma < 1\\).

The best solution found throughout the improvement horizon is recognized as the final solution to the routing problem.

"},{"location":"docs/content/intro/environments/#documentation","title":"Documentation","text":"

Click here for API documentation on routing problems.

"},{"location":"docs/content/intro/environments/#scheduling-problems","title":"Scheduling Problems","text":"

Scheduling problems are a fundamental class of problems in operations research and industrial engineering, where the objective is to optimize the allocation of resources over time. These problems are critical in various industries, such as manufacturing, computer science, and project management.

"},{"location":"docs/content/intro/environments/#mdp_1","title":"MDP","text":"

Here we show a general constructive MDP formulation based on the Job Shop Scheduling Problem (JSSP), a well-known scheduling problem, which can be adapted to other scheduling problems.

  • State \\(s_t \\in \\mathcal{S}\\): The state is represented by a disjunctive graph, where:
    • Operations are nodes
    • Processing orders between operations are shown by directed arcs
    • This graph encapsulates both the problem instance and the current partial schedule
  • Action \\(a_t \\in \\mathcal{A}\\): An action involves selecting a feasible operation to assign to its designated machine, a process often referred to as dispatching. The action space consists of all operations that can be feasibly scheduled at the current state.
  • Transition \\(\\mathcal{T}\\): The transition function deterministically updates the disjunctive graph based on the dispatched operation. This includes:
    • Modifying the graph's topology (e.g., adding new connections between operations)
    • Updating operation attributes (e.g., start times)
  • Reward \\(\\mathcal{R}\\): The reward function is designed to align with the optimization objective. For instance, if minimizing makespan is the goal, the reward could be the negative change in makespan resulting from the latest action.
  • Policy \\(\\pi\\): The policy, typically stochastic, takes the current disjunctive graph as input and outputs a probability distribution over feasible dispatching actions. This process continues until a complete schedule is constructed.
"},{"location":"docs/content/intro/environments/#documentation_1","title":"Documentation","text":"

Click here for API documentation on scheduling problems.

"},{"location":"docs/content/intro/environments/#electronic-design-automation","title":"Electronic Design Automation","text":"

Electronic Design Automation (EDA) is a sophisticated process that involves the use of software tools to design, simulate, and analyze electronic systems, particularly integrated circuits (ICs) and printed circuit boards (PCBs). EDA encompasses a wide range of tasks, from schematic capture and layout design to verification and testing. Optimization is a critical aspect of EDA, where the goal is to achieve the best possible performance, power efficiency, and cost within the constraints of the design.

"},{"location":"docs/content/intro/environments/#mdp_2","title":"MDP","text":"

EDA encompasses many problem types; here we'll focus on placement problems, which are fundamental in the physical design of integrated circuits and printed circuit boards. We'll use the Decap Placement Problem (DPP) as an example to illustrate a typical MDP formulation for EDA placement problems.

  • State \\(s_t \\in \\mathcal{S}\\): The state typically represents the current configuration of the design space, which may include:
    • Locations of fixed elements (e.g., ports, keepout regions)
    • Current placements of movable elements
    • Remaining resources or components to be placed
  • Action \\(a_t \\in \\mathcal{A}\\): An action usually involves placing a component at a valid location within the design space. The action space consists of all feasible placement locations, considering design rules and constraints.
  • Transition \\(\\mathcal{T}\\): The transition function updates the design state based on the placement action, which may include:
    • Updating the placement map
    • Adjusting available resources or remaining components
    • Recalculating relevant metrics (e.g., wire length, power distribution)
  • Reward \\(\\mathcal{R}\\): The reward is typically based on the improvement in the design objective resulting from the latest placement action. This could involve metrics such as area efficiency, signal integrity, or power consumption.
  • Policy \\(\\pi\\): The policy takes the current design state as input and outputs a probability distribution over possible placement actions.

Note that specific problems may introduce additional complexities or constraints.

"},{"location":"docs/content/intro/environments/#documentation_2","title":"Documentation","text":"

Click here for API documentation on EDA problems.

"},{"location":"docs/content/intro/environments/#graph-problems","title":"Graph Problems","text":"

Many CO problems can be (re-)formulated on graphs. In typical CO problems on graphs, actions are defined on nodes/edges, while problem variables and constraints are incorporated in graph topology and node/edge attributes (e.g., weights). The graph-based formulation gives us concise and systematic representations of CO problems.

In graph problems, we typically work with a graph \\(G = (V, E)\\), where \\(V\\) is a set of vertices (or nodes) and \\(E\\) is a set of edges connecting these vertices. The optimization task often involves selecting a subset of vertices, edges, or subgraphs to maximize or minimize a given objective function, subject to certain constraints.

"},{"location":"docs/content/intro/environments/#mdp_3","title":"MDP","text":"

Graph problems can be effectively modeled using a Markov Decision Process (MDP) framework in a constructive fashion. Here, we outline the key components of the MDP formulation for graph problems:

  • State \\(s_t \\in \\mathcal{S}\\): The state encapsulates the current configuration of the graph and the optimization progress. It typically includes:
    • The graph structure (vertices and edges)
    • Attributes associated with vertices or edges
    • The set of elements (vertices, edges, or subgraphs) selected so far
    • Problem-specific information, such as remaining selections or resources
  • Action \\(a_t \\in \\mathcal{A}\\): An action usually involves selecting a graph element (e.g., a vertex, edge, or subgraph). The action space comprises all valid selections based on the problem constraints and the current state.
  • Transition \\(\\mathcal{T}\\): The transition function \\(\\mathcal{T}(s_t, a_t) \\rightarrow s_{t+1}\\) updates the graph state based on the selected action. This typically involves:
    • Updating the set of selected elements
    • Modifying graph attributes affected by the selection
    • Updating problem-specific information (e.g., remaining selections or resources)
  • Reward \\(\\mathcal{R}\\): The reward function \\(\\mathcal{R}(s_t, a_t)\\) quantifies the quality of the action taken. It is typically based on the improvement in the optimization objective resulting from the latest selection. This could involve metrics such as coverage, distance, connectivity, or any other problem-specific criteria.
  • Policy \\(\\pi\\): The policy \\(\\pi(a_t|s_t)\\) is a probability distribution over possible actions given the current state. It guides the decision-making process, determining which graph elements to select at each step to optimize the objective.

Specific problems may introduce additional complexities or constraints, which can often be incorporated through careful design of the state space, action space, and reward function.

"},{"location":"docs/content/intro/environments/#documentation_3","title":"Documentation","text":"

Click here for API documentation on graph problems.

"},{"location":"docs/content/intro/environments/#implementation-details","title":"Implementation Details","text":"

Environments in our library fully specify the CO problems and their logic. They are based on the RL4COEnvBase class that extends from the EnvBase in TorchRL.

Key features:

  • A modular generator can be provided to the environment.
  • The generator provides CO instances to the environment, and different generators can be used to generate different data distributions.
  • Static instance data and dynamic variables, such as the current state \\(s_t\\), current solution \\(\\mathbf{a}^k\\) for improvement environments, policy actions \\(a_t\\), rewards, and additional information are passed in a stateless fashion in a TensorDict, that we call td, through the environment reset and step functions.

Our environment API contains several functions:

  • render
  • check_solution_validity
  • select_start_nodes (i.e., for POMO-based optimization)
  • Optional API such as local_search for solution improvement

It's worth noting that our library enhances the efficiency of environments when compared to vanilla TorchRL, by overriding and optimizing some methods in TorchRL EnvBase. For instance, our new step method brings a decrease of up to 50% in latency and halves the memory impact by avoiding saving duplicate components in the stateless TensorDict.

"},{"location":"docs/content/intro/intro/","title":"Introduction","text":"

RL4CO is an extensive Reinforcement Learning (RL) for Combinatorial Optimization (CO) benchmark. Our goal is to provide a unified framework for RL-based CO algorithms, and to facilitate reproducible research in this field, decoupling the science from the engineering.

"},{"location":"docs/content/intro/intro/#motivation","title":"Motivation","text":""},{"location":"docs/content/intro/intro/#why-nco","title":"Why NCO?","text":"

Neural Combinatorial Optimization (NCO) is a subfield of AI that aims to solve combinatorial optimization problems using neural networks. NCO has been successfully applied to a wide range of problems, such as the routing problems in logistics, the scheduling problems in manufacturing, and electronic design automation. The key idea behind NCO is to learn a policy that maps the input data to the optimal solution, without the need for hand-crafted heuristics or domain-specific knowledge.

"},{"location":"docs/content/intro/intro/#why-rl","title":"Why RL?","text":"

Reinforcement Learning (RL) is a machine learning paradigm that enables agents to learn how to make decisions by interacting with an environment. RL has been successfully applied to a wide range of problems, such as playing games, controlling robots, and optimizing complex systems. The key idea behind RL is to learn a policy that maps the state of the environment to the optimal action, by maximizing a reward signal. Importantly, optimal solutions are not required for training, as RL agents learn from the feedback they receive from the environment.

"},{"location":"docs/content/intro/intro/#contents","title":"Contents","text":"

We explore in other pages the following components:

  • Environments: Markov Decision Process (MDP) for CO problems and base classes for environments. These are based on TorchRL.
  • Policies: the neural networks that are used to solve CO problems and their base classes. These are based on PyTorch.
  • RL Algorithms: (broadly: \"models\"), which are the processes used to train the policies and their base classes. These are based on PyTorch Lightning.
"},{"location":"docs/content/intro/intro/#paper-reference","title":"Paper Reference","text":"

Our paper is available here for further details.

If you find RL4CO valuable for your research or applied projects, don't forget to cite us! \ud83d\ude80

@article{berto2024rl4co,\n    title={{RL4CO: an Extensive Reinforcement Learning for Combinatorial Optimization Benchmark}},\n    author={Federico Berto and Chuanbo Hua and Junyoung Park and Laurin Luttmann and Yining Ma and Fanchen Bu and Jiarui Wang and Haoran Ye and Minsu Kim and Sanghyeok Choi and Nayeli Gast Zepeda and Andr\\'e Hottung and Jianan Zhou and Jieyi Bi and Yu Hu and Fei Liu and Hyeonah Kim and Jiwoo Son and Haeyeon Kim and Davide Angioni and Wouter Kool and Zhiguang Cao and Jie Zhang and Kijung Shin and Cathy Wu and Sungsoo Ahn and Guojie Song and Changhyun Kwon and Lin Xie and Jinkyoo Park},\n    year={2024},\n    journal={arXiv preprint arXiv:2306.17100},\n    note={\\url{https://github.com/ai4co/rl4co}}\n}\n
"},{"location":"docs/content/intro/policies/","title":"Policies","text":"

The policies can be categorized into constructive policies, which generate a solution from scratch, and improvement policies, which refine an existing solution.

"},{"location":"docs/content/intro/policies/#constructive-policies","title":"Constructive policies","text":"

A policy \\(\\pi\\) is used to construct a solution from scratch for a given problem instance \\(\\mathbf{x}\\). It can be further categorized into autoregressive (AR) and non-autoregressive (NAR) policies.

"},{"location":"docs/content/intro/policies/#autoregressive-ar-policies","title":"Autoregressive (AR) policies","text":"

An AR policy is composed of an encoder \\(f\\) that maps the instance \\(\\mathbf{x}\\) into an embedding space \\(\\mathbf{h}=f(\\mathbf{x})\\) and a decoder \\(g\\) that iteratively determines a sequence of actions \\(\\mathbf{a}\\) as follows:

\\[ a_t \\sim g(a_t | a_{t-1}, ... ,a_0, s_t, \\mathbf{h}), \\quad \\pi(\\mathbf{a}|\\mathbf{x}) \\triangleq \\prod_{t=1}^{T-1} g(a_{t} | a_{t-1}, \\ldots ,a_0, s_t, \\mathbf{h}). \\]"},{"location":"docs/content/intro/policies/#non-autoregressive-nar-policies","title":"Non-autoregressive (NAR) policies","text":"

A NAR policy encodes a problem \\(\\mathbf{x}\\) into a heuristic \\(\\mathcal{H} = f(\\mathbf{x}) \\in \\mathbb{R}^{N}_{+}\\), where \\(N\\) is the number of possible assignments across all decision variables. Each number in \\(\\mathcal{H}\\) represents an (unnormalized) probability of a particular assignment. To obtain a solution \\(\\mathbf{a}\\) from \\(\\mathcal{H}\\), one can sample a sequence of assignments from \\(\\mathcal{H}\\) while dynamically masking infeasible assignments to meet problem-specific constraints. It can also guide a search process, e.g., Ant Colony Optimization, or be incorporated into hybrid frameworks. Here, the heuristic helps identify promising transitions and improve the efficiency of finding an optimal or near-optimal solution.

"},{"location":"docs/content/intro/policies/#improvement-policies","title":"Improvement policies","text":"

A policy can be used for improving an initial solution \\(\\mathbf{a}^{0}=(a_{0}^{0},\\ldots, a_{T-1}^{0})\\) into another one potentially with higher quality, which can be formulated as follows:

\\[ \\mathbf{a}^k \\sim g(\\mathbf{a}^{0}, \\mathbf{h}), \\quad\\pi(\\mathbf{a}^K|\\mathbf{a}^0,\\mathbf{x}) \\triangleq \\prod_{k=1}^{K-1} g(\\mathbf{a}^k | \\mathbf{a}^{k-1}, ... ,\\mathbf{a}^0, \\mathbf{h}), \\]

where \\(\\mathbf{a}^{k}\\) is the \\(k\\)-th updated solution and \\(K\\) is the budget for number of improvements. This process allows continuous refinement for a long time to enhance the solution quality.

"},{"location":"docs/content/intro/policies/#implementation","title":"Implementation","text":"

Policies in our library are subclasses of PyTorch's nn.Module and contain the encoding-decoding logic and neural network parameters \\(\\theta\\). Different policies in the RL4CO \"zoo\" can inherit from base classes like ConstructivePolicy or ImprovementPolicy. We modularize components to process raw features into the embedding space via a parametrized function \\(\\phi_\\omega\\), called feature embeddings.

  1. Node Embeddings \\(\\phi_n\\): transform \\(m_n\\) node features of instances \\(\\mathbf{x}\\) from the feature space to the embedding space \\(h\\), i.e., \\([B, N, m_n] \\rightarrow [B, N, h]\\).
  2. Edge Embeddings \\(\\phi_e\\): transform \\(m_e\\) edge features of instances \\(\\mathbf{x}\\) from the feature space to the embedding space \\(h\\), i.e., \\([B, E, m_e] \\rightarrow [B, E, h]\\), where \\(E\\) is the number of edges.
  3. Context Embeddings \\(\\phi_c\\): capture contextual information by transforming \\(m_c\\) context features from the current decoding step \\(s_t\\) from the feature space to the embedding space \\(h\\), i.e., \\([B, m_c] \\rightarrow [B, h]\\), for nodes or edges.

Embeddings can be automatically selected by our library at runtime by simply passing the env_name to the policy. Additionally, we allow for granular control of any higher-level policy component independently, such as encoders and decoders.

"},{"location":"docs/content/intro/rl/","title":"RL Algorithms","text":""},{"location":"docs/content/intro/rl/#definitions","title":"Definitions","text":"

The RL objective is to learn a policy \\(\\pi\\) that maximizes the expected cumulative reward (or equivalently minimizes the cost) over the distribution of problem instances:

\\[ \\theta^{*} = \\underset{\\theta}{\\text{argmax}} \\, \\mathbb{E}_{\\mathbf{x} \\sim P(\\mathbf{x})} \\left[ \\mathbb{E}_{\\pi(\\mathbf{a}|\\mathbf{x})} \\left[ \\sum_{t=0}^{T-1} \\gamma^t \\mathcal{R}(s_t, a_t) \\right] \\right], \\]

where \\(\\theta\\) is the set of parameters of \\(\\pi\\) and \\(P(\\mathbf{x})\\) is the distribution of problem instances.

This equation can be solved using algorithms such as variations of REINFORCE, Advantage Actor-Critic (A2C) methods, or Proximal Policy Optimization (PPO).

These algorithms are employed to train the policy network \\(\\pi\\), by transforming the maximization problem into a minimization problem involving a loss function, which is then optimized using gradient descent algorithms. For instance, the REINFORCE loss function gradient is given by:

\\[ \\nabla_{\\theta} \\mathcal{L}_a(\\theta|\\mathbf{x}) = \\mathbb{E}_{\\pi(\\mathbf{a}|\\mathbf{x})} \\left[(R(\\mathbf{a}, \\mathbf{x}) - b(\\mathbf{x})) \\nabla_{\\theta}\\log \\pi(\\mathbf{a}|\\mathbf{x})\\right], \\]

where \\(b(\\cdot)\\) is a baseline function used to stabilize training and reduce gradient variance.

We also distinguish between two types of RL (pre)training:

  1. Inductive RL: The focus is on learning patterns from the training dataset to generalize to new instances, thus amortizing the inference procedure.
  2. Transductive RL (or test-time optimization): Optimizes parameters during testing on target instances.

Typically, a policy \\(\\pi\\) is trained using inductive RL, followed by transductive RL for test-time optimization.

"},{"location":"docs/content/intro/rl/#implementation","title":"Implementation","text":"

RL algorithms in our library define the process that takes the Environment with its problem instances and the Policy to optimize its parameters \\(\\theta\\). The parent class of algorithms is the RL4COLitModule, inheriting from PyTorch Lightning's pl.LightningModule. This allows for granular support of various methods including the [train, val, test]_step, automatic logging with several logging services such as Wandb via log_metrics, automatic optimizer configuration via configure_optimizers and several useful callbacks for RL methods such as on_train_epoch_end.

RL algorithms are additionally attached to an RL4COTrainer, a wrapper we made with additional optimizations around pl.Trainer. This module seamlessly supports features of modern training pipelines, including:

  • Logging
  • Checkpoint management
  • Mixed-precision training
  • Various hardware acceleration supports (e.g., CPU, GPU, TPU, and Apple Silicon)
  • Multi-device hardware accelerator in distributed settings

For instance, using mixed-precision training significantly decreases training time without sacrificing much convergence and enables us to leverage recent routines, e.g., FlashAttention.

"},{"location":"docs/content/start/hydra/","title":"Training with Hydra Configurations","text":"

You may find Hydra configurations under configs/ divided into categories (model, env, train, experiment, etc.).

In practice, we usually want to modify configurations under the experiment folder; we report an example below.

"},{"location":"docs/content/start/hydra/#usage","title":"Usage","text":"

Train model with default configuration (AM on TSP environment):

python run.py\n

"},{"location":"docs/content/start/hydra/#change-experiment","title":"Change experiment","text":"

Train model with chosen experiment configuration from configs/experiment/

python run.py experiment=routing/am env=tsp env.generator_params.num_loc=50 model.optimizer_kwargs.lr=2e-4\n
Here you may change the environment, e.g. with env=cvrp by command line or by modifying the corresponding experiment e.g. configs/experiment/routing/am.yaml.

"},{"location":"docs/content/start/hydra/#disable-logging","title":"Disable logging","text":"

python run.py experiment=test/am logger=none '~callbacks.learning_rate_monitor'\n
Note that ~ is used to disable a callback that would need a logger.

"},{"location":"docs/content/start/hydra/#create-a-sweep-over-hyperparameters","title":"Create a sweep over hyperparameters","text":"

We can use -m for multirun:

python run.py -m experiment=routing/am  model.optimizer_kwargs.lr=1e-3,1e-4,1e-5\n
"},{"location":"docs/content/start/hydra/#experiment-configuration-example","title":"Experiment Configuration Example","text":"

We report here a configuration for running the Attention Model (AM) on a TSP environment with 50 locations that can be placed under configs/experiment:

# @package _global_\n\ndefaults:\n\n  - override /model: am.yaml\n  - override /env: tsp.yaml\n  - override /callbacks: default.yaml\n  - override /trainer: default.yaml\n  - override /logger: wandb.yaml\n\nenv:\n  generator_params:\n    loc_distribution: \"uniform\"\n    num_loc: 50\n\nmodel:\n  policy:\n    _target_: \"rl4co.models.zoo.am.AttentionModelPolicy\"\n    embed_dim: 128\n    num_heads: 8\n    num_encoder_layers: 3\n  batch_size: 512\n  val_batch_size: 1024\n  test_batch_size: 1024\n  train_data_size: 1_280_000\n  val_data_size: 10_000\n  test_data_size: 10_000\n  optimizer_kwargs:\n    lr: 1e-4\n    weight_decay: 1e-6\n  lr_scheduler:\n    \"MultiStepLR\"\n  lr_scheduler_kwargs:\n    milestones: [80, 95]\n    gamma: 0.1\n\ntrainer:\n  max_epochs: 100\n\nlogger:\n  wandb:\n    project: \"rl4co\"\n    tags: [\"am\", \"${env.name}\"]\n    group: ${env.name}${env.generator_params.num_loc}\n    name: am-${env.name}${env.generator_params.num_loc}\n

What does this configuration do? Let's break it down!

defaults:\n\n  - override /model: am.yaml\n  - override /env: tsp.yaml\n  - override /callbacks: default.yaml\n  - override /trainer: default.yaml\n  - override /logger: wandb.yaml\n

This section sets the default configuration for the model, environment, callbacks, trainer, and logger. This means that if a key is not specified in the experiment configuration, the default value will be used. Note that these are set in the root configs/ folder, and are useful for better organization and reusability.

env: \n  generator_params:\n    loc_distribution: \"uniform\"\n    num_loc: 50\n

This section specifies the environment configuration. In this case, we are using the TSP environment with 50 locations generated uniformly.

model:\n  policy:\n    _target_: \"rl4co.models.zoo.am.AttentionModelPolicy\"\n    embed_dim: 128\n    num_heads: 8\n    num_encoder_layers: 3\n  batch_size: 512\n  val_batch_size: 1024\n  test_batch_size: 1024\n  train_data_size: 1_280_000\n  val_data_size: 10_000\n  test_data_size: 10_000\n  optimizer_kwargs:\n    lr: 1e-4\n    weight_decay: 1e-6\n  lr_scheduler:\n    \"MultiStepLR\"\n  lr_scheduler_kwargs:\n    milestones: [80, 95]\n    gamma: 0.1\n

This section specifies the RL model (i.e., Lightning module) configuration. While this usually includes the policy architecture already (hence the name \"model\"), we can override it by specifying a _target_ key and additional parameters to initialize the policy. Finally, we specify the batch sizes, data sizes, optimizer parameters, and learning rate scheduler.

trainer:\n  max_epochs: 100\n

This section specifies the trainer configuration. Here, we are training the model for 100 epochs.

logger:\n  wandb:\n    project: \"rl4co\"\n    tags: [\"am\", \"${env.name}\"]\n    group: ${env.name}${env.generator_params.num_loc}\n    name: am-${env.name}${env.generator_params.num_loc}\n

Finally, this section specifies the logger configuration. In this case, we are using Weights & Biases (WandB) to log the results of the experiment. We specify the project name, tags, group, and name of the experiment.

That's it! \ud83c\udf89

Tip

For more advanced content and detailed descriptions, you may also check out this notebook!

Now, you are ready to start training. If you save the above under configs/experiment/mynewexperiment.yaml, you can run it from the root of your RL4CO-based project with:

python run.py experiment=mynewexperiment\n

"},{"location":"docs/content/start/installation/","title":"Installation","text":"

RL4CO is now available for installation on pip!

pip install rl4co\n

"},{"location":"docs/content/start/installation/#local-install-and-development","title":"Local install and development","text":"

If you want to develop RL4CO or access the latest builds, we recommend you to install it locally with pip in editable mode:

git clone https://github.com/ai4co/rl4co && cd rl4co\npip install -e .\n

Note: conda is also a good candidate for hassle-free installation of PyTorch: check out the PyTorch website for more details.

"},{"location":"docs/content/start/installation/#minimalistic-example","title":"Minimalistic Example","text":"

Here is a minimalistic example training the Attention Model with greedy rollout baseline on TSP in less than 30 lines of code:

from rl4co.envs.routing import TSPEnv, TSPGenerator\nfrom rl4co.models import AttentionModelPolicy, POMO\nfrom rl4co.utils import RL4COTrainer\n\n# Instantiate generator and environment\ngenerator = TSPGenerator(num_loc=50, loc_distribution=\"uniform\")\nenv = TSPEnv(generator)\n\n# Create policy and RL model\npolicy = AttentionModelPolicy(env_name=env.name, num_encoder_layers=6)\nmodel = POMO(env, policy, batch_size=64, optimizer_kwargs={\"lr\": 1e-4})\n\n# Instantiate Trainer and fit\ntrainer = RL4COTrainer(max_epochs=10, accelerator=\"gpu\", precision=\"16-mixed\")\ntrainer.fit(model)\n

Tip

We recommend checking out our quickstart notebook!

"},{"location":"examples/","title":"\ud83e\udde9 Examples and Tutorials","text":"

This is a collection of examples and tutorials for using the RL4CO library.

The root directory is made of quickstarts and contains the following:

"},{"location":"examples/#quickstarts","title":"\u26a1\ufe0f Quickstarts","text":"

This is the root directory of the examples. The following quickstarts are available:

  • 1-quickstart.ipynb: here we train a model on a simple environment - it takes less than 2 minutes!
  • 2-full-training.ipynb: similar to the previous notebook but with a more interesting environment, with checkpointing, logging, and callbacks.

    - 2b-train-simple.py: here we show a simple script that can be called with python 2b-train-simple.py. This is simplified and does not use Hydra - for those who prefer a simpler setup. Note that we also made a Hydra tutorial here.
  • 3-creating-new-env-model.ipynb: here we show how to extend RL4CO to solve new problems and create new models from zero to hero!

"},{"location":"examples/#folders-index","title":"\ud83d\udcc1 Folders Index","text":""},{"location":"examples/#modeling","title":"Modeling","text":"

Under the modeling/ directory, here are some additional examples for modeling and inference.

"},{"location":"examples/#datasets","title":"Datasets","text":"

Under the datasets/ directory, here are some additional examples for using your custom data to train/evaluate your models.

"},{"location":"examples/#advanced","title":"Advanced","text":"

Under the advanced/ directory, here are some additional examples for advanced topics.

"},{"location":"examples/#other","title":"Other","text":"

Under the other/ directory, here are some additional examples for other topics.

"},{"location":"examples/1-quickstart/","title":"RL4CO Quickstart Notebook","text":"

In this notebook we will train the AttentionModel (AM) on the TSP environment for 20 nodes. On a GPU, this should take less than 2 minutes! \ud83d\ude80

In\u00a0[6]: Copied!
## Uncomment the following line to install the package from PyPI\n## You may need to restart the runtime in Colab after this\n## Remember to choose a GPU runtime for faster training!\n\n# !pip install rl4co\n
## Uncomment the following line to install the package from PyPI ## You may need to restart the runtime in Colab after this ## Remember to choose a GPU runtime for faster training! # !pip install rl4co In\u00a0[7]: Copied!
%load_ext autoreload\n%autoreload 2\n\nimport torch\n\nfrom rl4co.envs import TSPEnv\nfrom rl4co.models import AttentionModelPolicy, REINFORCE\nfrom rl4co.utils.trainer import RL4COTrainer\n
%load_ext autoreload %autoreload 2 import torch from rl4co.envs import TSPEnv from rl4co.models import AttentionModelPolicy, REINFORCE from rl4co.utils.trainer import RL4COTrainer
The autoreload extension is already loaded. To reload it, use:\n  %reload_ext autoreload\n
In\u00a0[8]: Copied!
# RL4CO env based on TorchRL\nenv = TSPEnv(generator_params={'num_loc': 50})\n\n# Policy: neural network, in this case with encoder-decoder architecture\npolicy = AttentionModelPolicy(env_name=env.name, \n                              embed_dim=128,\n                              num_encoder_layers=3,\n                              num_heads=8,\n                            )\n\n# RL Model: REINFORCE and greedy rollout baseline\nmodel = REINFORCE(env, \n                    policy,\n                    baseline=\"rollout\",\n                    batch_size=512,\n                    train_data_size=100_000,\n                    val_data_size=10_000,\n                    optimizer_kwargs={\"lr\": 1e-4},\n                    )\n
# RL4CO env based on TorchRL env = TSPEnv(generator_params={'num_loc': 50}) # Policy: neural network, in this case with encoder-decoder architecture policy = AttentionModelPolicy(env_name=env.name, embed_dim=128, num_encoder_layers=3, num_heads=8, ) # RL Model: REINFORCE and greedy rollout baseline model = REINFORCE(env, policy, baseline=\"rollout\", batch_size=512, train_data_size=100_000, val_data_size=10_000, optimizer_kwargs={\"lr\": 1e-4}, ) In\u00a0[9]: Copied!
# Greedy rollouts over untrained policy\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\ntd_init = env.reset(batch_size=[3]).to(device)\npolicy = policy.to(device)\nout = policy(td_init.clone(), phase=\"test\", decode_type=\"greedy\", return_actions=True)\nactions_untrained = out['actions'].cpu().detach()\nrewards_untrained = out['reward'].cpu().detach()\n\nfor i in range(3):\n    print(f\"Problem {i+1} | Cost: {-rewards_untrained[i]:.3f}\")\n    env.render(td_init[i], actions_untrained[i])\n
# Greedy rollouts over untrained policy device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") td_init = env.reset(batch_size=[3]).to(device) policy = policy.to(device) out = policy(td_init.clone(), phase=\"test\", decode_type=\"greedy\", return_actions=True) actions_untrained = out['actions'].cpu().detach() rewards_untrained = out['reward'].cpu().detach() for i in range(3): print(f\"Problem {i+1} | Cost: {-rewards_untrained[i]:.3f}\") env.render(td_init[i], actions_untrained[i])
Problem 1 | Cost: 10.648\nProblem 2 | Cost: 9.375\nProblem 3 | Cost: 11.713\n
In\u00a0[10]: Copied!
trainer = RL4COTrainer(\n    max_epochs=3,\n    accelerator=\"gpu\",\n    devices=1,\n    logger=None,\n)\n
trainer = RL4COTrainer( max_epochs=3, accelerator=\"gpu\", devices=1, logger=None, )
Using 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\n
In\u00a0[11]: Copied!
trainer.fit(model)\n
trainer.fit(model)
val_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | TSPEnv               | 0     \n1 | policy   | AttentionModelPolicy | 710 K \n2 | baseline | WarmupBaseline       | 710 K \n--------------------------------------------------\n1.4 M     Trainable params\n0         Non-trainable params\n1.4 M     Total params\n5.681     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[12]: Copied!
# Greedy rollouts over trained model (same states as previous plot)\npolicy = model.policy.to(device)\nout = policy(td_init.clone(), phase=\"test\", decode_type=\"greedy\", return_actions=True)\nactions_trained = out['actions'].cpu().detach()\n\n# Plotting\nimport matplotlib.pyplot as plt\nfor i, td in enumerate(td_init):\n    fig, axs = plt.subplots(1,2, figsize=(11,5))\n    env.render(td, actions_untrained[i], ax=axs[0]) \n    env.render(td, actions_trained[i], ax=axs[1])\n    axs[0].set_title(f\"Untrained | Cost = {-rewards_untrained[i].item():.3f}\")\n    axs[1].set_title(r\"Trained $\\pi_\\theta$\" + f\"| Cost = {-out['reward'][i].item():.3f}\")\n
# Greedy rollouts over trained model (same states as previous plot) policy = model.policy.to(device) out = policy(td_init.clone(), phase=\"test\", decode_type=\"greedy\", return_actions=True) actions_trained = out['actions'].cpu().detach() # Plotting import matplotlib.pyplot as plt for i, td in enumerate(td_init): fig, axs = plt.subplots(1,2, figsize=(11,5)) env.render(td, actions_untrained[i], ax=axs[0]) env.render(td, actions_trained[i], ax=axs[1]) axs[0].set_title(f\"Untrained | Cost = {-rewards_untrained[i].item():.3f}\") axs[1].set_title(r\"Trained $\\pi_\\theta$\" + f\"| Cost = {-out['reward'][i].item():.3f}\")

We can see that even after just 3 epochs, our trained AM is able to find much better solutions than the random policy! \ud83c\udf89

In\u00a0[13]: Copied!
# Optionally, save the checkpoint for later use (e.g. in tutorials/4-search-methods.ipynb)\ntrainer.save_checkpoint(\"tsp-quickstart.ckpt\")\n
# Optionally, save the checkpoint for later use (e.g. in tutorials/4-search-methods.ipynb) trainer.save_checkpoint(\"tsp-quickstart.ckpt\")"},{"location":"examples/1-quickstart/#rl4co-quickstart-notebook","title":"RL4CO Quickstart Notebook\u00b6","text":"

Documentation | Getting Started | Usage | Contributing | Paper | Citation

"},{"location":"examples/1-quickstart/#installation","title":"Installation\u00b6","text":""},{"location":"examples/1-quickstart/#imports","title":"Imports\u00b6","text":""},{"location":"examples/1-quickstart/#environment-policy-and-model","title":"Environment, Policy and Model\u00b6","text":"

Full documentation of:https://rl4.co/docs/content/api/envs/base/

  • Base environment class here
  • Base policy class here
  • Base model class here
"},{"location":"examples/1-quickstart/#test-greedy-rollout-with-untrained-model-and-plot","title":"Test greedy rollout with untrained model and plot\u00b6","text":""},{"location":"examples/1-quickstart/#trainer","title":"Trainer\u00b6","text":"

The RL4CO trainer is a wrapper around PyTorch Lightning's Trainer class which adds some functionality and more efficient defaults

"},{"location":"examples/1-quickstart/#fit-the-model","title":"Fit the model\u00b6","text":""},{"location":"examples/1-quickstart/#testing","title":"Testing\u00b6","text":""},{"location":"examples/2-full-training/","title":"Training: Checkpoints, Logging, and Callbacks","text":"

In this notebook we will cover a quickstart training of the Split Delivery Vehicle Routing Problem (SDVRP), with some additional comments along the way. The SDVRP is a variant of the VRP where a vehicle can deliver a part of the demand of a customer and return later to deliver the rest of the demand.

In\u00a0[1]: Copied!
# !pip install rl4co\n\n## NOTE: to install latest version from Github (may be unstable) install from source instead:\n# !pip install git+https://github.com/ai4co/rl4co.git\n
# !pip install rl4co ## NOTE: to install latest version from Github (may be unstable) install from source instead: # !pip install git+https://github.com/ai4co/rl4co.git In\u00a0[2]: Copied!
import torch\nfrom lightning.pytorch.callbacks import ModelCheckpoint, RichModelSummary\n\nfrom rl4co.envs import SDVRPEnv\nfrom rl4co.models.zoo import AttentionModel\nfrom rl4co.utils.trainer import RL4COTrainer\n
import torch from lightning.pytorch.callbacks import ModelCheckpoint, RichModelSummary from rl4co.envs import SDVRPEnv from rl4co.models.zoo import AttentionModel from rl4co.utils.trainer import RL4COTrainer In\u00a0[3]: Copied!
# RL4CO env based on TorchRL\nenv = SDVRPEnv(generator_params=dict(num_loc=20))\n\n# Model: default is AM with REINFORCE and greedy rollout baseline\nmodel = AttentionModel(env,\n                       baseline='rollout',\n                       train_data_size=100_000, # really small size for demo\n                       val_data_size=10_000)\n
# RL4CO env based on TorchRL env = SDVRPEnv(generator_params=dict(num_loc=20)) # Model: default is AM with REINFORCE and greedy rollout baseline model = AttentionModel(env, baseline='rollout', train_data_size=100_000, # really small size for demo val_data_size=10_000)
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n
In\u00a0[4]: Copied!
# Greedy rollouts over untrained policy\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\ntd_init = env.reset(batch_size=[3]).to(device)\npolicy = model.policy.to(device)\nout = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n\n# Plotting\nprint(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\nfor td, actions in zip(td_init, out['actions'].cpu()):\n    env.render(td, actions)\n
# Greedy rollouts over untrained policy device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") td_init = env.reset(batch_size=[3]).to(device) policy = model.policy.to(device) out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\") # Plotting print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\") for td, actions in zip(td_init, out['actions'].cpu()): env.render(td, actions)
Tour lengths: ['29.45', '14.26', '21.15']\n
In\u00a0[5]: Copied!
# Checkpointing callback: save models when validation reward improves\ncheckpoint_callback = ModelCheckpoint(  dirpath=\"checkpoints\", # save to checkpoints/\n                                        filename=\"epoch_{epoch:03d}\",  # save as epoch_XXX.ckpt\n                                        save_top_k=1, # save only the best model\n                                        save_last=True, # save the last model\n                                        monitor=\"val/reward\", # monitor validation reward\n                                        mode=\"max\") # maximize validation reward\n\n# Print model summary\nrich_model_summary = RichModelSummary(max_depth=3)\n\n# Callbacks list\ncallbacks = [checkpoint_callback, rich_model_summary]\n
# Checkpointing callback: save models when validation reward improves checkpoint_callback = ModelCheckpoint( dirpath=\"checkpoints\", # save to checkpoints/ filename=\"epoch_{epoch:03d}\", # save as epoch_XXX.ckpt save_top_k=1, # save only the best model save_last=True, # save the last model monitor=\"val/reward\", # monitor validation reward mode=\"max\") # maximize validation reward # Print model summary rich_model_summary = RichModelSummary(max_depth=3) # Callbacks list callbacks = [checkpoint_callback, rich_model_summary]

We make sure we're logged into W&B so that our experiments can be associated with our account. You may comment out the lines below if you don't want to use it.

In\u00a0[6]: Copied!
# import wandb\n# wandb.login()\n
# import wandb # wandb.login() In\u00a0[7]: Copied!
## Comment following two lines if you don't want logging\nfrom lightning.pytorch.loggers import WandbLogger\n\nlogger = WandbLogger(project=\"rl4co\", name=\"sdvrp-am\")\n\n\n## Keep below if you don't want logging\n# logger = None\n
## Comment following two lines if you don't want logging from lightning.pytorch.loggers import WandbLogger logger = WandbLogger(project=\"rl4co\", name=\"sdvrp-am\") ## Keep below if you don't want logging # logger = None

The Trainer handles the logging, checkpointing and more for you.

In\u00a0[8]: Copied!
from rl4co.utils.trainer import RL4COTrainer\n\ntrainer = RL4COTrainer(\n    max_epochs=2,\n    accelerator=\"gpu\",\n    devices=1,\n    logger=logger,\n    callbacks=callbacks,\n)\n
from rl4co.utils.trainer import RL4COTrainer trainer = RL4COTrainer( max_epochs=2, accelerator=\"gpu\", devices=1, logger=logger, callbacks=callbacks, )
Using 16bit Automatic Mixed Precision (AMP)\nTrainer already configured with model summary callbacks: [<class 'lightning.pytorch.callbacks.rich_model_summary.RichModelSummary'>]. Skipping setting a default `ModelSummary` callback.\nGPU available: True (cuda), used: True\nTrainer already configured with model summary callbacks: [<class 'lightning.pytorch.callbacks.rich_model_summary.RichModelSummary'>]. Skipping setting a default `ModelSummary` callback.\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n
In\u00a0[9]: Copied!
trainer.fit(model)\n
trainer.fit(model)
Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.\n
wandb: Currently logged in as: silab-kaist. Use `wandb login --relogin` to force relogin\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/wandb/sdk/lib/ipython.py:77: DeprecationWarning: Importing display from IPython.core.display is deprecated since IPython 7.14, please import from IPython display\n  from IPython.core.display import HTML, display  # type: ignore\n
wandb version 0.16.6 is available! To upgrade, please run: $ pip install wandb --upgrade Tracking run with wandb version 0.16.5 Run data is saved locally in ./wandb/run-20240428_182146-xcgdzio4 Syncing run sdvrp-am to Weights & Biases (docs) View project at https://wandb.ai/silab-kaist/rl4co View run at https://wandb.ai/silab-kaist/rl4co/runs/xcgdzio4/workspace
val_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n
\u250f\u2501\u2501\u2501\u2501\u2533\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2533\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2533\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2513\n\u2503    \u2503 Name                                   \u2503 Type                  \u2503 Params \u2503\n\u2521\u2501\u2501\u2501\u2501\u2547\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2547\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2547\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2529\n\u2502 0  \u2502 env                                    \u2502 SDVRPEnv              \u2502      0 \u2502\n\u2502 1  \u2502 policy                                 \u2502 AttentionModelPolicy  \u2502  694 K \u2502\n\u2502 2  \u2502 policy.encoder                         \u2502 AttentionModelEncoder \u2502  595 K \u2502\n\u2502 3  \u2502 policy.encoder.init_embedding          \u2502 VRPInitEmbedding      \u2502    896 \u2502\n\u2502 4  \u2502 policy.encoder.net                     \u2502 GraphAttentionNetwork \u2502  594 K \u2502\n\u2502 5  \u2502 policy.decoder                         \u2502 AttentionModelDecoder \u2502 98.8 K \u2502\n\u2502 6  \u2502 policy.decoder.context_embedding       \u2502 VRPContext            \u2502 16.5 K \u2502\n\u2502 7  \u2502 policy.decoder.dynamic_embedding       \u2502 SDVRPDynamicEmbedding \u2502    384 \u2502\n\u2502 8  \u2502 policy.decoder.pointer                 \u2502 
PointerAttention      \u2502 16.4 K \u2502\n\u2502 9  \u2502 policy.decoder.project_node_embeddings \u2502 Linear                \u2502 49.2 K \u2502\n\u2502 10 \u2502 policy.decoder.project_fixed_context   \u2502 Linear                \u2502 16.4 K \u2502\n\u2502 11 \u2502 baseline                               \u2502 WarmupBaseline        \u2502  694 K \u2502\n\u2502 12 \u2502 baseline.baseline                      \u2502 RolloutBaseline       \u2502  694 K \u2502\n\u2502 13 \u2502 baseline.baseline.policy               \u2502 AttentionModelPolicy  \u2502  694 K \u2502\n\u2502 14 \u2502 baseline.warmup_baseline               \u2502 ExponentialBaseline   \u2502      0 \u2502\n\u2514\u2500\u2500\u2500\u2500\u2534\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2534\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2534\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2518\n
Trainable params: 1.4 M                                                                                            \nNon-trainable params: 0                                                                                            \nTotal params: 1.4 M                                                                                                \nTotal estimated model params size (MB): 5                                                                          \n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=2` reached.\n
In\u00a0[10]: Copied!
# Greedy rollouts over trained model (same states as previous plot)\npolicy = model.policy.to(device)\nout = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n\n# Plotting\nprint(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\nfor td, actions in zip(td_init, out['actions'].cpu()):\n    env.render(td, actions)\n
# Greedy rollouts over trained model (same states as previous plot) policy = model.policy.to(device) out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\") # Plotting print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\") for td, actions in zip(td_init, out['actions'].cpu()): env.render(td, actions)
Tour lengths: ['9.12', '7.16', '9.55']\n
In\u00a0[11]: Copied!
trainer.test(model)\n
trainer.test(model)
val_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'test_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Testing: |          | 0/? [00:00<?, ?it/s]
\u250f\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2533\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2513\n\u2503        Test metric        \u2503       DataLoader 0        \u2503\n\u2521\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2547\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2529\n\u2502        test/reward        \u2502    -7.363526344299316     \u2502\n\u2514\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2534\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2518\n
Out[11]:
[{'test/reward': -7.363526344299316}]
In\u00a0[12]: Copied!
# Test generalization to 50 nodes (not going to be great due to few epochs, but hey)\nenv = SDVRPEnv(generator_params=dict(num_loc=50))\n\n# Generate data (100) and set as test dataset\nnew_dataset = env.dataset(50)\ndataloader = model._dataloader(new_dataset, batch_size=100)\n
# Test generalization to 50 nodes (not going to be great due to few epochs, but hey) env = SDVRPEnv(generator_params=dict(num_loc=50)) # Generate data (100) and set as test dataset new_dataset = env.dataset(50) dataloader = model._dataloader(new_dataset, batch_size=100) In\u00a0[15]: Copied!
# Greedy rollouts over trained policy (same states as previous plot, with 20 nodes)\ninit_states = next(iter(dataloader))[:3]\ntd_init_generalization = env.reset(init_states).to(device)\n\npolicy = model.policy.to(device)\nout = policy(td_init_generalization.clone(), env, phase=\"test\", decode_type=\"greedy\")\n\n# Plotting\nprint(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\nfor td, actions in zip(td_init_generalization, out['actions'].cpu()):\n    env.render(td, actions)\n
# Greedy rollouts over trained policy (same states as previous plot, with 20 nodes) init_states = next(iter(dataloader))[:3] td_init_generalization = env.reset(init_states).to(device) policy = model.policy.to(device) out = policy(td_init_generalization.clone(), env, phase=\"test\", decode_type=\"greedy\") # Plotting print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\") for td, actions in zip(td_init_generalization, out['actions'].cpu()): env.render(td, actions)
Tour lengths: ['11.84', '12.49', '12.20']\n
In\u00a0[16]: Copied!
# Environment, Model, and Lightning Module (reinstantiate from scratch)\nmodel = AttentionModel(env,\n                       baseline=\"rollout\",\n                       train_data_size=100_000,\n                       test_data_size=10_000,\n                       optimizer_kwargs={'lr': 1e-4}\n                       )\n\n# Note that by default, Lightning will call checkpoints from newer runs with \"-v{version}\" suffix\n# unless you specify the checkpoint path explicitly\nnew_model_checkpoint = AttentionModel.load_from_checkpoint(\"checkpoints/last.ckpt\", strict=False)\n
# Environment, Model, and Lightning Module (reinstantiate from scratch) model = AttentionModel(env, baseline=\"rollout\", train_data_size=100_000, test_data_size=10_000, optimizer_kwargs={'lr': 1e-4} ) # Note that by default, Lightning will call checkpoints from newer runs with \"-v{version}\" suffix # unless you specify the checkpoint path explicitly new_model_checkpoint = AttentionModel.load_from_checkpoint(\"checkpoints/last.ckpt\", strict=False)
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/core/saving.py:188: Found keys that are not in the model state dict but in the checkpoint: ['baseline.baseline.policy.encoder.init_embedding.init_embed.weight', 'baseline.baseline.policy.encoder.init_embedding.init_embed.bias', 'baseline.baseline.policy.encoder.init_embedding.init_embed_depot.weight', 'baseline.baseline.policy.encoder.init_embedding.init_embed_depot.bias', 'baseline.baseline.policy.encoder.net.layers.0.0.module.Wqkv.weight', 'baseline.baseline.policy.encoder.net.layers.0.0.module.Wqkv.bias', 'baseline.baseline.policy.encoder.net.layers.0.0.module.out_proj.weight', 'baseline.baseline.policy.encoder.net.layers.0.0.module.out_proj.bias', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.0.1.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.0.2.module.0.weight', 'baseline.baseline.policy.encoder.net.layers.0.2.module.0.bias', 'baseline.baseline.policy.encoder.net.layers.0.2.module.2.weight', 'baseline.baseline.policy.encoder.net.layers.0.2.module.2.bias', 
'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.0.3.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.1.0.module.Wqkv.weight', 'baseline.baseline.policy.encoder.net.layers.1.0.module.Wqkv.bias', 'baseline.baseline.policy.encoder.net.layers.1.0.module.out_proj.weight', 'baseline.baseline.policy.encoder.net.layers.1.0.module.out_proj.bias', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.1.1.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.1.2.module.0.weight', 'baseline.baseline.policy.encoder.net.layers.1.2.module.0.bias', 'baseline.baseline.policy.encoder.net.layers.1.2.module.2.weight', 'baseline.baseline.policy.encoder.net.layers.1.2.module.2.bias', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.1.3.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.2.0.module.Wqkv.weight', 'baseline.baseline.policy.encoder.net.layers.2.0.module.Wqkv.bias', 'baseline.baseline.policy.encoder.net.layers.2.0.module.out_proj.weight', 'baseline.baseline.policy.encoder.net.layers.2.0.module.out_proj.bias', 
'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.2.1.normalizer.num_batches_tracked', 'baseline.baseline.policy.encoder.net.layers.2.2.module.0.weight', 'baseline.baseline.policy.encoder.net.layers.2.2.module.0.bias', 'baseline.baseline.policy.encoder.net.layers.2.2.module.2.weight', 'baseline.baseline.policy.encoder.net.layers.2.2.module.2.bias', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.weight', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.bias', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.running_mean', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.running_var', 'baseline.baseline.policy.encoder.net.layers.2.3.normalizer.num_batches_tracked', 'baseline.baseline.policy.decoder.context_embedding.project_context.weight', 'baseline.baseline.policy.decoder.dynamic_embedding.projection.weight', 'baseline.baseline.policy.decoder.pointer.project_out.weight', 'baseline.baseline.policy.decoder.project_node_embeddings.weight', 'baseline.baseline.policy.decoder.project_fixed_context.weight']\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\n

Now we can load both the model and environment from the checkpoint!

In\u00a0[17]: Copied!
# Greedy rollouts over trained model (same states as previous plot, with 20 nodes)\npolicy_new = new_model_checkpoint.policy.to(device)\nenv = new_model_checkpoint.env.to(device)\n\nout = policy_new(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\n\n# Plotting\nprint(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\")\nfor td, actions in zip(td_init, out['actions'].cpu()):\n    env.render(td, actions)\n
# Greedy rollouts over trained model (same states as previous plot, with 20 nodes) policy_new = new_model_checkpoint.policy.to(device) env = new_model_checkpoint.env.to(device) out = policy_new(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\") # Plotting print(f\"Tour lengths: {[f'{-r.item():.2f}' for r in out['reward']]}\") for td, actions in zip(td_init, out['actions'].cpu()): env.render(td, actions)
Tour lengths: ['9.12', '7.16', '9.55']\n
"},{"location":"examples/2-full-training/#training-checkpoints-logging-and-callbacks","title":"Training: Checkpoints, Logging, and Callbacks\u00b6","text":""},{"location":"examples/2-full-training/#installation","title":"Installation\u00b6","text":"

Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!

Note: You may need to restart the runtime in Colab after this

"},{"location":"examples/2-full-training/#imports","title":"Imports\u00b6","text":""},{"location":"examples/2-full-training/#main-setup","title":"Main Setup\u00b6","text":""},{"location":"examples/2-full-training/#environment-model-and-litmodule","title":"Environment, Model and LitModule\u00b6","text":""},{"location":"examples/2-full-training/#test-greedy-rollout-with-untrained-model-and-plot","title":"Test greedy rollout with untrained model and plot\u00b6","text":""},{"location":"examples/2-full-training/#training","title":"Training\u00b6","text":""},{"location":"examples/2-full-training/#callbacks","title":"Callbacks\u00b6","text":"

Here we set up a checkpoint callback to save the best model and another callback for demonstration (a rich model summary). You may check other callbacks here

"},{"location":"examples/2-full-training/#logging","title":"Logging\u00b6","text":"

Here we will use Wandb. You may comment out the lines below if you don't want to use it. You may check other loggers here

"},{"location":"examples/2-full-training/#trainer","title":"Trainer\u00b6","text":"

The RL4CO trainer is a wrapper around PyTorch Lightning's Trainer class which adds some functionality and more efficient defaults

"},{"location":"examples/2-full-training/#fit-the-model","title":"Fit the model\u00b6","text":""},{"location":"examples/2-full-training/#testing","title":"Testing\u00b6","text":""},{"location":"examples/2-full-training/#plotting","title":"Plotting\u00b6","text":"

Here we plot the solution (greedy rollout) of the trained policy to the initial problem

"},{"location":"examples/2-full-training/#test-function","title":"Test function\u00b6","text":"

By default, the dataset is generated or loaded by the environment. You may load a dataset by setting test_file during the env config:

env = SDVRPEnv(\n    ...\n    test_file=\"path/to/test/file\"\n)\n

In this case, we test directly on the generated test dataset

"},{"location":"examples/2-full-training/#test-generalization-to-new-dataset","title":"Test generalization to new dataset\u00b6","text":"

Here we can load a new dataset (with 50 nodes) and test the trained model on it

"},{"location":"examples/2-full-training/#plotting-generalization","title":"Plotting generalization\u00b6","text":""},{"location":"examples/2-full-training/#loading-model","title":"Loading model\u00b6","text":"

Thanks to PyTorch Lightning, we can easily save and load a model to and from a checkpoint! This is declared in the Trainer using the model checkpoint callback. For example, we can load the last model via the last.ckpt file located in the folder we specified in the Trainer.

"},{"location":"examples/2-full-training/#checkpointing","title":"Checkpointing\u00b6","text":""},{"location":"examples/2-full-training/#additional-resources","title":"Additional resources\u00b6","text":"

Documentation | Getting Started | Usage | Contributing | Paper | Citation

Have feedback about this notebook? Feel free to contribute by either opening an issue or a pull request! ;)

"},{"location":"examples/3-creating-new-env-model/","title":"New Environment: Creating and Modeling","text":"

In this notebook, we will show how to extend RL4CO to solve new problems from zero to hero! \ud83d\ude80

In\u00a0[1]: Copied!
## Uncomment the following line to install the package from PyPI\n## You may need to restart the runtime in Colab after this\n## Remember to choose a GPU runtime for faster training!\n\n# !pip install rl4co\n
## Uncomment the following line to install the package from PyPI ## You may need to restart the runtime in Colab after this ## Remember to choose a GPU runtime for faster training! # !pip install rl4co In\u00a0[16]: Copied!
from typing import Optional\nimport torch\nimport torch.nn as nn\n\nfrom tensordict.tensordict import TensorDict\nfrom torchrl.data import (\n    Bounded,\n    Composite,\n    Unbounded,\n    Unbounded,\n)\n\nfrom rl4co.utils.decoding import rollout, random_policy\nfrom rl4co.envs.common import RL4COEnvBase, Generator, get_sampler\nfrom rl4co.models.zoo import AttentionModel, AttentionModelPolicy\nfrom rl4co.utils.ops import gather_by_index, get_tour_length\nfrom rl4co.utils.trainer import RL4COTrainer\n
from typing import Optional import torch import torch.nn as nn from tensordict.tensordict import TensorDict from torchrl.data import ( Bounded, Composite, Unbounded, Unbounded, ) from rl4co.utils.decoding import rollout, random_policy from rl4co.envs.common import RL4COEnvBase, Generator, get_sampler from rl4co.models.zoo import AttentionModel, AttentionModelPolicy from rl4co.utils.ops import gather_by_index, get_tour_length from rl4co.utils.trainer import RL4COTrainer

We will base environment creation on the RL4COEnvBase class, which is based on TorchRL. More information can be found in the documentation!

In\u00a0[2]: Copied!
def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict:\n    # Initialize locations\n    init_locs = td[\"locs\"] if td is not None else None\n    if batch_size is None:\n        batch_size = self.batch_size if init_locs is None else init_locs.shape[:-2]\n    device = init_locs.device if init_locs is not None else self.device\n    self.to(device)\n    if init_locs is None:\n        init_locs = self.generate_data(batch_size=batch_size).to(device)[\"locs\"]\n    batch_size = [batch_size] if isinstance(batch_size, int) else batch_size\n\n    # We do not enforce loading from self for flexibility\n    num_loc = init_locs.shape[-2]\n\n    # Other variables\n    current_node = torch.zeros((batch_size), dtype=torch.int64, device=device)\n    available = torch.ones(\n        (*batch_size, num_loc), dtype=torch.bool, device=device\n    )  # 1 means not visited, i.e. action is allowed\n    i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device)\n\n    return TensorDict(\n        {\n            \"locs\": init_locs,\n            \"first_node\": current_node,\n            \"current_node\": current_node,\n            \"i\": i,\n            \"action_mask\": available,\n            \"reward\": torch.zeros((*batch_size, 1), dtype=torch.float32),\n        },\n        batch_size=batch_size,\n    )\n
def _reset(self, td: Optional[TensorDict] = None, batch_size=None) -> TensorDict: # Initialize locations init_locs = td[\"locs\"] if td is not None else None if batch_size is None: batch_size = self.batch_size if init_locs is None else init_locs.shape[:-2] device = init_locs.device if init_locs is not None else self.device self.to(device) if init_locs is None: init_locs = self.generate_data(batch_size=batch_size).to(device)[\"locs\"] batch_size = [batch_size] if isinstance(batch_size, int) else batch_size # We do not enforce loading from self for flexibility num_loc = init_locs.shape[-2] # Other variables current_node = torch.zeros((batch_size), dtype=torch.int64, device=device) available = torch.ones( (*batch_size, num_loc), dtype=torch.bool, device=device ) # 1 means not visited, i.e. action is allowed i = torch.zeros((*batch_size, 1), dtype=torch.int64, device=device) return TensorDict( { \"locs\": init_locs, \"first_node\": current_node, \"current_node\": current_node, \"i\": i, \"action_mask\": available, \"reward\": torch.zeros((*batch_size, 1), dtype=torch.float32), }, batch_size=batch_size, ) In\u00a0[3]: Copied!
def _step(self, td: TensorDict) -> TensorDict:\n    current_node = td[\"action\"]\n    first_node = current_node if td[\"i\"].all() == 0 else td[\"first_node\"]\n\n    # Set not visited to 0 (i.e., we visited the node)\n    # Note: we may also use a separate function for obtaining the mask for more flexibility\n    available = td[\"action_mask\"].scatter(\n        -1, current_node.unsqueeze(-1).expand_as(td[\"action_mask\"]), 0\n    )\n\n    # We are done there are no unvisited locations\n    done = torch.sum(available, dim=-1) == 0\n\n    # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here\n    reward = torch.zeros_like(done)\n\n    td.update(\n        {\n            \"first_node\": first_node,\n            \"current_node\": current_node,\n            \"i\": td[\"i\"] + 1,\n            \"action_mask\": available,\n            \"reward\": reward,\n            \"done\": done,\n        },\n    )\n    return td\n
def _step(self, td: TensorDict) -> TensorDict: current_node = td[\"action\"] first_node = current_node if td[\"i\"].all() == 0 else td[\"first_node\"] # Set not visited to 0 (i.e., we visited the node) # Note: we may also use a separate function for obtaining the mask for more flexibility available = td[\"action_mask\"].scatter( -1, current_node.unsqueeze(-1).expand_as(td[\"action_mask\"]), 0 ) # We are done there are no unvisited locations done = torch.sum(available, dim=-1) == 0 # The reward is calculated outside via get_reward for efficiency, so we set it to 0 here reward = torch.zeros_like(done) td.update( { \"first_node\": first_node, \"current_node\": current_node, \"i\": td[\"i\"] + 1, \"action_mask\": available, \"reward\": reward, \"done\": done, }, ) return td In\u00a0[4]: Copied!
def get_action_mask(self, td: TensorDict) -> TensorDict:\n    # Here: your logic \n    return td[\"action_mask\"]\n
def get_action_mask(self, td: TensorDict) -> TensorDict: # Here: your logic return td[\"action_mask\"] In\u00a0[5]: Copied!
def check_solution_validity(self, td: TensorDict, actions: torch.Tensor):\n    \"\"\"Check that solution is valid: nodes are visited exactly once\"\"\"\n    assert (\n        torch.arange(actions.size(1), out=actions.data.new())\n        .view(1, -1)\n        .expand_as(actions)\n        == actions.data.sort(1)[0]\n    ).all(), \"Invalid tour\"\n
def check_solution_validity(self, td: TensorDict, actions: torch.Tensor): \"\"\"Check that solution is valid: nodes are visited exactly once\"\"\" assert ( torch.arange(actions.size(1), out=actions.data.new()) .view(1, -1) .expand_as(actions) == actions.data.sort(1)[0] ).all(), \"Invalid tour\" In\u00a0[26]: Copied!
def _get_reward(self, td, actions) -> TensorDict:\n    # Sanity check if enabled\n    if self.check_solution:\n        self.check_solution_validity(td, actions)\n\n    # Gather locations in order of tour and return distance between them (i.e., -reward)\n    locs_ordered = gather_by_index(td[\"locs\"], actions)\n    return -get_tour_length(locs_ordered)\n
def _get_reward(self, td, actions) -> TensorDict: # Sanity check if enabled if self.check_solution: self.check_solution_validity(td, actions) # Gather locations in order of tour and return distance between them (i.e., -reward) locs_ordered = gather_by_index(td[\"locs\"], actions) return -get_tour_length(locs_ordered) In\u00a0[21]: Copied!
def _make_spec(self, generator):\n    \"\"\"Make the observation and action specs from the parameters\"\"\"\n    self.observation_spec = Composite(\n        locs=Bounded(\n            low=self.generator.min_loc,\n            high=self.generator.max_loc,\n            shape=(self.generator.num_loc, 2),\n            dtype=torch.float32,\n        ),\n        first_node=Unbounded(\n            shape=(1),\n            dtype=torch.int64,\n        ),\n        current_node=Unbounded(\n            shape=(1),\n            dtype=torch.int64,\n        ),\n        i=Unbounded(\n            shape=(1),\n            dtype=torch.int64,\n        ),\n        action_mask=Unbounded(\n            shape=(self.generator.num_loc),\n            dtype=torch.bool,\n        ),\n        shape=(),\n    )\n    self.action_spec = Bounded(\n        shape=(1,),\n        dtype=torch.int64,\n        low=0,\n        high=self.generator.num_loc,\n    )\n    self.reward_spec = Unbounded(shape=(1,))\n    self.done_spec = Unbounded(shape=(1,), dtype=torch.bool)\n
def _make_spec(self, generator): \"\"\"Make the observation and action specs from the parameters\"\"\" self.observation_spec = Composite( locs=Bounded( low=self.generator.min_loc, high=self.generator.max_loc, shape=(self.generator.num_loc, 2), dtype=torch.float32, ), first_node=Unbounded( shape=(1), dtype=torch.int64, ), current_node=Unbounded( shape=(1), dtype=torch.int64, ), i=Unbounded( shape=(1), dtype=torch.int64, ), action_mask=Unbounded( shape=(self.generator.num_loc), dtype=torch.bool, ), shape=(), ) self.action_spec = Bounded( shape=(1,), dtype=torch.int64, low=0, high=self.generator.num_loc, ) self.reward_spec = Unbounded(shape=(1,)) self.done_spec = Unbounded(shape=(1,), dtype=torch.bool) In\u00a0[22]: Copied!
class TSPGenerator(Generator):\n    def __init__(\n        self,\n        num_loc: int = 20,\n        min_loc: float = 0.0,\n        max_loc: float = 1.0,\n    ):\n        self.num_loc = num_loc\n        self.min_loc = min_loc\n        self.max_loc = max_loc\n        self.loc_sampler = torch.distributions.Uniform(\n            low=min_loc, high=max_loc\n        )\n\n    def _generate(self, batch_size) -> TensorDict:\n        # Sample locations\n        locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2))\n        return TensorDict({\"locs\": locs}, batch_size=batch_size)\n    \n# Test generator\ngenerator = TSPGenerator(num_loc=20)\nlocs = generator(32)\nprint(locs[\"locs\"].shape)\n
class TSPGenerator(Generator): def __init__( self, num_loc: int = 20, min_loc: float = 0.0, max_loc: float = 1.0, ): self.num_loc = num_loc self.min_loc = min_loc self.max_loc = max_loc self.loc_sampler = torch.distributions.Uniform( low=min_loc, high=max_loc ) def _generate(self, batch_size) -> TensorDict: # Sample locations locs = self.loc_sampler.sample((*batch_size, self.num_loc, 2)) return TensorDict({\"locs\": locs}, batch_size=batch_size) # Test generator generator = TSPGenerator(num_loc=20) locs = generator(32) print(locs[\"locs\"].shape)
torch.Size([32, 20, 2])\n
In\u00a0[23]: Copied!
def render(self, td, actions=None, ax=None):\n    import matplotlib.pyplot as plt\n    import numpy as np\n\n    if ax is None:\n        # Create a plot of the nodes\n        _, ax = plt.subplots()\n\n    td = td.detach().cpu()\n\n    if actions is None:\n        actions = td.get(\"action\", None)\n    # if batch_size greater than 0 , we need to select the first batch element\n    if td.batch_size != torch.Size([]):\n        td = td[0]\n        actions = actions[0]\n\n    locs = td[\"locs\"]\n\n    # gather locs in order of action if available\n    if actions is None:\n        print(\"No action in TensorDict, rendering unsorted locs\")\n    else:\n        actions = actions.detach().cpu()\n        locs = gather_by_index(locs, actions, dim=0)\n\n    # Cat the first node to the end to complete the tour\n    locs = torch.cat((locs, locs[0:1]))\n    x, y = locs[:, 0], locs[:, 1]\n\n    # Plot the visited nodes\n    ax.scatter(x, y, color=\"tab:blue\")\n\n    # Add arrows between visited nodes as a quiver plot\n    dx, dy = np.diff(x), np.diff(y)\n    ax.quiver(\n        x[:-1], y[:-1], dx, dy, scale_units=\"xy\", angles=\"xy\", scale=1, color=\"k\"\n    )\n\n    # Setup limits and show\n    ax.set_xlim(-0.05, 1.05)\n    ax.set_ylim(-0.05, 1.05)\n
def render(self, td, actions=None, ax=None): import matplotlib.pyplot as plt import numpy as np if ax is None: # Create a plot of the nodes _, ax = plt.subplots() td = td.detach().cpu() if actions is None: actions = td.get(\"action\", None) # if batch_size greater than 0 , we need to select the first batch element if td.batch_size != torch.Size([]): td = td[0] actions = actions[0] locs = td[\"locs\"] # gather locs in order of action if available if actions is None: print(\"No action in TensorDict, rendering unsorted locs\") else: actions = actions.detach().cpu() locs = gather_by_index(locs, actions, dim=0) # Cat the first node to the end to complete the tour locs = torch.cat((locs, locs[0:1])) x, y = locs[:, 0], locs[:, 1] # Plot the visited nodes ax.scatter(x, y, color=\"tab:blue\") # Add arrows between visited nodes as a quiver plot dx, dy = np.diff(x), np.diff(y) ax.quiver( x[:-1], y[:-1], dx, dy, scale_units=\"xy\", angles=\"xy\", scale=1, color=\"k\" ) # Setup limits and show ax.set_xlim(-0.05, 1.05) ax.set_ylim(-0.05, 1.05) In\u00a0[28]: Copied!
class TSPEnv(RL4COEnvBase):\n    \"\"\"Traveling Salesman Problem (TSP) environment\"\"\"\n\n    name = \"tsp\"\n\n    def __init__(\n        self,\n        generator = TSPGenerator,\n        generator_params = {},\n        **kwargs,\n    ):\n        super().__init__(**kwargs)\n        self.generator = generator(**generator_params)\n        self._make_spec(self.generator)\n        \n    _reset = _reset\n    _step = _step\n    _get_reward = _get_reward\n    check_solution_validity = check_solution_validity\n    get_action_mask = get_action_mask\n    _make_spec = _make_spec\n    render = render\n
class TSPEnv(RL4COEnvBase): \"\"\"Traveling Salesman Problem (TSP) environment\"\"\" name = \"tsp\" def __init__( self, generator = TSPGenerator, generator_params = {}, **kwargs, ): super().__init__(**kwargs) self.generator = generator(**generator_params) self._make_spec(self.generator) _reset = _reset _step = _step _get_reward = _get_reward check_solution_validity = check_solution_validity get_action_mask = get_action_mask _make_spec = _make_spec render = render In\u00a0[29]: Copied!
batch_size = 2\n\nenv = TSPEnv(generator_params=dict(num_loc=20))\nreward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy)\nenv.render(td, actions)\n
batch_size = 2 env = TSPEnv(generator_params=dict(num_loc=20)) reward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy) env.render(td, actions) In\u00a0[30]: Copied!
class TSPInitEmbedding(nn.Module):\n    \"\"\"Initial embedding for the Traveling Salesman Problems (TSP).\n    Embed the following node features to the embedding space:\n        - locs: x, y coordinates of the cities\n    \"\"\"\n\n    def __init__(self, embed_dim, linear_bias=True):\n        super(TSPInitEmbedding, self).__init__()\n        node_dim = 2  # x, y\n        self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias)\n\n    def forward(self, td):\n        out = self.init_embed(td[\"locs\"])\n        return out\n
class TSPInitEmbedding(nn.Module): \"\"\"Initial embedding for the Traveling Salesman Problems (TSP). Embed the following node features to the embedding space: - locs: x, y coordinates of the cities \"\"\" def __init__(self, embed_dim, linear_bias=True): super(TSPInitEmbedding, self).__init__() node_dim = 2 # x, y self.init_embed = nn.Linear(node_dim, embed_dim, linear_bias) def forward(self, td): out = self.init_embed(td[\"locs\"]) return out In\u00a0[31]: Copied!
class TSPContext(nn.Module):\n    \"\"\"Context embedding for the Traveling Salesman Problem (TSP).\n    Project the following to the embedding space:\n        - first node embedding\n        - current node embedding\n    \"\"\"\n\n    def __init__(self, embed_dim,  linear_bias=True):\n        super(TSPContext, self).__init__()\n        self.W_placeholder = nn.Parameter(\n            torch.Tensor(2 * embed_dim).uniform_(-1, 1)\n        )\n        self.project_context = nn.Linear(\n            embed_dim*2, embed_dim, bias=linear_bias\n        )\n\n    def forward(self, embeddings, td):\n        batch_size = embeddings.size(0)\n        # By default, node_dim = -1 (we only have one node embedding per node)\n        node_dim = (\n            (-1,) if td[\"first_node\"].dim() == 1 else (td[\"first_node\"].size(-1), -1)\n        )\n        if td[\"i\"][(0,) * td[\"i\"].dim()].item() < 1:  # get first item fast\n            context_embedding = self.W_placeholder[None, :].expand(\n                batch_size, self.W_placeholder.size(-1)\n            )\n        else:\n            context_embedding = gather_by_index(\n                embeddings,\n                torch.stack([td[\"first_node\"], td[\"current_node\"]], -1).view(\n                    batch_size, -1\n                ),\n            ).view(batch_size, *node_dim)\n        return self.project_context(context_embedding)\n
class TSPContext(nn.Module): \"\"\"Context embedding for the Traveling Salesman Problem (TSP). Project the following to the embedding space: - first node embedding - current node embedding \"\"\" def __init__(self, embed_dim, linear_bias=True): super(TSPContext, self).__init__() self.W_placeholder = nn.Parameter( torch.Tensor(2 * embed_dim).uniform_(-1, 1) ) self.project_context = nn.Linear( embed_dim*2, embed_dim, bias=linear_bias ) def forward(self, embeddings, td): batch_size = embeddings.size(0) # By default, node_dim = -1 (we only have one node embedding per node) node_dim = ( (-1,) if td[\"first_node\"].dim() == 1 else (td[\"first_node\"].size(-1), -1) ) if td[\"i\"][(0,) * td[\"i\"].dim()].item() < 1: # get first item fast context_embedding = self.W_placeholder[None, :].expand( batch_size, self.W_placeholder.size(-1) ) else: context_embedding = gather_by_index( embeddings, torch.stack([td[\"first_node\"], td[\"current_node\"]], -1).view( batch_size, -1 ), ).view(batch_size, *node_dim) return self.project_context(context_embedding) In\u00a0[32]: Copied!
class StaticEmbedding(nn.Module):\n    def __init__(self, *args, **kwargs):\n        super(StaticEmbedding, self).__init__()\n\n    def forward(self, td):\n        return 0, 0, 0\n
class StaticEmbedding(nn.Module): def __init__(self, *args, **kwargs): super(StaticEmbedding, self).__init__() def forward(self, td): return 0, 0, 0 In\u00a0[33]: Copied!
# Instantiate our environment\nenv = TSPEnv(generator_params=dict(num_loc=20))\n\n# Instantiate policy with the embeddings we created above\nemb_dim = 128\npolicy = AttentionModelPolicy(env_name=env.name, # this is actually not needed since we are initializing the embeddings!\n                              embed_dim=emb_dim,\n                              init_embedding=TSPInitEmbedding(emb_dim),\n                              context_embedding=TSPContext(emb_dim),\n                              dynamic_embedding=StaticEmbedding(emb_dim)\n)\n\n\n# Model: default is AM with REINFORCE and greedy rollout baseline\nmodel = AttentionModel(env, \n                       policy=policy,\n                       baseline='rollout',\n                       train_data_size=100_000,\n                       val_data_size=10_000)\n
# Instantiate our environment env = TSPEnv(generator_params=dict(num_loc=20)) # Instantiate policy with the embeddings we created above emb_dim = 128 policy = AttentionModelPolicy(env_name=env.name, # this is actually not needed since we are initializing the embeddings! embed_dim=emb_dim, init_embedding=TSPInitEmbedding(emb_dim), context_embedding=TSPContext(emb_dim), dynamic_embedding=StaticEmbedding(emb_dim) ) # Model: default is AM with REINFORCE and greedy rollout baseline model = AttentionModel(env, policy=policy, baseline='rollout', train_data_size=100_000, val_data_size=10_000)
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n
In\u00a0[34]: Copied!
# Greedy rollouts over untrained model\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\ntd_init = env.reset(batch_size=[3]).to(device)\npolicy = model.policy.to(device)\nout = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\nactions_untrained = out['actions'].cpu().detach()\nrewards_untrained = out['reward'].cpu().detach()\n\nfor i in range(3):\n    print(f\"Problem {i+1} | Cost: {-rewards_untrained[i]:.3f}\")\n    env.render(td_init[i], actions_untrained[i])\n
# Greedy rollouts over untrained model device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") td_init = env.reset(batch_size=[3]).to(device) policy = model.policy.to(device) out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\") actions_untrained = out['actions'].cpu().detach() rewards_untrained = out['reward'].cpu().detach() for i in range(3): print(f\"Problem {i+1} | Cost: {-rewards_untrained[i]:.3f}\") env.render(td_init[i], actions_untrained[i])
Problem 1 | Cost: 11.545\nProblem 2 | Cost: 8.525\nProblem 3 | Cost: 12.461\n
In\u00a0[35]: Copied!
# We use our own wrapper around Lightning's `Trainer` to make it easier to use\ntrainer = RL4COTrainer(max_epochs=3, devices=1)\ntrainer.fit(model)\n
# We use our own wrapper around Lightning's `Trainer` to make it easier to use trainer = RL4COTrainer(max_epochs=3, devices=1) trainer.fit(model)
Using 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | TSPEnv               | 0     \n1 | policy   | AttentionModelPolicy | 710 K \n2 | baseline | WarmupBaseline       | 710 K \n--------------------------------------------------\n1.4 M     Trainable params\n0         Non-trainable params\n1.4 M     Total params\n5.682     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[36]: Copied!
# Greedy rollouts over trained policy (same states as previous plot)\npolicy = model.policy.to(device)\nout = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\")\nactions_trained = out['actions'].cpu().detach()\n\n# Plotting\nimport matplotlib.pyplot as plt\nfor i, td in enumerate(td_init):\n    fig, axs = plt.subplots(1,2, figsize=(11,5))\n    env.render(td, actions_untrained[i], ax=axs[0]) \n    env.render(td, actions_trained[i], ax=axs[1])\n    axs[0].set_title(f\"Untrained | Cost = {-rewards_untrained[i].item():.3f}\")\n    axs[1].set_title(r\"Trained $\\pi_\\theta$\" + f\"| Cost = {-out['reward'][i].item():.3f}\")\n
# Greedy rollouts over trained policy (same states as previous plot) policy = model.policy.to(device) out = policy(td_init.clone(), env, phase=\"test\", decode_type=\"greedy\") actions_trained = out['actions'].cpu().detach() # Plotting import matplotlib.pyplot as plt for i, td in enumerate(td_init): fig, axs = plt.subplots(1,2, figsize=(11,5)) env.render(td, actions_untrained[i], ax=axs[0]) env.render(td, actions_trained[i], ax=axs[1]) axs[0].set_title(f\"Untrained | Cost = {-rewards_untrained[i].item():.3f}\") axs[1].set_title(r\"Trained $\\pi_\\theta$\" + f\"| Cost = {-out['reward'][i].item():.3f}\")

We can see that solutions are way better than with the untrained model, even just after 3 epochs! \ud83d\ude80

"},{"location":"examples/3-creating-new-env-model/#new-environment-creating-and-modeling","title":"New Environment: Creating and Modeling\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#contents","title":"Contents\u00b6","text":"
  1. Environment
  2. Modeling
  3. Training
  4. Evaluation
"},{"location":"examples/3-creating-new-env-model/#problem-tsp","title":"Problem: TSP\u00b6","text":"

We will build an environment and model for the Traveling Salesman Problem (TSP). The TSP is a well-known combinatorial optimization problem that consists of finding the shortest route that visits each city in a given list exactly once and returns to the origin city. The TSP is NP-hard, and it is one of the most studied problems in combinatorial optimization.

"},{"location":"examples/3-creating-new-env-model/#installation","title":"Installation\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#imports","title":"Imports\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#environment-creation","title":"Environment Creation\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#reset","title":"Reset\u00b6","text":"

The _reset function is used to initialize the environment to an initial state. It returns a TensorDict of the initial state.

"},{"location":"examples/3-creating-new-env-model/#step","title":"Step\u00b6","text":"

Environment _step: this defines the state update of the TSP problem given a TensorDict (td in the code) of the current state and the action to take:

"},{"location":"examples/3-creating-new-env-model/#optional-separate-action-mask-function","title":"[Optional] Separate Action Mask Function\u00b6","text":"

The get_action_mask function simply returns a mask of the valid actions for the current updated state. This can be used in _step and _reset for larger environments with several constraints and may be useful for modularity

"},{"location":"examples/3-creating-new-env-model/#optional-check-solution-validity","title":"[Optional] Check Solution Validity\u00b6","text":"

Another optional utility, this checks whether the solution is feasible and can help identify bugs

"},{"location":"examples/3-creating-new-env-model/#reward-function","title":"Reward function\u00b6","text":"

The _get_reward function is used to evaluate the reward given the solution (actions).

"},{"location":"examples/3-creating-new-env-model/#environment-action-specs","title":"Environment Action Specs\u00b6","text":"

This defines the input and output domains of the environment - similar to Gym's spaces. This is not strictly necessary, but it is useful to have a clear definition of the environment's action and observation spaces and if we want to sample actions using TorchRL's utils

Note: this is actually not necessary, but it is useful to have a clear definition of the environment's action and observation spaces and if we want to sample actions using TorchRL's utils

"},{"location":"examples/3-creating-new-env-model/#data-generator","title":"Data generator\u00b6","text":"

The generator allows us to generate random instances of the problem. Note that this is a simplified example: this can include additional distributions via the rl4co.envs.common.utils.get_sampler method!

"},{"location":"examples/3-creating-new-env-model/#render-function","title":"Render function\u00b6","text":"

The render function is optional, but can be useful for quickly visualizing the results of your algorithm!

"},{"location":"examples/3-creating-new-env-model/#putting-everything-together","title":"Putting everything together\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#modeling","title":"Modeling\u00b6","text":"

Now we need to model the problem by transforming input information into the latent space to be processed. Here we focus on AttentionModel-based embeddings with an encoder-decoder structure. In RL4CO, we divide embeddings in 3 parts:

  • init_embedding: (encoder) embed initial states of the problem
  • context_embedding: (decoder) embed context information of the problem for the current partial solution to modify the query
  • dynamic_embedding: (decoder) embed dynamic information of the problem for the current partial solution to modify the query, key, and value (i.e. if other nodes also change state)
"},{"location":"examples/3-creating-new-env-model/#init-embedding","title":"Init Embedding\u00b6","text":"

Embed initial problem into latent space. In our case, we can project the coordinates of the cities into a latent space.

"},{"location":"examples/3-creating-new-env-model/#context-embedding","title":"Context Embedding\u00b6","text":"

Context embedding takes the current context and returns a vector representation of it. In TSP, we can take the embedding of the first node visited (since we need to complete the tour) as well as the embedding of current node visited (in the first step we just have a placeholder since they are the same).

"},{"location":"examples/3-creating-new-env-model/#dynamic-embedding","title":"Dynamic Embedding\u00b6","text":"

Since the states do not change except for visited nodes, we do not need to modify the keys and values. Therefore, we set this to 0

"},{"location":"examples/3-creating-new-env-model/#training-our-model","title":"Training our Model\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#rollout-untrained-model","title":"Rollout untrained model\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#training-loop","title":"Training loop\u00b6","text":""},{"location":"examples/3-creating-new-env-model/#evaluation","title":"Evaluation\u00b6","text":""},{"location":"examples/advanced/","title":"Advanced","text":"

Collection of advanced examples and tutorials - which at the moment are a bit mixed together.

"},{"location":"examples/advanced/#index","title":"Index","text":"
  • 1-hydra-config.ipynb: here we show how to use Hydra to configure your training and testing scripts.
  • 2-flash-attention-2.ipynb: this notebook shows the effects of different SDPA (Scaled Dot-Product Attention) implementations on the training of a model.
"},{"location":"examples/advanced/1-hydra-config/","title":"Hydra Configuration","text":"In\u00a0[1]: Copied!
from hydra import compose, initialize\nfrom omegaconf import OmegaConf\n\nROOT_DIR = \"../../\" # relative to this file\n
from hydra import compose, initialize from omegaconf import OmegaConf ROOT_DIR = \"../../\" # relative to this file In\u00a0[2]: Copied!
# context initialization\nwith initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n    cfg = compose(config_name=\"main\")\n
# context initialization with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"): cfg = compose(config_name=\"main\")

Hydra stores the configurations in a dictionary-like object called OmegaConf

In\u00a0[3]: Copied!
type(cfg)\n
type(cfg) Out[3]:
omegaconf.dictconfig.DictConfig

The different subfolders in the configs folder are represented as distinct keys in the omegaconf

In\u00a0[4]: Copied!
list(cfg.keys())\n
list(cfg.keys()) Out[4]:
['mode',\n 'tags',\n 'train',\n 'test',\n 'compile',\n 'ckpt_path',\n 'seed',\n 'matmul_precision',\n 'model',\n 'callbacks',\n 'logger',\n 'trainer',\n 'paths',\n 'extras',\n 'env']

Keys can be accessed using the dot notation (e.g. cfg.model) or via normal dictionaries:

In\u00a0[5]: Copied!
print(cfg.model == cfg[\"model\"])\n
print(cfg.model == cfg[\"model\"])
True\n

The dot notation is however more convenient especially in nested structures

In\u00a0[6]: Copied!
print(cfg.model._target_ == cfg[\"model\"][\"_target_\"])\n
print(cfg.model._target_ == cfg[\"model\"][\"_target_\"])
True\n

For example, let's look at the model configuration (which corresponds to the model/default.yaml configuration).

In\u00a0[7]: Copied!
print(OmegaConf.to_yaml(cfg.model))\n
print(OmegaConf.to_yaml(cfg.model))
generate_default_data: true\nmetrics:\n  train:\n  - loss\n  - reward\n  val:\n  - reward\n  test:\n  - reward\n  log_on_step: true\n_target_: rl4co.models.AttentionModel\nbaseline: rollout\nbatch_size: 512\nval_batch_size: 1024\ntest_batch_size: 1024\ntrain_data_size: 1280000\nval_data_size: 10000\ntest_data_size: 10000\noptimizer_kwargs:\n  lr: 0.0001\n\n

If we want to change parts of the configuration, it is generally a good practice to make the changes via the command line when executing the respective python script (in the case of RL4CO for example rl4co/tasks/train.py). For example, if we want to use a different model configuration, we can do something like:

python train.py model=pomo model.batch_size=32\n

Here we use the model/pomo.yaml configuration for the model and also change the batch size during training to 32.

Note: check out the override syntax documentation on the Hydra website for more!

In\u00a0[8]: Copied!
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n    cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"model.batch_size=32\"])\n    print(OmegaConf.to_yaml(cfg.model))\n
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"): cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"model.batch_size=32\"]) print(OmegaConf.to_yaml(cfg.model))
generate_default_data: true\nmetrics:\n  train:\n  - loss\n  - reward\n  val:\n  - reward\n  - max_reward\n  - max_aug_reward\n  test: ${metrics.val}\n  log_on_step: true\n_target_: rl4co.models.POMO\nnum_augment: 8\nbatch_size: 32\nval_batch_size: 1024\ntest_batch_size: 1024\ntrain_data_size: 1280000\nval_data_size: 10000\ntest_data_size: 10000\noptimizer_kwargs:\n  lr: 0.0001\n\n

It is also possible to add new parameters to a config using the + prefix. Using ++ will add a new parameter if it does not exist and overwrite it if it does.

In\u00a0[9]: Copied!
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n    cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"model.batch_size=32\",\"+model.num_starts=10\"])\n    print(OmegaConf.to_yaml(cfg.model))\n
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"): cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"model.batch_size=32\",\"+model.num_starts=10\"]) print(OmegaConf.to_yaml(cfg.model))
generate_default_data: true\nmetrics:\n  train:\n  - loss\n  - reward\n  val:\n  - reward\n  - max_reward\n  - max_aug_reward\n  test: ${metrics.val}\n  log_on_step: true\n_target_: rl4co.models.POMO\nnum_augment: 8\nbatch_size: 32\nval_batch_size: 1024\ntest_batch_size: 1024\ntrain_data_size: 1280000\nval_data_size: 10000\ntest_data_size: 10000\noptimizer_kwargs:\n  lr: 0.0001\nnum_starts: 10\n\n

Likewise, we can also remove unwanted parts of the configuration. For example, if we do not want to use any experiment configuration, we can remove the changes to the configuration made by experiment/base.yaml using the ~ prefix:

In\u00a0[10]: Copied!
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n    cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"~experiment\"])\n    print(OmegaConf.to_yaml(cfg.model))\n
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"): cfg = compose(config_name=\"main\", overrides=[\"model=pomo\",\"~experiment\"]) print(OmegaConf.to_yaml(cfg.model))
generate_default_data: true\nmetrics:\n  train:\n  - loss\n  - reward\n  val:\n  - reward\n  - max_reward\n  - max_aug_reward\n  test: ${metrics.val}\n  log_on_step: true\n_target_: rl4co.models.POMO\nnum_augment: 8\n\n

As you can see, parameters like \"batch_size\" were removed from the model config, as those were set by the experiment config base.yaml. Through the hashbang

# @package _global_\n

in configs/experiment/base.yaml, this configuration is able to make changes to all parts of the configuration (like model, trainer, logger). So instead of adding a new key to the omegaconf object, configurations with a # @package _global_ hashbang typically alter other parts of the configuration.

Another example of such a configuration is the debug/default.yaml, which sets all parameters into a lightweight debugging mode:

In\u00a0[11]: Copied!
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"):\n    cfg = compose(config_name=\"main\", overrides=[\"debug=default\"])\n    print(OmegaConf.to_yaml(cfg.model))\n
with initialize(version_base=None, config_path=ROOT_DIR+\"configs\"): cfg = compose(config_name=\"main\", overrides=[\"debug=default\"]) print(OmegaConf.to_yaml(cfg.model))
generate_default_data: true\nmetrics:\n  train:\n  - loss\n  - reward\n  val:\n  - reward\n  test:\n  - reward\n  log_on_step: true\n_target_: rl4co.models.AttentionModel\nbaseline: rollout\nbatch_size: 8\nval_batch_size: 32\ntest_batch_size: 32\ntrain_data_size: 64\nval_data_size: 1000\ntest_data_size: 1000\noptimizer_kwargs:\n  lr: 0.0001\n\n
"},{"location":"examples/advanced/1-hydra-config/#hydra-configuration","title":"Hydra Configuration\u00b6","text":"

Hydra makes it extremely convenient to configure projects with lots of parameter settings like the RL4CO library.

While you don't need Hydra to use RL4CO, it is recommended to use it for your own projects to make it easier to manage the configuration of your experiments.

Hydra uses config files in .yaml format for this. These files can be found in the configs/ folder, where the subfolders define configurations for specific parts of the framework which are then combined in the main.yaml configuration. In this tutorial we will have a look at how to use these different configuration files and how to add new parameters to the configuration.

"},{"location":"examples/advanced/1-hydra-config/#summary","title":"Summary\u00b6","text":"
  • Reference config files using the CLI flag <key>=<config_file> (e.g. model=am)
  • Add parameters (or even entire keys) to the config using the \"+\" prefix (e.g. +model.batch_size=32)
  • Remove parameters (or even entire keys) from the config using the \"~\" prefix (e.g. ~logger.wandb)
  • The # @package _global_ hashbang allows global access from any config file
  • Turn on debugging mode using debug=default
"},{"location":"examples/advanced/2-flash-attention-2/","title":"Using Flash Attention 2 \u26a1","text":"

In this notebook we will compare Flash Attention 2 with the torch.nn.functional.scaled_dot_product_attention function and a simple implementation.

In\u00a0[1]: Copied!
## Uncomment the following line to install the package from PyPI\n## You may need to restart the runtime in Colab after this\n## Remember to choose a GPU runtime for faster training!\n\n# !pip install rl4co\n
## Uncomment the following line to install the package from PyPI ## You may need to restart the runtime in Colab after this ## Remember to choose a GPU runtime for faster training! # !pip install rl4co In\u00a0[2]: Copied!
import torch\nimport torch.utils.benchmark as benchmark\n\n\n# Simple implementation in PyTorch\nfrom rl4co.models.nn.attention import scaled_dot_product_attention_simple\n# PyTorch official implementation of FlashAttention 1\nfrom torch.nn.functional import scaled_dot_product_attention\n# FlashAttention 2\nfrom rl4co.models.nn.flash_attention import scaled_dot_product_attention_flash_attn\n\nfrom rl4co.envs import TSPEnv\nfrom rl4co.models.zoo.am import AttentionModel\nfrom rl4co.utils.trainer import RL4COTrainer\nfrom rl4co.models.common.constructive.autoregressive import GraphAttentionEncoder\n
import torch import torch.utils.benchmark as benchmark # Simple implementation in PyTorch from rl4co.models.nn.attention import scaled_dot_product_attention_simple # PyTorch official implementation of FlashAttention 1 from torch.nn.functional import scaled_dot_product_attention # FlashAttention 2 from rl4co.models.nn.flash_attention import scaled_dot_product_attention_flash_attn from rl4co.envs import TSPEnv from rl4co.models.zoo.am import AttentionModel from rl4co.utils.trainer import RL4COTrainer from rl4co.models.common.constructive.autoregressive import GraphAttentionEncoder
/home/botu/.local/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n  from .autonotebook import tqdm as notebook_tqdm\n
In\u00a0[3]: Copied!
bs, head, length, d = 64, 8, 512, 128\n\nquery = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\")\nkey = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\")\nvalue = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\")\n\n# Simple implementation in PyTorch\nout_simple = scaled_dot_product_attention_simple(query, key, value)\n\n# PyTorch official implementation of FlashAttention 1\nout_pytorch = scaled_dot_product_attention(query, key, value)\n\n# FlashAttention 2\nout_flash_attn = scaled_dot_product_attention_flash_attn(query, key, value)\n\n\nprint(torch.allclose(out_simple, out_pytorch, atol=1e-3))\nprint(torch.allclose(out_flash_attn, out_pytorch, atol=1e-3))\n\nprint(torch.max(torch.abs(out_simple - out_pytorch)), torch.mean(torch.abs(out_simple - out_pytorch)))\nprint(torch.max(torch.abs(out_flash_attn - out_pytorch)), torch.mean(torch.abs(out_flash_attn - out_pytorch)))\n
bs, head, length, d = 64, 8, 512, 128 query = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\") key = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\") value = torch.rand(bs, head, length, d, dtype=torch.float16, device=\"cuda\") # Simple implementation in PyTorch out_simple = scaled_dot_product_attention_simple(query, key, value) # PyTorch official implementation of FlashAttention 1 out_pytorch = scaled_dot_product_attention(query, key, value) # FlashAttention 2 out_flash_attn = scaled_dot_product_attention_flash_attn(query, key, value) print(torch.allclose(out_simple, out_pytorch, atol=1e-3)) print(torch.allclose(out_flash_attn, out_pytorch, atol=1e-3)) print(torch.max(torch.abs(out_simple - out_pytorch)), torch.mean(torch.abs(out_simple - out_pytorch))) print(torch.max(torch.abs(out_flash_attn - out_pytorch)), torch.mean(torch.abs(out_flash_attn - out_pytorch)))
True\nTrue\ntensor(0.0005, device='cuda:0', dtype=torch.float16) tensor(1.2159e-05, device='cuda:0', dtype=torch.float16)\ntensor(0.0005, device='cuda:0', dtype=torch.float16) tensor(6.3777e-06, device='cuda:0', dtype=torch.float16)\n
In\u00a0[4]: Copied!
env = TSPEnv(generator_params=dict(num_loc=1000))\n\nnum_heads = 8\nembed_dim = 128\nnum_layers = 3\nenc_simple = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n                            sdpa_fn=scaled_dot_product_attention_simple)\n\nenc_fa1 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n                            sdpa_fn=scaled_dot_product_attention)\n\nenc_fa2 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n                            sdpa_fn=scaled_dot_product_attention_flash_attn)\n\n# Flash Attention supports only FP16 and BFloat16\nenc_simple.to(\"cuda\").half()\nenc_fa1.to(\"cuda\").half()\nenc_fa2.to(\"cuda\").half()\n
env = TSPEnv(generator_params=dict(num_loc=1000)) num_heads = 8 embed_dim = 128 num_layers = 3 enc_simple = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers, sdpa_fn=scaled_dot_product_attention_simple) enc_fa1 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers, sdpa_fn=scaled_dot_product_attention) enc_fa2 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers, sdpa_fn=scaled_dot_product_attention_flash_attn) # Flash Attention supports only FP16 and BFloat16 enc_simple.to(\"cuda\").half() enc_fa1.to(\"cuda\").half() enc_fa2.to(\"cuda\").half() Out[4]:
GraphAttentionEncoder(\n  (init_embedding): TSPInitEmbedding(\n    (init_embed): Linear(in_features=2, out_features=128, bias=True)\n  )\n  (net): GraphAttentionNetwork(\n    (layers): Sequential(\n      (0): MultiHeadAttentionLayer(\n        (0): SkipConnection(\n          (module): MultiHeadAttention(\n            (Wqkv): Linear(in_features=128, out_features=384, bias=True)\n            (out_proj): Linear(in_features=128, out_features=128, bias=True)\n          )\n        )\n        (1): Normalization(\n          (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n        )\n        (2): SkipConnection(\n          (module): Sequential(\n            (0): Linear(in_features=128, out_features=512, bias=True)\n            (1): ReLU()\n            (2): Linear(in_features=512, out_features=128, bias=True)\n          )\n        )\n        (3): Normalization(\n          (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n        )\n      )\n      (1): MultiHeadAttentionLayer(\n        (0): SkipConnection(\n          (module): MultiHeadAttention(\n            (Wqkv): Linear(in_features=128, out_features=384, bias=True)\n            (out_proj): Linear(in_features=128, out_features=128, bias=True)\n          )\n        )\n        (1): Normalization(\n          (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n        )\n        (2): SkipConnection(\n          (module): Sequential(\n            (0): Linear(in_features=128, out_features=512, bias=True)\n            (1): ReLU()\n            (2): Linear(in_features=512, out_features=128, bias=True)\n          )\n        )\n        (3): Normalization(\n          (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n        )\n      )\n      (2): MultiHeadAttentionLayer(\n        (0): SkipConnection(\n          (module): MultiHeadAttention(\n            
(Wqkv): Linear(in_features=128, out_features=384, bias=True)\n            (out_proj): Linear(in_features=128, out_features=128, bias=True)\n          )\n        )\n        (1): Normalization(\n          (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n        )\n        (2): SkipConnection(\n          (module): Sequential(\n            (0): Linear(in_features=128, out_features=512, bias=True)\n            (1): ReLU()\n            (2): Linear(in_features=512, out_features=128, bias=True)\n          )\n        )\n        (3): Normalization(\n          (normalizer): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n        )\n      )\n    )\n  )\n)
In\u00a0[5]: Copied!
def build_models(num_heads=8, embed_dim=128, num_layers=3):\n    enc_simple = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n                                sdpa_fn=scaled_dot_product_attention_simple)\n\n    enc_fa1 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n                                sdpa_fn=scaled_dot_product_attention)\n\n    enc_fa2 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers,\n                                sdpa_fn=scaled_dot_product_attention_flash_attn)\n\n    # Flash Attention supports only FP16 and BFloat16\n    enc_simple.to(\"cuda\").half()\n    enc_fa1.to(\"cuda\").half()\n    enc_fa2.to(\"cuda\").half()\n    return enc_simple, enc_fa1, enc_fa2\n
def build_models(num_heads=8, embed_dim=128, num_layers=3): enc_simple = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers, sdpa_fn=scaled_dot_product_attention_simple) enc_fa1 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers, sdpa_fn=scaled_dot_product_attention) enc_fa2 = GraphAttentionEncoder(env, num_heads=num_heads, embed_dim=embed_dim, num_layers=num_layers, sdpa_fn=scaled_dot_product_attention_flash_attn) # Flash Attention supports only FP16 and BFloat16 enc_simple.to(\"cuda\").half() enc_fa1.to(\"cuda\").half() enc_fa2.to(\"cuda\").half() return enc_simple, enc_fa1, enc_fa2 In\u00a0[6]: Copied!
threads = 32\nsizes = [10, 20, 50, 100, 200, 500, 1000, 2000, 5000, 10000]\n\ntimes_simple = []\ntimes_fa1 = []\ntimes_fa2 = []\n\n# for embed_dim in [64, 128, 256]:\nfor embed_dim in [128]:\n    # Get models\n    enc_simple, enc_fa1, enc_fa2 = build_models(embed_dim=embed_dim)\n\n    for problem_size in sizes:\n\n        with torch.no_grad():\n            # initial data\n            env = TSPEnv(generator_params=dict(num_loc=problem_size))\n            td_init = env.reset(batch_size=[2])\n            # set dtype to float16\n            td_init = td_init.to(dest=\"cuda\", dtype=torch.float16)\n\n            t_simple = benchmark.Timer(\n                setup='x = td_init',\n                stmt='encode(x)',\n                globals={'td_init': td_init, 'encode': enc_simple},\n                num_threads=threads)\n\n            t_fa1 = benchmark.Timer(\n                setup='x = td_init',\n                stmt='encode(x)',\n                globals={'td_init': td_init, 'encode': enc_fa1},\n                num_threads=threads)\n            \n            t_fa2 = benchmark.Timer(\n                setup='x = td_init',\n                stmt='encode(x)',\n                globals={'td_init': td_init, 'encode': enc_fa2},\n                num_threads=threads)\n            \n            times_simple.append(torch.tensor(t_simple.blocked_autorange().times).mean())\n            times_fa2.append(torch.tensor(t_fa2.blocked_autorange().times).mean())\n            times_fa1.append(torch.tensor(t_fa1.blocked_autorange().times).mean())\n\n            print(f\"Times for problem size {problem_size}: Simple {times_simple[-1]*1e3:.3f}, FA1 {times_fa1[-1]*1e3:.3f}, FA2 {times_fa2[-1]*1e3:.3f}\")\n\n    # eliminate cache\n    torch.cuda.empty_cache()\n
threads = 32 sizes = [10, 20, 50, 100, 200, 500, 1000, 2000, 5000, 10000] times_simple = [] times_fa1 = [] times_fa2 = [] # for embed_dim in [64, 128, 256]: for embed_dim in [128]: # Get models enc_simple, enc_fa1, enc_fa2 = build_models(embed_dim=embed_dim) for problem_size in sizes: with torch.no_grad(): # initial data env = TSPEnv(generator_params=dict(num_loc=problem_size)) td_init = env.reset(batch_size=[2]) # set dtype to float16 td_init = td_init.to(dest=\"cuda\", dtype=torch.float16) t_simple = benchmark.Timer( setup='x = td_init', stmt='encode(x)', globals={'td_init': td_init, 'encode': enc_simple}, num_threads=threads) t_fa1 = benchmark.Timer( setup='x = td_init', stmt='encode(x)', globals={'td_init': td_init, 'encode': enc_fa1}, num_threads=threads) t_fa2 = benchmark.Timer( setup='x = td_init', stmt='encode(x)', globals={'td_init': td_init, 'encode': enc_fa2}, num_threads=threads) times_simple.append(torch.tensor(t_simple.blocked_autorange().times).mean()) times_fa2.append(torch.tensor(t_fa2.blocked_autorange().times).mean()) times_fa1.append(torch.tensor(t_fa1.blocked_autorange().times).mean()) print(f\"Times for problem size {problem_size}: Simple {times_simple[-1]*1e3:.3f}, FA1 {times_fa1[-1]*1e3:.3f}, FA2 {times_fa2[-1]*1e3:.3f}\") # eliminate cache torch.cuda.empty_cache()
Times for problem size 10: Simple 0.633, FA1 0.511, FA2 0.554\nTimes for problem size 20: Simple 0.646, FA1 0.535, FA2 0.565\nTimes for problem size 50: Simple 0.663, FA1 0.547, FA2 0.580\nTimes for problem size 100: Simple 0.664, FA1 0.547, FA2 0.580\nTimes for problem size 200: Simple 0.670, FA1 0.509, FA2 0.585\nTimes for problem size 500: Simple 0.669, FA1 0.512, FA2 0.582\nTimes for problem size 1000: Simple 1.088, FA1 0.555, FA2 0.609\nTimes for problem size 2000: Simple 3.626, FA1 1.292, FA2 0.790\nTimes for problem size 5000: Simple 20.332, FA1 5.748, FA2 2.943\nTimes for problem size 10000: Simple 80.337, FA1 20.701, FA2 10.230\n
In\u00a0[7]: Copied!
# Plot results\nimport matplotlib.pyplot as plt\n\n\nfig, ax = plt.subplots(1, 1, figsize=(10, 5))\nax.plot(sizes, times_simple, label=\"Simple\")\nax.plot(sizes, times_fa1, label=\"FlashAttention 1\")\nax.plot(sizes, times_fa2, label=\"FlashAttention 2\")\n\n# fancy grid\nax.grid(True, which=\"both\", ls=\"-\", alpha=0.5)\nax.set_xscale(\"log\")\nax.set_yscale(\"log\")\nax.set_xlabel(\"Problem size\")\nax.set_ylabel(\"Time (ms)\")\nax.legend()\n\n# Instead of 10^1, 10^2... show nuber\nax.xaxis.set_major_formatter(plt.FuncFormatter(lambda x, _: f\"{x:.0f}\"))\n\nplt.show()\n
# Plot results import matplotlib.pyplot as plt fig, ax = plt.subplots(1, 1, figsize=(10, 5)) ax.plot(sizes, times_simple, label=\"Simple\") ax.plot(sizes, times_fa1, label=\"FlashAttention 1\") ax.plot(sizes, times_fa2, label=\"FlashAttention 2\") # fancy grid ax.grid(True, which=\"both\", ls=\"-\", alpha=0.5) ax.set_xscale(\"log\") ax.set_yscale(\"log\") ax.set_xlabel(\"Problem size\") ax.set_ylabel(\"Time (ms)\") ax.legend() # Instead of 10^1, 10^2... show nuber ax.xaxis.set_major_formatter(plt.FuncFormatter(lambda x, _: f\"{x:.0f}\")) plt.show()

Using FlashAttention can speed up inference even at small context lengths (number of nodes in the graph). For large graphs, the difference between implementations can be several-fold!

"},{"location":"examples/advanced/2-flash-attention-2/#using-flash-attention-2","title":"Using Flash Attention 2 \u26a1\u00b6","text":""},{"location":"examples/advanced/2-flash-attention-2/#installation","title":"Installation\u00b6","text":"

Follow instructions here: https://github.com/Dao-AILab/flash-attention

"},{"location":"examples/advanced/2-flash-attention-2/#imports","title":"Imports\u00b6","text":""},{"location":"examples/advanced/2-flash-attention-2/#testing-differences-with-simple-tensors","title":"Testing differences with simple tensors\u00b6","text":""},{"location":"examples/advanced/2-flash-attention-2/#testing-graph-attention-encoders-with-flash-attention-2","title":"Testing Graph Attention Encoders with Flash Attention 2\u00b6","text":""},{"location":"examples/advanced/3-local-search/","title":"Local Search","text":"In\u00a0[1]: Copied!
# !pip install rl4co[routing]  # include pyvrp\n
# !pip install rl4co[routing] # include pyvrp In\u00a0[2]: Copied!
import torch\n\nfrom rl4co.envs import TSPEnv\nfrom rl4co.models.zoo import AttentionModel\n
import torch from rl4co.envs import TSPEnv from rl4co.models.zoo import AttentionModel In\u00a0[3]: Copied!
# RL4CO env based on TorchRL\nenv = TSPEnv(num_loc=50) \n\ncheckpoint_path = \"../tsp-quickstart.ckpt\"  # checkpoint from the ../1-quickstart.ipynb\n\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n# Model: default is AM with REINFORCE and greedy rollout baseline\nmodel = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)\n
# RL4CO env based on TorchRL env = TSPEnv(num_loc=50) checkpoint_path = \"../tsp-quickstart.ckpt\" # checkpoint from the ../1-quickstart.ipynb device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") # Model: default is AM with REINFORCE and greedy rollout baseline model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)
/home/sanghyeok/NCO/rl4co/.venv/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/home/sanghyeok/NCO/rl4co/.venv/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n/home/sanghyeok/NCO/rl4co/.venv/lib/python3.10/site-packages/lightning/pytorch/core/saving.py:188: Found keys that are not in the model state dict but in the checkpoint: ['baseline.baseline.model.encoder.init_embedding.init_embed.weight', 'baseline.baseline.model.encoder.init_embedding.init_embed.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_mean', 
'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_var', 
'baseline.baseline.model.encoder.net.layers.2.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.num_batches_tracked', 'baseline.baseline.model.decoder.context_embedding.W_placeholder', 'baseline.baseline.model.decoder.context_embedding.project_context.weight', 'baseline.baseline.model.decoder.project_node_embeddings.weight', 'baseline.baseline.model.decoder.project_fixed_context.weight', 'baseline.baseline.model.decoder.pointer.project_out.weight']\n
In\u00a0[4]: Copied!
# Greedy rollouts over trained model (same states as previous plot)\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\ntd_init = env.reset(batch_size=[3]).to(device)\nmodel = model.to(device)\nout = model(td_init.clone(), phase=\"test\", decode_type=\"greedy\")\nactions = out['actions']\n\n# Improve solutions using LocalSearch\nimproved_actions = env.local_search(td_init, actions, rng=0)\nimproved_rewards = env.get_reward(td_init, improved_actions)\n\n# Plotting\nimport matplotlib.pyplot as plt\nfor i, td in enumerate(td_init):\n    fig, axs = plt.subplots(1,2, figsize=(11,5))\n    env.render(td, actions[i], ax=axs[0]) \n    env.render(td, improved_actions[i], ax=axs[1])\n    axs[0].set_title(f\"Before improvement | Cost = {-out['reward'][i].item():.3f}\")\n    axs[1].set_title(f\"After improvement | Cost = {-improved_rewards[i].item():.3f}\")\n
# Greedy rollouts over trained model (same states as previous plot) device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") td_init = env.reset(batch_size=[3]).to(device) model = model.to(device) out = model(td_init.clone(), phase=\"test\", decode_type=\"greedy\") actions = out['actions'] # Improve solutions using LocalSearch improved_actions = env.local_search(td_init, actions, rng=0) improved_rewards = env.get_reward(td_init, improved_actions) # Plotting import matplotlib.pyplot as plt for i, td in enumerate(td_init): fig, axs = plt.subplots(1,2, figsize=(11,5)) env.render(td, actions[i], ax=axs[0]) env.render(td, improved_actions[i], ax=axs[1]) axs[0].set_title(f\"Before improvement | Cost = {-out['reward'][i].item():.3f}\") axs[1].set_title(f\"After improvement | Cost = {-improved_rewards[i].item():.3f}\")

We can see that the solution has improved after using 2-opt.

"},{"location":"examples/advanced/3-local-search/#local-search","title":"Local Search\u00b6","text":"

In this notebook, we will show how to improve the solution at hand using local search and other techniques. Here we solve TSP and use 2-opt to improve the solution. You can check how the improvement works for other problems in each Env's local_search method.

Note that this notebook is based on 1-quickstart and uses the checkpoint file produced by it. If you haven't gone through that notebook yet, we recommend doing so first.

"},{"location":"examples/advanced/3-local-search/#installation","title":"Installation\u00b6","text":"

We use the LocalSearch operator provided by PyVRP. See https://github.com/PyVRP/PyVRP for more details.

Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!

Note: You may need to restart the runtime in Colab after this

"},{"location":"examples/advanced/3-local-search/#imports","title":"Imports\u00b6","text":""},{"location":"examples/advanced/3-local-search/#environment-policy-and-model-from-saved-checkpoint","title":"Environment, Policy, and Model from saved checkpoint\u00b6","text":""},{"location":"examples/advanced/3-local-search/#testing-with-solution-improvement","title":"Testing with Solution Improvement\u00b6","text":""},{"location":"examples/datasets/","title":"Datasets","text":"

Collection of examples for training and testing with custom datasets.

"},{"location":"examples/datasets/#index","title":"Index","text":"
  • 1-test-on-tsplib.ipynb: here we show how to test a model on the TSPLIB dataset.
  • 2-test-on-cvrplib.ipynb: here we show how to test a model on the CVRPLIB dataset.
"},{"location":"examples/datasets/1-test-on-tsplib/","title":"Testing Model on TSPLib","text":"In\u00a0[3]: Copied!
# !pip install rl4co\n# !pip install tsplib95\n\n## NOTE: to install latest version from Github (may be unstable) install from source instead:\n# !pip install git+https://github.com/ai4co/rl4co.git\n
# !pip install rl4co # !pip install tsplib95 ## NOTE: to install latest version from Github (may be unstable) install from source instead: # !pip install git+https://github.com/ai4co/rl4co.git In\u00a0[4]: Copied!
%load_ext autoreload\n%autoreload 2\n\nimport torch\nfrom tensordict import TensorDict\n\nfrom rl4co.envs import TSPEnv\nfrom rl4co.models.zoo.am import AttentionModelPolicy\nfrom rl4co.models.rl import REINFORCE\nfrom rl4co.utils.trainer import RL4COTrainer\n
%load_ext autoreload %autoreload 2 import torch from tensordict import TensorDict from rl4co.envs import TSPEnv from rl4co.models.zoo.am import AttentionModelPolicy from rl4co.models.rl import REINFORCE from rl4co.utils.trainer import RL4COTrainer In\u00a0[5]: Copied!
import requests, tarfile, os, gzip, shutil\nfrom tqdm.auto import tqdm\nfrom tsplib95.loaders import load_problem, load_solution\n\ndef download_and_extract_tsplib(url, directory=\"tsplib\", delete_after_unzip=True):\n    os.makedirs(directory, exist_ok=True)\n    \n    # Download with progress bar\n    with requests.get(url, stream=True) as r:\n        r.raise_for_status()\n        total_size = int(r.headers.get('content-length', 0))\n        with open(\"tsplib.tar.gz\", 'wb') as f, tqdm(total=total_size, unit='B', unit_scale=True) as pbar:\n            for chunk in r.iter_content(8192):\n                f.write(chunk)\n                pbar.update(len(chunk))\n\n    # Extract tar.gz\n    with tarfile.open(\"tsplib.tar.gz\", 'r:gz') as tar:\n        tar.extractall(directory)\n\n    # Decompress .gz files inside directory\n    for root, _, files in os.walk(directory):\n        for file in files:\n            if file.endswith(\".gz\"):\n                path = os.path.join(root, file)\n                with gzip.open(path, 'rb') as f_in, open(path[:-3], 'wb') as f_out:\n                    shutil.copyfileobj(f_in, f_out)\n                os.remove(path)\n\n    if delete_after_unzip:\n        os.remove(\"tsplib.tar.gz\")\n\n# Download and extract all tsp files under tsplib directory\ndownload_and_extract_tsplib(\"http://comopt.ifi.uni-heidelberg.de/software/TSPLIB95/tsp/ALL_tsp.tar.gz\")\n
import requests, tarfile, os, gzip, shutil from tqdm.auto import tqdm from tsplib95.loaders import load_problem, load_solution def download_and_extract_tsplib(url, directory=\"tsplib\", delete_after_unzip=True): os.makedirs(directory, exist_ok=True) # Download with progress bar with requests.get(url, stream=True) as r: r.raise_for_status() total_size = int(r.headers.get('content-length', 0)) with open(\"tsplib.tar.gz\", 'wb') as f, tqdm(total=total_size, unit='B', unit_scale=True) as pbar: for chunk in r.iter_content(8192): f.write(chunk) pbar.update(len(chunk)) # Extract tar.gz with tarfile.open(\"tsplib.tar.gz\", 'r:gz') as tar: tar.extractall(directory) # Decompress .gz files inside directory for root, _, files in os.walk(directory): for file in files: if file.endswith(\".gz\"): path = os.path.join(root, file) with gzip.open(path, 'rb') as f_in, open(path[:-3], 'wb') as f_out: shutil.copyfileobj(f_in, f_out) os.remove(path) if delete_after_unzip: os.remove(\"tsplib.tar.gz\") # Download and extract all tsp files under tsplib directory download_and_extract_tsplib(\"http://comopt.ifi.uni-heidelberg.de/software/TSPLIB95/tsp/ALL_tsp.tar.gz\")
  0%|          | 0.00/2.02M [00:00<?, ?B/s]
In\u00a0[6]: Copied!
# Load the problem from TSPLib\ntsplib_dir = './tsplib'# modify this to the directory of your prepared files\nfiles = os.listdir(tsplib_dir)\nproblem_files_full = [file for file in files if file.endswith('.tsp')]\n\n# Load the optimal solution files from TSPLib\nsolution_files = [file for file in files if file.endswith('.opt.tour')]\n
# Load the problem from TSPLib tsplib_dir = './tsplib'# modify this to the directory of your prepared files files = os.listdir(tsplib_dir) problem_files_full = [file for file in files if file.endswith('.tsp')] # Load the optimal solution files from TSPLib solution_files = [file for file in files if file.endswith('.opt.tour')] In\u00a0[7]: Copied!
problems = []\n# Load only problems with solution files\nfor sol_file in solution_files:\n    prob_file = sol_file.replace('.opt.tour', '.tsp')\n    problem = load_problem(os.path.join(tsplib_dir, prob_file))\n\n    # NOTE: in some problem files (e.g. hk48), the node coordinates are not available\n    # we temporarily skip these problems\n    if not len(problem.node_coords):\n        continue\n    \n    node_coords = torch.tensor([v for v in problem.node_coords.values()])\n    solution = load_solution(os.path.join(tsplib_dir, sol_file))\n    \n    problems.append({\n        \"name\": sol_file.replace('.opt.tour', ''),\n        \"node_coords\": node_coords,\n        \"solution\": solution.tours[0],\n        \"dimension\": problem.dimension\n    })\n    \n    \n# order by dimension\nproblems = sorted(problems, key=lambda x: x['dimension'])\n
problems = [] # Load only problems with solution files for sol_file in solution_files: prob_file = sol_file.replace('.opt.tour', '.tsp') problem = load_problem(os.path.join(tsplib_dir, prob_file)) # NOTE: in some problem files (e.g. hk48), the node coordinates are not available # we temporarily skip these problems if not len(problem.node_coords): continue node_coords = torch.tensor([v for v in problem.node_coords.values()]) solution = load_solution(os.path.join(tsplib_dir, sol_file)) problems.append({ \"name\": sol_file.replace('.opt.tour', ''), \"node_coords\": node_coords, \"solution\": solution.tours[0], \"dimension\": problem.dimension }) # order by dimension problems = sorted(problems, key=lambda x: x['dimension'])
/tmp/ipykernel_76573/449557851.py:5: DeprecationWarning: Call to deprecated function (or staticmethod) load_problem. (Will be removed in newer versions. Use `tsplib95.load` instead.) -- Deprecated since version 7.0.0.\n  problem = load_problem(os.path.join(tsplib_dir, prob_file))\n/tmp/ipykernel_76573/449557851.py:13: DeprecationWarning: Call to deprecated function (or staticmethod) load_solution. (Will be removed in newer versions. Use `tsplib95.load` instead.) -- Deprecated since version 7.0.0.\n  solution = load_solution(os.path.join(tsplib_dir, sol_file))\n
In\u00a0[8]: Copied!
# Utils function: we will normalize the coordinates of the VRP instances\ndef normalize_coord(coord:torch.Tensor) -> torch.Tensor:\n    x, y = coord[:, 0], coord[:, 1]\n    x_min, x_max = x.min(), x.max()\n    y_min, y_max = y.min(), y.max()\n    x_scaled = (x - x_min) / (x_max - x_min) \n    y_scaled = (y - y_min) / (y_max - y_min)\n    coord_scaled = torch.stack([x_scaled, y_scaled], dim=1)\n    return coord_scaled \n\ndef tsplib_to_td(problem, normalize=True):\n    coords = torch.tensor(problem['node_coords']).float()\n    coords_norm = normalize_coord(coords) if normalize else coords\n    td = TensorDict({\n        'locs': coords_norm,\n    })\n    td = td[None] # add batch dimension, in this case just 1\n    return td\n
# Utils function: we will normalize the coordinates of the VRP instances def normalize_coord(coord:torch.Tensor) -> torch.Tensor: x, y = coord[:, 0], coord[:, 1] x_min, x_max = x.min(), x.max() y_min, y_max = y.min(), y.max() x_scaled = (x - x_min) / (x_max - x_min) y_scaled = (y - y_min) / (y_max - y_min) coord_scaled = torch.stack([x_scaled, y_scaled], dim=1) return coord_scaled def tsplib_to_td(problem, normalize=True): coords = torch.tensor(problem['node_coords']).float() coords_norm = normalize_coord(coords) if normalize else coords td = TensorDict({ 'locs': coords_norm, }) td = td[None] # add batch dimension, in this case just 1 return td In\u00a0[9]: Copied!
device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n# RL4CO env based on TorchRL\nenv = TSPEnv(generator_params={'num_loc': 50})\n\n# Policy: neural network, in this case with encoder-decoder architecture\npolicy = AttentionModelPolicy(env_name=env.name).to(device)\n\n# RL Model: REINFORCE and greedy rollout baseline\nmodel = REINFORCE(env, \n                    policy,\n                    baseline=\"rollout\",\n                    batch_size=512,\n                    train_data_size=100_000,\n                    val_data_size=10_000,\n                    optimizer_kwargs={\"lr\": 1e-4},\n                    )\n
device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") # RL4CO env based on TorchRL env = TSPEnv(generator_params={'num_loc': 50}) # Policy: neural network, in this case with encoder-decoder architecture policy = AttentionModelPolicy(env_name=env.name).to(device) # RL Model: REINFORCE and greedy rollout baseline model = REINFORCE(env, policy, baseline=\"rollout\", batch_size=512, train_data_size=100_000, val_data_size=10_000, optimizer_kwargs={\"lr\": 1e-4}, )
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n
In\u00a0[10]: Copied!
tds, actions = [], []\n\npolicy = policy.eval()\nfor problem in problems:\n\n    with torch.inference_mode():\n        td_reset = env.reset(tsplib_to_td(problem)).to(device)\n        out = policy(td_reset.clone(), env, decode_type = \"greedy\")\n        unnormalized_td = env.reset(tsplib_to_td(problem, normalize=False)).to(device)\n        cost = -env.get_reward(unnormalized_td, out[\"actions\"]).item() # unnormalized cost\n        \n    bks_sol = (torch.tensor(problem['solution'], device=device, dtype=torch.int64) - 1)[None]\n    bks_cost = -env.get_reward(unnormalized_td, bks_sol)\n    \n    tds.append(tsplib_to_td(problem))\n    actions.append(out[\"actions\"])\n    \n    gap = (cost - bks_cost.item()) / bks_cost.item()\n            \n    print(f\"Problem: {problem['name']:<15} Cost: {cost:<14.4f} BKS: {bks_cost.item():<10.4f}\\t Gap: {gap:.2%}\")\n
tds, actions = [], [] policy = policy.eval() for problem in problems: with torch.inference_mode(): td_reset = env.reset(tsplib_to_td(problem)).to(device) out = policy(td_reset.clone(), env, decode_type = \"greedy\") unnormalized_td = env.reset(tsplib_to_td(problem, normalize=False)).to(device) cost = -env.get_reward(unnormalized_td, out[\"actions\"]).item() # unnormalized cost bks_sol = (torch.tensor(problem['solution'], device=device, dtype=torch.int64) - 1)[None] bks_cost = -env.get_reward(unnormalized_td, bks_sol) tds.append(tsplib_to_td(problem)) actions.append(out[\"actions\"]) gap = (cost - bks_cost.item()) / bks_cost.item() print(f\"Problem: {problem['name']:<15} Cost: {cost:<14.4f} BKS: {bks_cost.item():<10.4f}\\t Gap: {gap:.2%}\")
/tmp/ipykernel_76573/1596842480.py:12: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n  coords = torch.tensor(problem['node_coords']).float()\n
Problem: ulysses16       Cost: 160.6761       BKS: 74.1087   \t Gap: 116.81%\nProblem: ulysses22       Cost: 173.5413       BKS: 75.6651   \t Gap: 129.35%\nProblem: att48           Cost: 86775.2031     BKS: 33523.7109\t Gap: 158.85%\nProblem: eil51           Cost: 1256.7629      BKS: 429.9833  \t Gap: 192.28%\nProblem: berlin52        Cost: 15761.3652     BKS: 7544.3662 \t Gap: 108.92%\nProblem: st70            Cost: 2429.2407      BKS: 678.5975  \t Gap: 257.98%\nProblem: pr76            Cost: 358580.5000    BKS: 108159.4375\t Gap: 231.53%\nProblem: eil76           Cost: 1801.1833      BKS: 545.3876  \t Gap: 230.26%\nProblem: gr96            Cost: 1714.3306      BKS: 512.3093  \t Gap: 234.63%\nProblem: rd100           Cost: 30248.6816     BKS: 7910.3960 \t Gap: 282.39%\nProblem: kroD100         Cost: 80604.9609     BKS: 21294.2930\t Gap: 278.53%\nProblem: kroC100         Cost: 61475.9688     BKS: 20750.7617\t Gap: 196.26%\nProblem: kroA100         Cost: 86844.4609     BKS: 21285.4414\t Gap: 308.00%\nProblem: eil101          Cost: 2444.7129      BKS: 642.3096  \t Gap: 280.61%\nProblem: lin105          Cost: 56784.3906     BKS: 14382.9961\t Gap: 294.80%\nProblem: ch130           Cost: 26669.8164     BKS: 6110.8608 \t Gap: 336.43%\nProblem: ch150           Cost: 32037.0078     BKS: 6532.2812 \t Gap: 390.44%\nProblem: gr202           Cost: 2277.4905      BKS: 549.9980  \t Gap: 314.09%\nProblem: tsp225          Cost: 24270.3203     BKS: 3859.0000 \t Gap: 528.93%\nProblem: a280            Cost: 17521.9512     BKS: 2586.7695 \t Gap: 577.37%\nProblem: pcb442          Cost: 445898.6250    BKS: 50783.5469\t Gap: 778.04%\nProblem: gr666           Cost: 37270.4531     BKS: 3952.5356 \t Gap: 842.95%\nProblem: pr1002          Cost: 3692658.0000   BKS: 259066.6719\t Gap: 1325.37%\nProblem: pr2392          Cost: 11149681.0000  BKS: 378062.8125\t Gap: 2849.16%\n
In\u00a0[11]: Copied!
# Plot some instances\nenv.render(tds[0], actions[0].cpu())\nenv.render(tds[-2], actions[-2].cpu())\nenv.render(tds[-1], actions[-1].cpu())\n
# Plot some instances env.render(tds[0], actions[0].cpu()) env.render(tds[-2], actions[-2].cpu()) env.render(tds[-1], actions[-1].cpu()) In\u00a0[\u00a0]: Copied!
trainer = RL4COTrainer(\n    max_epochs=3,\n    accelerator=\"gpu\",\n    devices=1,\n    logger=None,\n)\n\ntrainer.fit(model)\n
trainer = RL4COTrainer( max_epochs=3, accelerator=\"gpu\", devices=1, logger=None, ) trainer.fit(model)
Using 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | TSPEnv               | 0     \n1 | policy   | AttentionModelPolicy | 710 K \n2 | baseline | WarmupBaseline       | 710 K \n--------------------------------------------------\n1.4 M     Trainable params\n0         Non-trainable params\n1.4 M     Total params\n5.681     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[13]: Copied!
tds, actions = [], []\n\npolicy = model.policy.eval().to(device)\nfor problem in problems:\n\n    with torch.inference_mode():\n        td_reset = env.reset(tsplib_to_td(problem)).to(device)\n        out = policy(td_reset.clone(), env, decode_type = \"greedy\")\n        unnormalized_td = env.reset(tsplib_to_td(problem, normalize=False)).to(device)\n        cost = -env.get_reward(unnormalized_td, out[\"actions\"]).item() # unnormalized cost\n        \n    bks_sol = (torch.tensor(problem['solution'], device=device, dtype=torch.int64) - 1)[None]\n    bks_cost = -env.get_reward(unnormalized_td, bks_sol)\n    \n    tds.append(tsplib_to_td(problem))\n    actions.append(out[\"actions\"])\n    \n    gap = (cost - bks_cost.item()) / bks_cost.item()\n            \n    print(f\"Problem: {problem['name']:<15} Cost: {cost:<14.4f} BKS: {bks_cost.item():<10.4f}\\t Gap: {gap:.2%}\")\n
tds, actions = [], [] policy = model.policy.eval().to(device) for problem in problems: with torch.inference_mode(): td_reset = env.reset(tsplib_to_td(problem)).to(device) out = policy(td_reset.clone(), env, decode_type = \"greedy\") unnormalized_td = env.reset(tsplib_to_td(problem, normalize=False)).to(device) cost = -env.get_reward(unnormalized_td, out[\"actions\"]).item() # unnormalized cost bks_sol = (torch.tensor(problem['solution'], device=device, dtype=torch.int64) - 1)[None] bks_cost = -env.get_reward(unnormalized_td, bks_sol) tds.append(tsplib_to_td(problem)) actions.append(out[\"actions\"]) gap = (cost - bks_cost.item()) / bks_cost.item() print(f\"Problem: {problem['name']:<15} Cost: {cost:<14.4f} BKS: {bks_cost.item():<10.4f}\\t Gap: {gap:.2%}\")
/tmp/ipykernel_76573/1596842480.py:12: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n  coords = torch.tensor(problem['node_coords']).float()\n
Problem: ulysses16       Cost: 82.6168        BKS: 74.1087   \t Gap: 11.48%\nProblem: ulysses22       Cost: 88.0642        BKS: 75.6651   \t Gap: 16.39%\nProblem: att48           Cost: 39196.7305     BKS: 33523.7109\t Gap: 16.92%\nProblem: eil51           Cost: 529.8539       BKS: 429.9833  \t Gap: 23.23%\nProblem: berlin52        Cost: 9453.5234      BKS: 7544.3662 \t Gap: 25.31%\nProblem: st70            Cost: 861.5684       BKS: 678.5975  \t Gap: 26.96%\nProblem: pr76            Cost: 138428.1250    BKS: 108159.4375\t Gap: 27.99%\nProblem: eil76           Cost: 673.4647       BKS: 545.3876  \t Gap: 23.48%\nProblem: gr96            Cost: 633.9059       BKS: 512.3093  \t Gap: 23.74%\nProblem: rd100           Cost: 10517.4844     BKS: 7910.3960 \t Gap: 32.96%\nProblem: kroD100         Cost: 33366.3086     BKS: 21294.2930\t Gap: 56.69%\nProblem: kroC100         Cost: 31602.7129     BKS: 20750.7617\t Gap: 52.30%\nProblem: kroA100         Cost: 30531.9688     BKS: 21285.4414\t Gap: 43.44%\nProblem: eil101          Cost: 870.1373       BKS: 642.3096  \t Gap: 35.47%\nProblem: lin105          Cost: 31638.4492     BKS: 14382.9961\t Gap: 119.97%\nProblem: ch130           Cost: 7974.3115      BKS: 6110.8608 \t Gap: 30.49%\nProblem: ch150           Cost: 9568.7695      BKS: 6532.2812 \t Gap: 46.48%\nProblem: gr202           Cost: 900.7198       BKS: 549.9980  \t Gap: 63.77%\nProblem: tsp225          Cost: 6863.4614      BKS: 3859.0000 \t Gap: 77.86%\nProblem: a280            Cost: 4896.9160      BKS: 2586.7695 \t Gap: 89.31%\nProblem: pcb442          Cost: 90279.2500     BKS: 50783.5469\t Gap: 77.77%\nProblem: gr666           Cost: 5742.3789      BKS: 3952.5356 \t Gap: 45.28%\nProblem: pr1002          Cost: 575474.1250    BKS: 259066.6719\t Gap: 122.13%\nProblem: pr2392          Cost: 1145526.0000   BKS: 378062.8125\t Gap: 203.00%\n
In\u00a0[14]: Copied!
# Plot some instances\nenv.render(tds[0], actions[0].cpu())\nenv.render(tds[-2], actions[-2].cpu())\nenv.render(tds[-1], actions[-1].cpu())\n
# Plot some instances env.render(tds[0], actions[0].cpu()) env.render(tds[-2], actions[-2].cpu()) env.render(tds[-1], actions[-1].cpu())

Great! We can see that the performance vastly improved even with just a few minutes of training.

There are several ways to improve the model's performance further, such as:

  • Training for more steps
  • Using a different model architecture
  • Using a different training algorithm
  • Using different hyperparameters
  • Using a different Generator
  • ... and many more!
"},{"location":"examples/datasets/1-test-on-tsplib/#testing-model-on-tsplib","title":"Testing Model on TSPLib\u00b6","text":"

In this notebook, we will test the trained model's performance on the TSPLib benchmark.

TSPLib is a collection of instances related to the TSP, which is a classic optimization challenge in the field of logistics and transportation.

"},{"location":"examples/datasets/1-test-on-tsplib/#installation","title":"Installation\u00b6","text":"

Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!

Note: You may need to restart the runtime in Colab after installing the package.

"},{"location":"examples/datasets/1-test-on-tsplib/#imports","title":"Imports\u00b6","text":""},{"location":"examples/datasets/1-test-on-tsplib/#utils-download-and-load-tsplib-instances-in-rl4co","title":"Utils: download and load TSPLib instances in RL4CO\u00b6","text":""},{"location":"examples/datasets/1-test-on-tsplib/#test-an-untrained-model","title":"Test an untrained model\u00b6","text":""},{"location":"examples/datasets/1-test-on-tsplib/#train","title":"Train\u00b6","text":"

We will train for a few steps just to show the effects of training a model. Alternatively, we can load a pretrained checkpoint, e.g. with:

model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)\n
"},{"location":"examples/datasets/1-test-on-tsplib/#test-trained-model","title":"Test trained model\u00b6","text":""},{"location":"examples/datasets/2-test-on-cvrplib/","title":"Testing Model on VRPLib","text":"In\u00a0[\u00a0]: Copied!
# !pip install rl4co[graph] # include torch-geometric\n# !pip install vrplib # for reading instance files\n\n## NOTE: to install latest version from Github (may be unstable) install from source instead:\n# !pip install git+https://github.com/ai4co/rl4co.git\n
# !pip install rl4co[graph] # include torch-geometric # !pip install vrplib # for reading instance files ## NOTE: to install latest version from Github (may be unstable) install from source instead: # !pip install git+https://github.com/ai4co/rl4co.git In\u00a0[2]: Copied!
# Install the `vrplib` package\n# !pip install vrplib\n
# Install the `vrplib` package # !pip install vrplib In\u00a0[3]: Copied!
%load_ext autoreload\n%autoreload 2\n\nimport os\nimport torch\nimport vrplib\nfrom tensordict import TensorDict\n\nfrom rl4co.envs import CVRPEnv\nfrom rl4co.models.zoo.am import AttentionModelPolicy\nfrom rl4co.models.rl import REINFORCE\nfrom rl4co.utils.trainer import RL4COTrainer\n\nfrom tqdm import tqdm\n
%load_ext autoreload %autoreload 2 import os import torch import vrplib from tensordict import TensorDict from rl4co.envs import CVRPEnv from rl4co.models.zoo.am import AttentionModelPolicy from rl4co.models.rl import REINFORCE from rl4co.utils.trainer import RL4COTrainer from tqdm import tqdm
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/fabric/__init__.py:41: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:3144: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('sphinxcontrib')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n  declare_namespace(pkg)\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/fabric/__init__.py:41: Deprecated call to `pkg_resources.declare_namespace('lightning.fabric')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2553: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n  declare_namespace(parent)\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/__init__.py:37: Deprecated call to `pkg_resources.declare_namespace('lightning.pytorch')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. 
See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2553: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n  declare_namespace(parent)\n
In\u00a0[4]: Copied!
device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n# RL4CO env based on TorchRL\nenv = CVRPEnv(generator_params={'num_loc': 50})\n\n# Policy: neural network, in this case with encoder-decoder architecture\npolicy = AttentionModelPolicy(env_name=env.name).to(device)\n\n# RL Model: REINFORCE and greedy rollout baseline\nmodel = REINFORCE(env, \n                    policy,\n                    baseline=\"rollout\",\n                    batch_size=512,\n                    train_data_size=100_000,\n                    val_data_size=10_000,\n                    optimizer_kwargs={\"lr\": 1e-4},\n                    )\n
device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") # RL4CO env based on TorchRL env = CVRPEnv(generator_params={'num_loc': 50}) # Policy: neural network, in this case with encoder-decoder architecture policy = AttentionModelPolicy(env_name=env.name).to(device) # RL Model: REINFORCE and greedy rollout baseline model = REINFORCE(env, policy, baseline=\"rollout\", batch_size=512, train_data_size=100_000, val_data_size=10_000, optimizer_kwargs={\"lr\": 1e-4}, )
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n
In\u00a0[5]: Copied!
problem_names = vrplib.list_names(low=50, high=100, vrp_type='cvrp') \n\ninstances = [] # Collect Set A, B, E, F, M datasets\nfor name in problem_names:\n    if 'A' in name:\n        instances.append(name)\n    elif 'B' in name:\n        instances.append(name)\n    elif 'E' in name:\n        instances.append(name)\n    elif 'F' in name:\n        instances.append(name)\n    elif 'M' in name and 'CMT' not in name:\n        instances.append(name)\n\n# Modify the path you want to save \n# Note: we don't have to create this folder in advance\npath_to_save = './vrplib/' \n\ntry:\n    os.makedirs(path_to_save)\n    for instance in tqdm(instances):\n        vrplib.download_instance(instance, path_to_save)\n        vrplib.download_solution(instance, path_to_save)\nexcept: # already exist\n    pass\n
problem_names = vrplib.list_names(low=50, high=100, vrp_type='cvrp') instances = [] # Collect Set A, B, E, F, M datasets for name in problem_names: if 'A' in name: instances.append(name) elif 'B' in name: instances.append(name) elif 'E' in name: instances.append(name) elif 'F' in name: instances.append(name) elif 'M' in name and 'CMT' not in name: instances.append(name) # Modify the path you want to save # Note: we don't have to create this folder in advance path_to_save = './vrplib/' try: os.makedirs(path_to_save) for instance in tqdm(instances): vrplib.download_instance(instance, path_to_save) vrplib.download_solution(instance, path_to_save) except: # already exist pass
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/vrplib/download/list_names.py:58: DeprecationWarning: read_text is deprecated. Use files() instead. Refer to https://importlib-resources.readthedocs.io/en/latest/using.html#migrating-from-legacy for migration advice.\n  fi = pkg_resource.read_text(__package__, \"instance_data.csv\")\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/importlib/resources/_legacy.py:80: DeprecationWarning: open_text is deprecated. Use files() instead. Refer to https://importlib-resources.readthedocs.io/en/latest/using.html#migrating-from-legacy for migration advice.\n  with open_text(package, resource, encoding, errors) as fp:\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/vrplib/download/list_names.py:32: DeprecationWarning: The function 'list_names' is deprecated and will be removed in the next major version (vrplib v2.0.0).\n  warnings.warn(msg, DeprecationWarning)\n
In\u00a0[6]: Copied!
# Utils function: we will normalize the coordinates of the VRP instances\ndef normalize_coord(coord:torch.Tensor) -> torch.Tensor:\n    x, y = coord[:, 0], coord[:, 1]\n    x_min, x_max = x.min(), x.max()\n    y_min, y_max = y.min(), y.max()\n    \n    x_scaled = (x - x_min) / (x_max - x_min) \n    y_scaled = (y - y_min) / (y_max - y_min)\n    coord_scaled = torch.stack([x_scaled, y_scaled], dim=1)\n    return coord_scaled \n\ndef vrplib_to_td(problem, normalize=True):\n    coords = torch.tensor(problem['node_coord']).float()\n    coords_norm = normalize_coord(coords) if normalize else coords\n    demand = torch.tensor(problem['demand'][1:]).float()\n    capacity = problem['capacity']\n    n = coords.shape[0]\n    td = TensorDict({\n        'depot': coords_norm[0,:],\n        'locs': coords_norm[1:,:],\n        'demand': demand / capacity, # normalized demand\n        'capacity': capacity, # original capacity, not needed for inference\n    })\n    td = td[None] # add batch dimension, in this case just 1\n    return td\n
# Utils function: we will normalize the coordinates of the VRP instances def normalize_coord(coord:torch.Tensor) -> torch.Tensor: x, y = coord[:, 0], coord[:, 1] x_min, x_max = x.min(), x.max() y_min, y_max = y.min(), y.max() x_scaled = (x - x_min) / (x_max - x_min) y_scaled = (y - y_min) / (y_max - y_min) coord_scaled = torch.stack([x_scaled, y_scaled], dim=1) return coord_scaled def vrplib_to_td(problem, normalize=True): coords = torch.tensor(problem['node_coord']).float() coords_norm = normalize_coord(coords) if normalize else coords demand = torch.tensor(problem['demand'][1:]).float() capacity = problem['capacity'] n = coords.shape[0] td = TensorDict({ 'depot': coords_norm[0,:], 'locs': coords_norm[1:,:], 'demand': demand / capacity, # normalized demand 'capacity': capacity, # original capacity, not needed for inference }) td = td[None] # add batch dimension, in this case just 1 return td In\u00a0[8]: Copied!
tds, actions = [], []\nfor instance in instances:\n    # Inference\n    problem = vrplib.read_instance(os.path.join(path_to_save, instance+'.vrp'))\n    td_reset = env.reset(vrplib_to_td(problem).to(device))\n    with torch.inference_mode():\n        out = policy(td_reset.clone(), env, decode_type=\"sampling\", num_samples=128, select_best=True)\n        unnormalized_td = env.reset(vrplib_to_td(problem, normalize=False).to(device))\n        cost = -env.get_reward(unnormalized_td, out[\"actions\"]).int().item() # unnormalized cost\n        \n    # Load the optimal cost\n    solution = vrplib.read_solution(os.path.join(path_to_save, instance+'.sol'))\n    optimal_cost = solution['cost']\n\n    tds.append(td_reset)\n    actions.append(out[\"actions\"])\n    \n    # Calculate the gap and print\n    gap = (cost - optimal_cost) / optimal_cost\n    print(f'Problem: {instance:<15} Cost: {cost:<8} BKS: {optimal_cost:<8}\\t Gap: {gap:.2%}')\n
tds, actions = [], [] for instance in instances: # Inference problem = vrplib.read_instance(os.path.join(path_to_save, instance+'.vrp')) td_reset = env.reset(vrplib_to_td(problem).to(device)) with torch.inference_mode(): out = policy(td_reset.clone(), env, decode_type=\"sampling\", num_samples=128, select_best=True) unnormalized_td = env.reset(vrplib_to_td(problem, normalize=False).to(device)) cost = -env.get_reward(unnormalized_td, out[\"actions\"]).int().item() # unnormalized cost # Load the optimal cost solution = vrplib.read_solution(os.path.join(path_to_save, instance+'.sol')) optimal_cost = solution['cost'] tds.append(td_reset) actions.append(out[\"actions\"]) # Calculate the gap and print gap = (cost - optimal_cost) / optimal_cost print(f'Problem: {instance:<15} Cost: {cost:<8} BKS: {optimal_cost:<8}\\t Gap: {gap:.2%}')
Problem: A-n53-k7        Cost: 2777     BKS: 1010    \t Gap: 174.95%\nProblem: A-n54-k7        Cost: 3130     BKS: 1167    \t Gap: 168.21%\nProblem: A-n55-k9        Cost: 2812     BKS: 1073    \t Gap: 162.07%\nProblem: A-n60-k9        Cost: 3151     BKS: 1354    \t Gap: 132.72%\nProblem: A-n61-k9        Cost: 3060     BKS: 1034    \t Gap: 195.94%\nProblem: A-n62-k8        Cost: 3483     BKS: 1288    \t Gap: 170.42%\nProblem: A-n63-k9        Cost: 3736     BKS: 1616    \t Gap: 131.19%\nProblem: A-n63-k10       Cost: 3110     BKS: 1314    \t Gap: 136.68%\nProblem: A-n64-k9        Cost: 3721     BKS: 1401    \t Gap: 165.60%\nProblem: A-n65-k9        Cost: 3548     BKS: 1174    \t Gap: 202.21%\nProblem: A-n69-k9        Cost: 3600     BKS: 1159    \t Gap: 210.61%\nProblem: A-n80-k10       Cost: 4776     BKS: 1763    \t Gap: 170.90%\nProblem: B-n51-k7        Cost: 3286     BKS: 1032    \t Gap: 218.41%\nProblem: B-n52-k7        Cost: 2852     BKS: 747     \t Gap: 281.79%\nProblem: B-n56-k7        Cost: 2762     BKS: 707     \t Gap: 290.66%\nProblem: B-n57-k7        Cost: 3553     BKS: 1153    \t Gap: 208.15%\nProblem: B-n57-k9        Cost: 3622     BKS: 1598    \t Gap: 126.66%\nProblem: B-n63-k10       Cost: 3426     BKS: 1496    \t Gap: 129.01%\nProblem: B-n64-k9        Cost: 2804     BKS: 861     \t Gap: 225.67%\nProblem: B-n66-k9        Cost: 3273     BKS: 1316    \t Gap: 148.71%\nProblem: B-n67-k10       Cost: 2949     BKS: 1032    \t Gap: 185.76%\nProblem: B-n68-k9        Cost: 3992     BKS: 1272    \t Gap: 213.84%\nProblem: B-n78-k10       Cost: 4367     BKS: 1221    \t Gap: 257.66%\nProblem: E-n51-k5        Cost: 1615     BKS: 521     \t Gap: 209.98%\nProblem: E-n76-k7        Cost: 2396     BKS: 682     \t Gap: 251.32%\nProblem: E-n76-k8        Cost: 2402     BKS: 735     \t Gap: 226.80%\nProblem: E-n76-k10       Cost: 2393     BKS: 830     \t Gap: 188.31%\nProblem: E-n76-k14       Cost: 2520     BKS: 1021    \t Gap: 146.82%\nProblem: E-n101-k8       Cost: 3507     
BKS: 815     \t Gap: 330.31%\nProblem: E-n101-k14      Cost: 3550     BKS: 1067    \t Gap: 232.71%\nProblem: F-n72-k4        Cost: 1274     BKS: 237     \t Gap: 437.55%\nProblem: M-n101-k10      Cost: 4036     BKS: 820     \t Gap: 392.20%\n
In\u00a0[\u00a0]: Copied!
# Plot some instances\nenv.render(tds[0], actions[0].cpu())\nenv.render(tds[-2], actions[-2].cpu())\nenv.render(tds[-1], actions[-1].cpu())\n
# Plot some instances env.render(tds[0], actions[0].cpu()) env.render(tds[-2], actions[-2].cpu()) env.render(tds[-1], actions[-1].cpu()) In\u00a0[10]: Copied!
trainer = RL4COTrainer(\n    max_epochs=3,\n    accelerator=\"gpu\",\n    devices=1,\n    logger=None,\n)\n\ntrainer.fit(model)\n
trainer = RL4COTrainer( max_epochs=3, accelerator=\"gpu\", devices=1, logger=None, ) trainer.fit(model)
Using 16bit Automatic Mixed Precision (AMP)\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/plugins/precision/amp.py:55: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | CVRPEnv              | 0     \n1 | policy   | AttentionModelPolicy | 694 K \n2 | baseline | WarmupBaseline       | 694 K \n--------------------------------------------------\n1.4 M     Trainable params\n0         Non-trainable params\n1.4 M     Total params\n5.553     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[11]: Copied!
policy = model.policy.to(device).eval() # trained policy\n\ntds, actions = [], []\nfor instance in instances:\n    # Inference\n    problem = vrplib.read_instance(os.path.join(path_to_save, instance+'.vrp'))\n    td_reset = env.reset(vrplib_to_td(problem).to(device))\n    with torch.inference_mode():\n        out = policy(td_reset.clone(), env, decode_type=\"sampling\", num_samples=128, select_best=True)\n        unnormalized_td = env.reset(vrplib_to_td(problem, normalize=False).to(device))\n        cost = -env.get_reward(unnormalized_td, out[\"actions\"]).int().item() # unnormalized cost\n        \n    # Load the optimal cost\n    solution = vrplib.read_solution(os.path.join(path_to_save, instance+'.sol'))\n    optimal_cost = solution['cost']\n\n    tds.append(td_reset)\n    actions.append(out[\"actions\"])\n    \n    # Calculate the gap and print\n    gap = (cost - optimal_cost) / optimal_cost\n    print(f'Problem: {instance:<15} Cost: {cost:<8} BKS: {optimal_cost:<8}\\t Gap: {gap:.2%}')\n
policy = model.policy.to(device).eval() # trained policy tds, actions = [], [] for instance in instances: # Inference problem = vrplib.read_instance(os.path.join(path_to_save, instance+'.vrp')) td_reset = env.reset(vrplib_to_td(problem).to(device)) with torch.inference_mode(): out = policy(td_reset.clone(), env, decode_type=\"sampling\", num_samples=128, select_best=True) unnormalized_td = env.reset(vrplib_to_td(problem, normalize=False).to(device)) cost = -env.get_reward(unnormalized_td, out[\"actions\"]).int().item() # unnormalized cost # Load the optimal cost solution = vrplib.read_solution(os.path.join(path_to_save, instance+'.sol')) optimal_cost = solution['cost'] tds.append(td_reset) actions.append(out[\"actions\"]) # Calculate the gap and print gap = (cost - optimal_cost) / optimal_cost print(f'Problem: {instance:<15} Cost: {cost:<8} BKS: {optimal_cost:<8}\\t Gap: {gap:.2%}')
Problem: A-n53-k7        Cost: 1180     BKS: 1010    \t Gap: 16.83%\nProblem: A-n54-k7        Cost: 1256     BKS: 1167    \t Gap: 7.63%\nProblem: A-n55-k9        Cost: 1195     BKS: 1073    \t Gap: 11.37%\nProblem: A-n60-k9        Cost: 1502     BKS: 1354    \t Gap: 10.93%\nProblem: A-n61-k9        Cost: 1223     BKS: 1034    \t Gap: 18.28%\nProblem: A-n62-k8        Cost: 1491     BKS: 1288    \t Gap: 15.76%\nProblem: A-n63-k9        Cost: 1792     BKS: 1616    \t Gap: 10.89%\nProblem: A-n63-k10       Cost: 1459     BKS: 1314    \t Gap: 11.04%\nProblem: A-n64-k9        Cost: 1537     BKS: 1401    \t Gap: 9.71%\nProblem: A-n65-k9        Cost: 1355     BKS: 1174    \t Gap: 15.42%\nProblem: A-n69-k9        Cost: 1317     BKS: 1159    \t Gap: 13.63%\nProblem: A-n80-k10       Cost: 2009     BKS: 1763    \t Gap: 13.95%\nProblem: B-n51-k7        Cost: 1182     BKS: 1032    \t Gap: 14.53%\nProblem: B-n52-k7        Cost: 863      BKS: 747     \t Gap: 15.53%\nProblem: B-n56-k7        Cost: 889      BKS: 707     \t Gap: 25.74%\nProblem: B-n57-k7        Cost: 1323     BKS: 1153    \t Gap: 14.74%\nProblem: B-n57-k9        Cost: 1772     BKS: 1598    \t Gap: 10.89%\nProblem: B-n63-k10       Cost: 1671     BKS: 1496    \t Gap: 11.70%\nProblem: B-n64-k9        Cost: 1040     BKS: 861     \t Gap: 20.79%\nProblem: B-n66-k9        Cost: 1466     BKS: 1316    \t Gap: 11.40%\nProblem: B-n67-k10       Cost: 1201     BKS: 1032    \t Gap: 16.38%\nProblem: B-n68-k9        Cost: 1413     BKS: 1272    \t Gap: 11.08%\nProblem: B-n78-k10       Cost: 1529     BKS: 1221    \t Gap: 25.23%\nProblem: E-n51-k5        Cost: 630      BKS: 521     \t Gap: 20.92%\nProblem: E-n76-k7        Cost: 844      BKS: 682     \t Gap: 23.75%\nProblem: E-n76-k8        Cost: 862      BKS: 735     \t Gap: 17.28%\nProblem: E-n76-k10       Cost: 975      BKS: 830     \t Gap: 17.47%\nProblem: E-n76-k14       Cost: 1153     BKS: 1021    \t Gap: 12.93%\nProblem: E-n101-k8       Cost: 1070     BKS: 815     \t Gap: 
31.29%\nProblem: E-n101-k14      Cost: 1303     BKS: 1067    \t Gap: 22.12%\nProblem: F-n72-k4        Cost: 312      BKS: 237     \t Gap: 31.65%\nProblem: M-n101-k10      Cost: 1134     BKS: 820     \t Gap: 38.29%\n
In\u00a0[12]: Copied!
# Plot some instances\nenv.render(tds[0], actions[0].cpu())\nenv.render(tds[-2], actions[-2].cpu())\nenv.render(tds[-1], actions[-1].cpu())\n
# Plot some instances env.render(tds[0], actions[0].cpu()) env.render(tds[-2], actions[-2].cpu()) env.render(tds[-1], actions[-1].cpu())

Great! We can see that the performance vastly improved even with just a few minutes of training.

There are several ways to improve the model's performance further, such as:

  • Training for more steps
  • Using a different model architecture
  • Using a different training algorithm
  • Using different hyperparameters
  • Using a different Generator
  • ... and many more!
"},{"location":"examples/datasets/2-test-on-cvrplib/#testing-model-on-vrplib","title":"Testing Model on VRPLib\u00b6","text":"

In this notebook, we will test the trained model's performance on the VRPLib benchmark.

VRPLib is a collection of instances related to the CVRP, which is a classic optimization challenge in the field of logistics and transportation.

"},{"location":"examples/datasets/2-test-on-cvrplib/#installation","title":"Installation\u00b6","text":"

Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!

Note: You may need to restart the runtime in Colab after this

"},{"location":"examples/datasets/2-test-on-cvrplib/#imports","title":"Imports\u00b6","text":""},{"location":"examples/datasets/2-test-on-cvrplib/#download-vrp-problems","title":"Download vrp problems\u00b6","text":""},{"location":"examples/datasets/2-test-on-cvrplib/#test-untrained","title":"Test untrained\u00b6","text":""},{"location":"examples/datasets/2-test-on-cvrplib/#train","title":"Train\u00b6","text":"

We will train for a few steps just to show the effects of training a model. Alternatively, we can load a pretrained checkpoint, e.g. with:

model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)\n
"},{"location":"examples/datasets/2-test-on-cvrplib/#test-trained-model","title":"Test trained model\u00b6","text":""},{"location":"examples/modeling/","title":"Modeling","text":"

Collection of examples on models and related topics.

"},{"location":"examples/modeling/#index","title":"Index","text":"
  • 1-decoding-strategies.ipynb: here we show how to use different decoding strategies at inference time, such as greedy evaluation, beam search, and various sampling methods including top-k and nucleus sampling.
  • 2-transductive-methods.ipynb: here we show how to use transductive methods (i.e. online / test time optimization) such as EAS.
  • 3-change-encoder.ipynb: here we show how to change the encoder of a model.
"},{"location":"examples/modeling/1-decoding-strategies/","title":"RL4CO Decoding Strategies Notebook","text":"In\u00a0[1]: Copied!
## Uncomment the following line to install the package from PyPI\n## You may need to restart the runtime in Colab after this\n## Remember to choose a GPU runtime for faster training!\n\n# !pip install rl4co\n
## Uncomment the following line to install the package from PyPI ## You may need to restart the runtime in Colab after this ## Remember to choose a GPU runtime for faster training! # !pip install rl4co In\u00a0[4]: Copied!
import torch\n\nfrom rl4co.envs import TSPEnv\nfrom rl4co.models.zoo import AttentionModel, AttentionModelPolicy\nfrom rl4co.utils.trainer import RL4COTrainer\nfrom rl4co.utils.ops import batchify\n
import torch from rl4co.envs import TSPEnv from rl4co.models.zoo import AttentionModel, AttentionModelPolicy from rl4co.utils.trainer import RL4COTrainer from rl4co.utils.ops import batchify In\u00a0[5]: Copied!
%%capture\n# RL4CO env based on TorchRL\nenv = TSPEnv(generator_params=dict(num_loc=50)) \n\n# Policy: neural network, in this case with encoder-decoder architecture\npolicy = AttentionModelPolicy(env_name=env.name, \n                              embed_dim=128,\n                              num_encoder_layers=3,\n                              num_heads=8,\n                            )\n\n# Model: default is AM with REINFORCE and greedy rollout baseline\nmodel = AttentionModel(env, \n                       baseline=\"rollout\",\n                       batch_size = 512,\n                       val_batch_size = 64, \n                       test_batch_size = 64, \n                       train_data_size=100_000, # fast training for demo\n                       val_data_size=1_000,\n                       test_data_size=1_000,\n                       optimizer_kwargs={\"lr\": 1e-4},\n                       policy_kwargs={  # we can specify the decode types using the policy_kwargs\n                           \"train_decode_type\": \"sampling\",\n                           \"val_decode_type\": \"greedy\",\n                           \"test_decode_type\": \"beam_search\",\n                       }\n                       )\n
%%capture # RL4CO env based on TorchRL env = TSPEnv(generator_params=dict(num_loc=50)) # Policy: neural network, in this case with encoder-decoder architecture policy = AttentionModelPolicy(env_name=env.name, embed_dim=128, num_encoder_layers=3, num_heads=8, ) # Model: default is AM with REINFORCE and greedy rollout baseline model = AttentionModel(env, baseline=\"rollout\", batch_size = 512, val_batch_size = 64, test_batch_size = 64, train_data_size=100_000, # fast training for demo val_data_size=1_000, test_data_size=1_000, optimizer_kwargs={\"lr\": 1e-4}, policy_kwargs={ # we can specify the decode types using the policy_kwargs \"train_decode_type\": \"sampling\", \"val_decode_type\": \"greedy\", \"test_decode_type\": \"beam_search\", } ) In\u00a0[4]: Copied!
trainer = RL4COTrainer(\n    max_epochs=3,\n    devices=1,\n)\n\ntrainer.fit(model)\n
trainer = RL4COTrainer( max_epochs=3, devices=1, ) trainer.fit(model)
Using 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | TSPEnv               | 0     \n1 | policy   | AttentionModelPolicy | 710 K \n2 | baseline | WarmupBaseline       | 710 K \n--------------------------------------------------\n1.4 M     Trainable params\n0         Non-trainable params\n1.4 M     Total params\n5.681     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[6]: Copied!
# here we evaluate the model on the test set using the beam search decoding strategy as declared in the model constructor\ntrainer.test(model=model)\n
# here we evaluate the model on the test set using the beam search decoding strategy as declared in the model constructor trainer.test(model=model) In\u00a0[9]: Copied!
# we can simply change the decoding type of the current model instance\nmodel.policy.test_decode_type = \"greedy\"\ntrainer.test(model=model)\n
# we can simply change the decoding type of the current model instance model.policy.test_decode_type = \"greedy\" trainer.test(model=model) In\u00a0[8]: Copied!
device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\ntest_td_raw = next(iter(model.test_dataloader())).to(device)\ntd_test = env.reset(test_td_raw)\nmodel = model.to(device)\n
device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") test_td_raw = next(iter(model.test_dataloader())).to(device) td_test = env.reset(test_td_raw) model = model.to(device) In\u00a0[10]: Copied!
# Example over full dataset\nrewards = []\nfor batch in model.test_dataloader():\n    with torch.inference_mode():\n        td = env.reset(batch).to(device)\n        out = model(td, decode_type=\"greedy\")\n    rewards.append(out[\"reward\"])\nprint(\"Average reward over all dataset: %.3f\" % torch.cat(rewards).mean().item())\n\n# Example over a single instance\nwith torch.inference_mode():\n    out = model(test_td_raw.clone(), decode_type=\"greedy\")\n    print(\"Average reward: %.3f\" % out[\"reward\"].mean().item())\n
# Example over full dataset rewards = [] for batch in model.test_dataloader(): with torch.inference_mode(): td = env.reset(batch).to(device) out = model(td, decode_type=\"greedy\") rewards.append(out[\"reward\"]) print(\"Average reward over all dataset: %.3f\" % torch.cat(rewards).mean().item()) # Example over a single instance with torch.inference_mode(): out = model(test_td_raw.clone(), decode_type=\"greedy\") print(\"Average reward: %.3f\" % out[\"reward\"].mean().item())
Average reward over all dataset: -6.376\nAverage reward: -6.415\n
In\u00a0[11]: Copied!
# Example over a single instance\nwith torch.inference_mode():\n    bs = td_test.batch_size[0]\n    out = model(td_test.clone(), decode_type=\"multistart_greedy\", num_starts=20)\n    rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values\n    print(\"Average reward: %.3f\" % rewards.mean().item())\n
# Example over a single instance with torch.inference_mode(): bs = td_test.batch_size[0] out = model(td_test.clone(), decode_type=\"multistart_greedy\", num_starts=20) rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values print(\"Average reward: %.3f\" % rewards.mean().item())
Average reward: -6.279\n
In\u00a0[44]: Copied!
num_samples = 32\nwith torch.inference_mode():\n    bs = td_test.batch_size[0]\n    td_test_batched = batchify(td_test, num_samples) # repeat the same instance num_samples times\n    out = model(td_test_batched.clone(), decode_type=\"sampling\")\n    rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples\n    print(\"Average reward: %.3f\" % rewards.mean().item())\n
num_samples = 32 with torch.inference_mode(): bs = td_test.batch_size[0] td_test_batched = batchify(td_test, num_samples) # repeat the same instance num_samples times out = model(td_test_batched.clone(), decode_type=\"sampling\") rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples print(\"Average reward: %.3f\" % rewards.mean().item())
Average reward: -6.157\n
In\u00a0[75]: Copied!
num_samples = 32\ntop_p = 0.9\nwith torch.inference_mode():\n    bs = td_test.batch_size[0]\n    td_test_batched = batchify(td_test, num_samples) # repeat the same instance num_samples times\n    out = model(td_test_batched.clone(), decode_type=\"sampling\", top_p=top_p)\n    rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples\n    print(\"Average reward: %.3f\" % rewards.mean().item())\n
num_samples = 32 top_p = 0.9 with torch.inference_mode(): bs = td_test.batch_size[0] td_test_batched = batchify(td_test, num_samples) # repeat the same instance num_samples times out = model(td_test_batched.clone(), decode_type=\"sampling\", top_p=top_p) rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples print(\"Average reward: %.3f\" % rewards.mean().item())
Average reward: -6.136\n
In\u00a0[67]: Copied!
num_samples = 32\ntop_k = 10\nwith torch.inference_mode():\n    bs = td_test.batch_size[0]\n    td_test_batched = batchify(td_test, num_samples) # repeat the same instance num_samples times\n    out = model(td_test_batched.clone(), decode_type=\"sampling\", top_k=top_k)\n    rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples\n    print(\"Average reward: %.3f\" % rewards.mean().item())\n
num_samples = 32 top_k = 10 with torch.inference_mode(): bs = td_test.batch_size[0] td_test_batched = batchify(td_test, num_samples) # repeat the same instance num_samples times out = model(td_test_batched.clone(), decode_type=\"sampling\", top_k=top_k) rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples print(\"Average reward: %.3f\" % rewards.mean().item())
Average reward: -6.158\n
In\u00a0[88]: Copied!
with torch.inference_mode():\n    bs = td_test.batch_size[0]\n    out = model(td_test.clone(), decode_type=\"beam_search\", beam_width=20)\n    rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples\n    print(\"Average reward: %.3f\" % rewards.mean().item())\n
with torch.inference_mode(): bs = td_test.batch_size[0] out = model(td_test.clone(), decode_type=\"beam_search\", beam_width=20) rewards = torch.stack(out[\"reward\"].split(bs), 1).max(1).values # take the max reward over the num_samples samples print(\"Average reward: %.3f\" % rewards.mean().item())
Average reward: -6.195\n

We can see that beam search finds a better solution than the greedy decoder

We can also analyze the different solutions obtained via beam search when passing \"select_best=False\" to the forward pass of the policy. The solutions in this case are sorted instance-wise, that is:

  • instance1_solution1
  • instance2_solution1
  • instance3_solution1
  • instance1_solution2
  • instance2_solution2
  • instance3_solution2
In\u00a0[90]: Copied!
out = model(td_test.clone(), decode_type=\"beam_search\", beam_width=5, select_best=False)\n
out = model(td_test.clone(), decode_type=\"beam_search\", beam_width=5, select_best=False) In\u00a0[91]: Copied!
# we split the sequence after every \"batch_size\" instances, then stack the different solutions obtained for each minibatch instance by the beam search together.\nactions_stacked = torch.stack(out[\"actions\"].split(bs), 1)\nrewards_stacked = torch.stack(out[\"reward\"].split(bs), 1)\n
# we split the sequence after every \"batch_size\" instances, then stack the different solutions obtained for each minibatch instance by the beam search together. actions_stacked = torch.stack(out[\"actions\"].split(bs), 1) rewards_stacked = torch.stack(out[\"reward\"].split(bs), 1) In\u00a0[95]: Copied!
import matplotlib.pyplot as plt\nbatch_instance = 0\nfor i, actions in enumerate(actions_stacked[batch_instance].cpu()):\n    reward = rewards_stacked[batch_instance, i]\n    _, ax = plt.subplots()\n    \n    env.render(td[0], actions, ax=ax)\n    ax.set_title(\"Reward: %s\" % reward.item())\n
import matplotlib.pyplot as plt batch_instance = 0 for i, actions in enumerate(actions_stacked[batch_instance].cpu()): reward = rewards_stacked[batch_instance, i] _, ax = plt.subplots() env.render(td[0], actions, ax=ax) ax.set_title(\"Reward: %s\" % reward.item())

For evaluation, we can also use additional decoding strategies used during evaluation, such as sampling N times or greedy augmentations, available in rl4co/tasks/eval.py

"},{"location":"examples/modeling/1-decoding-strategies/#rl4co-decoding-strategies-notebook","title":"RL4CO Decoding Strategies Notebook\u00b6","text":"

This notebook demonstrates how to utilize the different decoding strategies available in rl4co/utils/decoding.py during the different phases of model development. We will also demonstrate how to evaluate the model for different decoding strategies on the test dataset.

"},{"location":"examples/modeling/1-decoding-strategies/#installation","title":"Installation\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#setup-policy-and-environment","title":"Setup Policy and Environment\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#setup-trainer-and-train-model","title":"Setup Trainer and train model\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#test-the-model-using-trainer-class","title":"Test the model using Trainer class\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#test-loop","title":"Test Loop\u00b6","text":"

Let's compare different decoding strategies on some test samples - for simplicity, we don't loop over the entire test dataset, but only over a single iteration of the test dataloader.

"},{"location":"examples/modeling/1-decoding-strategies/#greedy-decoding","title":"Greedy Decoding\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#greedy-decoding","title":"Greedy decoding\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#greedy-multistart-decoding","title":"Greedy multistart decoding\u00b6","text":"

Start from different nodes as done in POMO

"},{"location":"examples/modeling/1-decoding-strategies/#sampling","title":"Sampling\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#decoding-via-sampling","title":"Decoding via sampling\u00b6","text":"

In this case, we can parallelize the decoding process by batching the samples and decoding them in parallel.

"},{"location":"examples/modeling/1-decoding-strategies/#top-p-sampling-nucleus-sampling","title":"Top-p sampling (nucleus sampling)\u00b6","text":"

Top-p sampling is a sampling strategy where the smallest set of most likely tokens whose cumulative probability reaches p is selected and the probability mass is redistributed among them. This is useful when we want to sample from a subset of the nodes and we want to exclude the lower-end tail of the distribution.

"},{"location":"examples/modeling/1-decoding-strategies/#top-k-sampling","title":"Top-k sampling\u00b6","text":"

In this case we only sample from the top-k most likely tokens.

"},{"location":"examples/modeling/1-decoding-strategies/#beam-search","title":"Beam search\u00b6","text":"

Beam search is a popular decoding strategy in sequence-to-sequence models. It maintains a list of the top-k most likely sequences and expands them by adding the next token in the sequence. The sequences are scored based on the log-likelihood of the sequence. The sequences are expanded until the end token is reached or the maximum length is reached.

"},{"location":"examples/modeling/1-decoding-strategies/#beam-search-decoding","title":"Beam search decoding\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#digging-deeper-into-beam-search-solutions","title":"Digging deeper into beam search solutions\u00b6","text":""},{"location":"examples/modeling/1-decoding-strategies/#final-notes","title":"Final notes\u00b6","text":""},{"location":"examples/modeling/2-transductive-methods/","title":"Transductive Methods","text":"In\u00a0[\u00a0]: Copied!
# !pip install rl4co[graph] # include torch-geometric\n\n## NOTE: to install latest version from Github (may be unstable) install from source instead:\n# !pip install git+https://github.com/ai4co/rl4co.git\n
# !pip install rl4co[graph] # include torch-geometric ## NOTE: to install latest version from Github (may be unstable) install from source instead: # !pip install git+https://github.com/ai4co/rl4co.git In\u00a0[1]: Copied!
%load_ext autoreload\n%autoreload 2\n\nimport torch\n\nfrom rl4co.envs import TSPEnv, CVRPEnv\nfrom rl4co.models.zoo.am import AttentionModel\nfrom rl4co.utils.trainer import RL4COTrainer\nfrom rl4co.utils.decoding import get_log_likelihood\nfrom rl4co.models.zoo import EAS, EASLay, EASEmb, ActiveSearch\n\nimport logging\n
%load_ext autoreload %autoreload 2 import torch from rl4co.envs import TSPEnv, CVRPEnv from rl4co.models.zoo.am import AttentionModel from rl4co.utils.trainer import RL4COTrainer from rl4co.utils.decoding import get_log_likelihood from rl4co.models.zoo import EAS, EASLay, EASEmb, ActiveSearch import logging
2023-08-22 16:29:17.903805: I tensorflow/core/util/port.cc:110] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.\n2023-08-22 16:29:17.923169: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\nTo enable the following instructions: AVX2 AVX512F AVX512_VNNI AVX512_BF16 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n2023-08-22 16:29:18.249479: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n
In\u00a0[2]: Copied!
# Load from checkpoint; alternatively, simply instantiate a new model\ncheckpoint_path = \"last.ckpt\" # model trained for one epoch only just for showing the examples\n\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n# load checkpoint\n# checkpoint = torch.load(checkpoint_path)\n\nmodel = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False)\npolicy = model.policy.to(device)\n
# Load from checkpoint; alternatively, simply instantiate a new model checkpoint_path = \"last.ckpt\" # model trained for one epoch only just for showing the examples device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\") # load checkpoint # checkpoint = torch.load(checkpoint_path) model = AttentionModel.load_from_checkpoint(checkpoint_path, load_baseline=False) policy = model.policy.to(device)
/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n  rank_zero_warn(\n/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n  rank_zero_warn(\n/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/core/saving.py:164: UserWarning: Found keys that are not in the model state dict but in the checkpoint: ['baseline.baseline.model.encoder.init_embedding.init_embed.weight', 'baseline.baseline.model.encoder.init_embedding.init_embed.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.0.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.0.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.bias', 
'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.0.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.1.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.1.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.1.3.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.Wqkv.bias', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.weight', 'baseline.baseline.model.encoder.net.layers.2.0.module.out_proj.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_mean', 
'baseline.baseline.model.encoder.net.layers.2.1.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.2.1.normalizer.num_batches_tracked', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.0.bias', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.weight', 'baseline.baseline.model.encoder.net.layers.2.2.module.2.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.weight', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.bias', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_mean', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.running_var', 'baseline.baseline.model.encoder.net.layers.2.3.normalizer.num_batches_tracked', 'baseline.baseline.model.decoder.context_embedding.W_placeholder', 'baseline.baseline.model.decoder.context_embedding.project_context.weight', 'baseline.baseline.model.decoder.project_node_embeddings.weight', 'baseline.baseline.model.decoder.project_fixed_context.weight', 'baseline.baseline.model.decoder.logit_attention.project_out.weight']\n  rank_zero_warn(\n
In\u00a0[3]: Copied!
# env = CVRPEnv(generator_params=dict(num_loc=50))\n# policy = AttentionModel(env).policy.to(device)\n\nenv = TSPEnv(generator_params=dict(num_loc=50))\n\ntd = env.reset(batch_size=3).to(device)\n\nout = policy(td)\n
# env = CVRPEnv(generator_params=dict(num_loc=50)) # policy = AttentionModel(env).policy.to(device) env = TSPEnv(generator_params=dict(num_loc=50)) td = env.reset(batch_size=3).to(device) out = policy(td) In\u00a0[4]: Copied!
env.render(td.cpu(), out[\"actions\"].cpu())\n
env.render(td.cpu(), out[\"actions\"].cpu()) In\u00a0[5]: Copied!
logging.basicConfig(level=logging.DEBUG)\n\nenv.generator.num_loc = 200\n\ndataset = env.dataset(batch_size=[2])\n# eas_model = EASEmb(env, policy, dataset, batch_size=2, max_iters=20, save_path=\"eas_sols.pt\") # alternative\neas_model = EASLay(env, policy, dataset, batch_size=2, max_iters=20, save_path=\"eas_sols.pt\")\n\neas_model.setup()\n
logging.basicConfig(level=logging.DEBUG) env.generator.num_loc = 200 dataset = env.dataset(batch_size=[2]) # eas_model = EASEmb(env, policy, dataset, batch_size=2, max_iters=20, save_path=\"eas_sols.pt\") # alternative eas_model = EASLay(env, policy, dataset, batch_size=2, max_iters=20, save_path=\"eas_sols.pt\") eas_model.setup()
/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n  rank_zero_warn(\n/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/utilities/parsing.py:196: UserWarning: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n  rank_zero_warn(\nINFO:rl4co.models.rl.common.base:No metrics specified, using default\nINFO:rl4co.models.zoo.eas.search:Setting up Efficient Active Search (EAS) with: \n- EAS Embedding: False \n- EAS Layer: True \n\n
In\u00a0[6]: Copied!
# Plot initial solution\ntd_dataset = next(iter(eas_model.train_dataloader()))\ntd_dataset = env.reset(td_dataset).to(device)\nout = policy(td_dataset)\n\nenv.render(td_dataset.cpu(), out[\"actions\"].cpu())\n
# Plot initial solution td_dataset = next(iter(eas_model.train_dataloader())) td_dataset = env.reset(td_dataset).to(device) out = policy(td_dataset) env.render(td_dataset.cpu(), out[\"actions\"].cpu())
INFO:rl4co.models.common.constructive.autoregressive.policy:Instantiated environment not provided; instantiating tsp\n
In\u00a0[7]: Copied!
from rl4co.utils.trainer import RL4COTrainer\n\ntrainer = RL4COTrainer(\n    max_epochs=1,\n    gradient_clip_val=None,\n)\n\ntrainer.fit(eas_model)\n
from rl4co.utils.trainer import RL4COTrainer trainer = RL4COTrainer( max_epochs=1, gradient_clip_val=None, ) trainer.fit(eas_model)
WARNING:rl4co.utils.trainer:gradient_clip_val is set to None. This may lead to unstable training.\nUsing 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\nINFO:rl4co.models.zoo.eas.search:Setting up Efficient Active Search (EAS) with: \n- EAS Embedding: False \n- EAS Layer: True \n\nDEBUG:fsspec.local:open file: /home/botu/Dev/rl4co-rebuttal/notebooks/dev/lightning_logs/version_181/hparams.yaml\nDEBUG:fsspec.local:open file: /home/botu/Dev/rl4co-rebuttal/notebooks/dev/lightning_logs/version_181/hparams.yaml\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0]\nINFO:rl4co.models.rl.common.base:Instantiating optimizer <Adam>\n\n  | Name   | Type                 | Params\n------------------------------------------------\n0 | env    | TSPEnv               | 0     \n1 | policy | AttentionModelPolicy | 710 K \n------------------------------------------------\n710 K     Trainable params\n0         Non-trainable params\n710 K     Total params\n2.841     Total estimated model params size (MB)\n
Sanity Checking: 0it [00:00, ?it/s]
/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:432: PossibleUserWarning: The dataloader, val_dataloader, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 32 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n  rank_zero_warn(\n/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:432: PossibleUserWarning: The dataloader, train_dataloader, does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` (try 32 which is the number of cpus on this machine) in the `DataLoader` init to improve performance.\n  rank_zero_warn(\n/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/loops/fit_loop.py:280: PossibleUserWarning: The number of training batches (1) is smaller than the logging interval Trainer(log_every_n_steps=50). Set a lower value for log_every_n_steps if you want to see logs for the training epoch.\n  rank_zero_warn(\n
Training: 0it [00:00, ?it/s]
/home/botu/Dev/rl4co-rebuttal/notebooks/dev/../../rl4co/models/zoo/eas/nn.py:22: UserWarning: nn.init.xavier_uniform is now deprecated in favor of nn.init.xavier_uniform_.\n  torch.nn.init.xavier_uniform(self.W1)\n/home/botu/Dev/rl4co-rebuttal/notebooks/dev/../../rl4co/models/zoo/eas/nn.py:23: UserWarning: nn.init.xavier_uniform is now deprecated in favor of nn.init.xavier_uniform_.\n  torch.nn.init.xavier_uniform(self.b1)\nINFO:rl4co.models.rl.common.base:Instantiating optimizer <Adam>\n
/home/botu/miniconda3/envs/rl4co/lib/python3.10/site-packages/lightning/pytorch/trainer/connectors/logger_connector/result.py:212: UserWarning: You called `self.log('step', ...)` in your `training_step` but the value needs to be floating point. Converting it to torch.float32.\n  warning_cache.warn(\nINFO:rl4co.models.zoo.eas.search:0/20 |  Reward: -15.52 \nINFO:rl4co.models.zoo.eas.search:1/20 |  Reward: -15.32 \nINFO:rl4co.models.zoo.eas.search:2/20 |  Reward: -15.30 \nINFO:rl4co.models.zoo.eas.search:3/20 |  Reward: -15.28 \nINFO:rl4co.models.zoo.eas.search:4/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:5/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:6/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:7/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:8/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:9/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:10/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:11/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:12/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:13/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:14/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:15/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:16/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:17/20 |  Reward: -15.01 \nINFO:rl4co.models.zoo.eas.search:18/20 |  Reward: -14.84 \nINFO:rl4co.models.zoo.eas.search:19/20 |  Reward: -14.74 \nINFO:rl4co.models.zoo.eas.search:Best reward: -14.74\n
Validation: 0it [00:00, ?it/s]
INFO:rl4co.models.zoo.eas.search:Saving solutions and rewards to eas_sols.pt...\n`Trainer.fit` stopped: `max_epochs=1` reached.\n
In\u00a0[10]: Copied!
# Load\nactions = torch.load(\"eas_sols.pt\")[\"solutions\"][0].cpu()\nactions = actions[:torch.count_nonzero(actions, dim=-1)] # remove trailing zeros\nstate = td_dataset.cpu()[0]\n\nenv.render(state, actions)\n
# Load actions = torch.load(\"eas_sols.pt\")[\"solutions\"][0].cpu() actions = actions[:torch.count_nonzero(actions, dim=-1)] # remove trailing zeros state = td_dataset.cpu()[0] env.render(state, actions)

Even with few iterations, the search method can clearly find better solutions than the initial ones!

"},{"location":"examples/modeling/2-transductive-methods/#transductive-methods","title":"Transductive Methods\u00b6","text":"

In this notebook, we will showcase how to use the Efficient Active Search (EAS) algorithm to find better solutions to existing problems!

Tip: in transductive RL, we train (or finetune) a model to solve only specific instances.

"},{"location":"examples/modeling/2-transductive-methods/#installation","title":"Installation\u00b6","text":"

Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!

Note: You may need to restart the runtime in Colab after this

"},{"location":"examples/modeling/2-transductive-methods/#imports","title":"Imports\u00b6","text":""},{"location":"examples/modeling/2-transductive-methods/#eas","title":"EAS\u00b6","text":"

We perform a few iterations of EASLay for demonstration.

"},{"location":"examples/modeling/2-transductive-methods/#perform-search","title":"Perform search\u00b6","text":""},{"location":"examples/modeling/2-transductive-methods/#load-actions","title":"Load actions\u00b6","text":""},{"location":"examples/modeling/3-change-encoder/","title":"Encoder Customization","text":"In\u00a0[1]: Copied!
# !pip install rl4co[graph] # include torch-geometric\n\n## NOTE: to install latest version from Github (may be unstable) install from source instead:\n# !pip install git+https://github.com/ai4co/rl4co.git\n
# !pip install rl4co[graph] # include torch-geometric ## NOTE: to install latest version from Github (may be unstable) install from source instead: # !pip install git+https://github.com/ai4co/rl4co.git In\u00a0[1]: Copied!
from rl4co.envs import CVRPEnv\n\nfrom rl4co.models.zoo import AttentionModel\nfrom rl4co.utils.trainer import RL4COTrainer\n
from rl4co.envs import CVRPEnv from rl4co.models.zoo import AttentionModel from rl4co.utils.trainer import RL4COTrainer In\u00a0[3]: Copied!
# Init env, model, trainer\nenv = CVRPEnv(generator_params=dict(num_loc=20))\n\nmodel = AttentionModel(\n    env, \n    baseline='rollout',\n    train_data_size=100_000, # really small size for demo\n    val_data_size=10_000\n)\n \ntrainer = RL4COTrainer(\n    max_epochs=3, # few epochs for demo\n    accelerator='gpu',\n    devices=1,\n    logger=False,\n)\n\n# By default the AM uses the Graph Attention Encoder\nprint(f'Encoder: {model.policy.encoder._get_name()}')\n
# Init env, model, trainer env = CVRPEnv(generator_params=dict(num_loc=20)) model = AttentionModel( env, baseline='rollout', train_data_size=100_000, # really small size for demo val_data_size=10_000 ) trainer = RL4COTrainer( max_epochs=3, # few epochs for demo accelerator='gpu', devices=1, logger=False, ) # By default the AM uses the Graph Attention Encoder print(f'Encoder: {model.policy.encoder._get_name()}')
/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\nUsing 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\n
TPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n
Encoder: GraphAttentionEncoder\n
In\u00a0[4]: Copied!
# Train the model\ntrainer.fit(model)\n
# Train the model trainer.fit(model)
/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/callbacks/model_checkpoint.py:630: Checkpoint directory /datasets/home/botu/Dev/rl4co/notebooks/tutorials/checkpoints exists and is not empty.\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | CVRPEnv              | 0     \n1 | policy   | AttentionModelPolicy | 694 K \n2 | baseline | WarmupBaseline       | 694 K \n--------------------------------------------------\n1.4 M     Trainable params\n0         Non-trainable params\n1.4 M     Total params\n5.553     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=47` in the `DataLoader` to improve performance.\n/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=47` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[5]: Copied!
# Before we init, we need to install the graph neural network dependencies\n# !pip install rl4co[graph]\n
# Before we init, we need to install the graph neural network dependencies # !pip install rl4co[graph] In\u00a0[7]: Copied!
# Init the model with different encoder\nfrom rl4co.models.nn.graph.gcn import GCNEncoder\nfrom rl4co.models.nn.graph.mpnn import MessagePassingEncoder\n\ngcn_encoder = GCNEncoder(\n    env_name='cvrp', \n    embed_dim=128,\n    num_nodes=20, \n    num_layers=3,\n)\n\nmpnn_encoder = MessagePassingEncoder(\n    env_name='cvrp', \n    embed_dim=128,\n    num_nodes=20, \n    num_layers=3,\n)\n\nmodel = AttentionModel(\n    env, \n    baseline='rollout',\n    train_data_size=100_000, # really small size for demo\n    val_data_size=10_000, \n    policy_kwargs={\n        'encoder': gcn_encoder # gcn_encoder or mpnn_encoder\n    }\n)\n \ntrainer = RL4COTrainer(\n    max_epochs=3, # few epochs for demo\n    accelerator='gpu',\n    devices=1,\n    logger=False,\n)\n
# Init the model with different encoder from rl4co.models.nn.graph.gcn import GCNEncoder from rl4co.models.nn.graph.mpnn import MessagePassingEncoder gcn_encoder = GCNEncoder( env_name='cvrp', embed_dim=128, num_nodes=20, num_layers=3, ) mpnn_encoder = MessagePassingEncoder( env_name='cvrp', embed_dim=128, num_nodes=20, num_layers=3, ) model = AttentionModel( env, baseline='rollout', train_data_size=100_000, # really small size for demo val_data_size=10_000, policy_kwargs={ 'encoder': gcn_encoder # gcn_encoder or mpnn_encoder } ) trainer = RL4COTrainer( max_epochs=3, # few epochs for demo accelerator='gpu', devices=1, logger=False, )
/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\nUsing 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n
In\u00a0[8]: Copied!
# Train the model\ntrainer.fit(model)\n
# Train the model trainer.fit(model)
/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/callbacks/model_checkpoint.py:630: Checkpoint directory /datasets/home/botu/Dev/rl4co/notebooks/tutorials/checkpoints exists and is not empty.\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\n
LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | CVRPEnv              | 0     \n1 | policy   | AttentionModelPolicy | 148 K \n2 | baseline | WarmupBaseline       | 148 K \n--------------------------------------------------\n297 K     Trainable params\n0         Non-trainable params\n297 K     Total params\n1.191     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=47` in the `DataLoader` to improve performance.\n/datasets/home/botu/mambaforge/envs/rl4co-new/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=47` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[9]: Copied!
# Import necessary packages\nimport torch.nn as nn\nfrom torch import Tensor\nfrom tensordict import TensorDict\nfrom typing import Tuple, Union\nfrom rl4co.models.nn.env_embeddings import env_init_embedding\n\n\nclass BaseEncoder(nn.Module):\n    def __init__(\n            self,\n            env_name: str,\n            embed_dim: int,\n            init_embedding: nn.Module = None,\n        ):\n        super(BaseEncoder, self).__init__()\n        self.env_name = env_name\n        \n        # Init embedding for each environment\n        self.init_embedding = (\n            env_init_embedding(self.env_name, {\"embed_dim\": embed_dim})\n            if init_embedding is None\n            else init_embedding\n        )\n\n    def forward(\n        self, td: TensorDict, mask: Union[Tensor, None] = None\n    ) -> Tuple[Tensor, Tensor]:\n        \"\"\"\n        Args:\n            td: Input TensorDict containing the environment state\n            mask: Mask to apply to the attention\n\n        Returns:\n            h: Latent representation of the input\n            init_h: Initial embedding of the input\n        \"\"\"\n        init_h = self.init_embedding(td)\n        h = None\n        return h, init_h\n
# Import necessary packages import torch.nn as nn from torch import Tensor from tensordict import TensorDict from typing import Tuple, Union from rl4co.models.nn.env_embeddings import env_init_embedding class BaseEncoder(nn.Module): def __init__( self, env_name: str, embed_dim: int, init_embedding: nn.Module = None, ): super(BaseEncoder, self).__init__() self.env_name = env_name # Init embedding for each environment self.init_embedding = ( env_init_embedding(self.env_name, {\"embed_dim\": embed_dim}) if init_embedding is None else init_embedding ) def forward( self, td: TensorDict, mask: Union[Tensor, None] = None ) -> Tuple[Tensor, Tensor]: \"\"\" Args: td: Input TensorDict containing the environment state mask: Mask to apply to the attention Returns: h: Latent representation of the input init_h: Initial embedding of the input \"\"\" init_h = self.init_embedding(td) h = None return h, init_h"},{"location":"examples/modeling/3-change-encoder/#encoder-customization","title":"Encoder Customization\u00b6","text":"

In this notebook we will cover a tutorial for the flexible encoders!

"},{"location":"examples/modeling/3-change-encoder/#installation","title":"Installation\u00b6","text":"

Uncomment the following line to install the package from PyPI. Remember to choose a GPU runtime for faster training!

Note: You may need to restart the runtime in Colab after this

"},{"location":"examples/modeling/3-change-encoder/#imports","title":"Imports\u00b6","text":""},{"location":"examples/modeling/3-change-encoder/#a-default-minimal-training-script","title":"A default minimal training script\u00b6","text":"

Here we use the CVRP environment and the AM model as a minimal example of a training script. By default, the AM is initialized with a Graph Attention Encoder, but we can change it to anything we want.

"},{"location":"examples/modeling/3-change-encoder/#change-the-encoder","title":"Change the Encoder\u00b6","text":"

In RL4CO, we provide two graph neural network encoders: the Graph Convolutional Network (GCN) encoder and the Message Passing Neural Network (MPNN) encoder. In this tutorial, we will show how to change the encoder.

Note: while we provide these examples, you can also implement your own encoder and use it in RL4CO! For instance, you may use different encoders (and decoders) to solve problems that require e.g. distance matrices as input

"},{"location":"examples/modeling/3-change-encoder/#or-you-want-to-create-your-own-encoder","title":"Or you want to create your own encoder\u00b6","text":"

If you want to create a new encoder, you can use the following base class as a template and build your encoder class with these components in mind:

  1. RL4CO provides the env_init_embedding method for each environment. You may want to use it to get the initial embedding of the environment.
  2. The returned hidden features h and init_h have the shape ([batch_size], num_node, hidden_size).
  3. In RL4CO, we put the graph neural network encoders in the rl4co/models/nn/graph folder. You may want to put your customized encoder to the same folder. Feel free to send a PR to add your encoder to RL4CO!
"},{"location":"examples/other/","title":"Miscellaneous Examples","text":"

Collection of examples on other topics.

"},{"location":"examples/other/#index","title":"Index","text":"
  • 1-mtvrp.ipynb: here we show how to use the Multi-Task Vehicle Routing Problem (MTVRP) environment, which includes 16 tasks that can be solved simultaneously.
  • 2-scheduling.ipynb: provides a brief introduction to scheduling problems with RL4CO with the Flexible Job Shop Scheduling Problem (FJSP) environment.
  • 3-data-generator-distributions.ipynb: here we show how to use the data generators and how to generate data from custom distributions.
"},{"location":"examples/other/1-mtvrp/","title":"MTVRP: Multi-task VRP environment","text":"In\u00a0[1]: Copied!
%load_ext autoreload\n%autoreload 2\n\nfrom rl4co.envs.routing.mtvrp.env import MTVRPEnv\nfrom rl4co.envs.routing.mtvrp.generator import MTVRPGenerator\n
%load_ext autoreload %autoreload 2 from rl4co.envs.routing.mtvrp.env import MTVRPEnv from rl4co.envs.routing.mtvrp.generator import MTVRPGenerator
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning_utilities/core/imports.py:14: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html\n  import pkg_resources\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2832: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('sphinxcontrib')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n  declare_namespace(pkg)\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/fabric/__init__.py:41: Deprecated call to `pkg_resources.declare_namespace('lightning.fabric')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2317: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n  declare_namespace(parent)\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/__init__.py:37: Deprecated call to `pkg_resources.declare_namespace('lightning.pytorch')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. 
See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/pkg_resources/__init__.py:2317: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('lightning')`.\nImplementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages\n  declare_namespace(parent)\n

Let's now generate some variants! By default, we can generate all variants with the variant_preset argument of the generator.

In\u00a0[2]: Copied!
# Single feat: generate a distribution of single-featured environments\ngenerator = MTVRPGenerator(num_loc=50, variant_preset=\"all\")\nenv = MTVRPEnv(generator, check_solution=False)\n\ntd_data = env.generator(8)\nenv.get_variant_names(td_data)\n
# Single feat: generate a distribution of single-featured environments generator = MTVRPGenerator(num_loc=50, variant_preset=\"all\") env = MTVRPEnv(generator, check_solution=False) td_data = env.generator(8) env.get_variant_names(td_data) Out[2]:
['VRPLTW', 'OVRP', 'VRPLTW', 'OVRPLTW', 'OVRPL', 'VRPB', 'OVRPTW', 'OVRPB']
In\u00a0[3]: Copied!
# Here is the list of presets and their probabilities of being generated (fully customizable)\nenv.print_presets()\n
# Here is the list of presets and their probabilities of being generated (fully customizable) env.print_presets()
all: {'O': 0.5, 'TW': 0.5, 'L': 0.5, 'B': 0.5}\nsingle_feat: {'O': 0.5, 'TW': 0.5, 'L': 0.5, 'B': 0.5}\nsingle_feat_otw: {'O': 0.5, 'TW': 0.5, 'L': 0.5, 'B': 0.5, 'OTW': 0.5}\ncvrp: {'O': 0.0, 'TW': 0.0, 'L': 0.0, 'B': 0.0}\novrp: {'O': 1.0, 'TW': 0.0, 'L': 0.0, 'B': 0.0}\nvrpb: {'O': 0.0, 'TW': 0.0, 'L': 0.0, 'B': 1.0}\nvrpl: {'O': 0.0, 'TW': 0.0, 'L': 1.0, 'B': 0.0}\nvrptw: {'O': 0.0, 'TW': 1.0, 'L': 0.0, 'B': 0.0}\novrptw: {'O': 1.0, 'TW': 1.0, 'L': 0.0, 'B': 0.0}\novrpb: {'O': 1.0, 'TW': 0.0, 'L': 0.0, 'B': 1.0}\novrpl: {'O': 1.0, 'TW': 0.0, 'L': 1.0, 'B': 0.0}\nvrpbl: {'O': 0.0, 'TW': 0.0, 'L': 1.0, 'B': 1.0}\nvrpbtw: {'O': 0.0, 'TW': 1.0, 'L': 0.0, 'B': 1.0}\nvrpltw: {'O': 0.0, 'TW': 1.0, 'L': 1.0, 'B': 0.0}\novrpbl: {'O': 1.0, 'TW': 0.0, 'L': 1.0, 'B': 1.0}\novrpbtw: {'O': 1.0, 'TW': 1.0, 'L': 0.0, 'B': 1.0}\novrpltw: {'O': 1.0, 'TW': 1.0, 'L': 1.0, 'B': 0.0}\nvrpbltw: {'O': 0.0, 'TW': 1.0, 'L': 1.0, 'B': 1.0}\novrpbltw: {'O': 1.0, 'TW': 1.0, 'L': 1.0, 'B': 1.0}\n

We can change the preset to generate some specific variant, for instance the VRPB

In\u00a0[4]: Copied!
# Change generator\ngenerator = MTVRPGenerator(num_loc=50, variant_preset=\"vrpb\")\nenv.generator = generator\ntd_data = env.generator(8)\nenv.get_variant_names(td_data)\n
# Change generator generator = MTVRPGenerator(num_loc=50, variant_preset=\"vrpb\") env.generator = generator td_data = env.generator(8) env.get_variant_names(td_data)
vrpb selected. Will not use feature combination!\n
Out[4]:
['VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB', 'VRPB']
In\u00a0[5]: Copied!
import torch\nfrom rl4co.utils.ops import gather_by_index\n\n\n# Simple heuristics (nearest neighbor + capacity check)\ndef greedy_policy(td):\n    \"\"\"Select closest available action\"\"\"\n    available_actions = td[\"action_mask\"]\n    # distances\n    curr_node = td[\"current_node\"]\n    loc_cur = gather_by_index(td[\"locs\"], curr_node)\n    distances_next = torch.cdist(loc_cur[:, None, :], td[\"locs\"], p=2.0).squeeze(1)\n\n    distances_next[~available_actions.bool()] = float(\"inf\")\n    # do not select depot if some capacity is left\n    distances_next[:, 0] = float(\"inf\") * (\n        td[\"used_capacity_linehaul\"] < td[\"vehicle_capacity\"]\n    ).float().squeeze(-1)\n\n    # # if sum of available actions is 0, select depot\n    # distances_next[available_actions.sum(-1) == 0, 0] = 0\n    action = torch.argmin(distances_next, dim=-1)\n    td.set(\"action\", action)\n    return td\n\n\ndef rollout(env, td, policy=greedy_policy, max_steps: int = None):\n    \"\"\"Helper function to rollout a policy. Currently, TorchRL does not allow to step\n    over envs when done with `env.rollout()`. We need this because for environments that complete at different steps.\n    \"\"\"\n\n    max_steps = float(\"inf\") if max_steps is None else max_steps\n    actions = []\n    steps = 0\n\n    while not td[\"done\"].all():\n        td = policy(td)\n        actions.append(td[\"action\"])\n        td = env.step(td)[\"next\"]\n        steps += 1\n        if steps > max_steps:\n            print(\"Max steps reached\")\n            break\n    return torch.stack(actions, dim=1)\n
import torch from rl4co.utils.ops import gather_by_index # Simple heuristics (nearest neighbor + capacity check) def greedy_policy(td): \"\"\"Select closest available action\"\"\" available_actions = td[\"action_mask\"] # distances curr_node = td[\"current_node\"] loc_cur = gather_by_index(td[\"locs\"], curr_node) distances_next = torch.cdist(loc_cur[:, None, :], td[\"locs\"], p=2.0).squeeze(1) distances_next[~available_actions.bool()] = float(\"inf\") # do not select depot if some capacity is left distances_next[:, 0] = float(\"inf\") * ( td[\"used_capacity_linehaul\"] < td[\"vehicle_capacity\"] ).float().squeeze(-1) # # if sum of available actions is 0, select depot # distances_next[available_actions.sum(-1) == 0, 0] = 0 action = torch.argmin(distances_next, dim=-1) td.set(\"action\", action) return td def rollout(env, td, policy=greedy_policy, max_steps: int = None): \"\"\"Helper function to rollout a policy. Currently, TorchRL does not allow to step over envs when done with `env.rollout()`. We need this because for environments that complete at different steps. \"\"\" max_steps = float(\"inf\") if max_steps is None else max_steps actions = [] steps = 0 while not td[\"done\"].all(): td = policy(td) actions.append(td[\"action\"]) td = env.step(td)[\"next\"] steps += 1 if steps > max_steps: print(\"Max steps reached\") break return torch.stack(actions, dim=1) In\u00a0[6]: Copied!
# NOTE: if we don't select ovrpbltw, the below does not work and there is still some\n# minor bug in either masking or variant subselection\n\ngenerator = MTVRPGenerator(num_loc=50, variant_preset=\"all\")\nenv.generator = generator\ntd_data = env.generator(3)\nvariant_names = env.get_variant_names(td_data)\n\ntd = env.reset(td_data)\n\nactions = rollout(env, td.clone(), greedy_policy)\nrewards = env.get_reward(td, actions)\n\nfor idx in [0, 1, 2]:\n    env.render(td[idx], actions[idx])\n    print(\"Cost: \", - rewards[idx].item())\n    print(\"Problem: \", variant_names[idx])\n
# NOTE: if we don't select ovrpbltw, the below does not work and there is still some # minor bug in either masking or variant subselection generator = MTVRPGenerator(num_loc=50, variant_preset=\"all\") env.generator = generator td_data = env.generator(3) variant_names = env.get_variant_names(td_data) td = env.reset(td_data) actions = rollout(env, td.clone(), greedy_policy) rewards = env.get_reward(td, actions) for idx in [0, 1, 2]: env.render(td[idx], actions[idx]) print(\"Cost: \", - rewards[idx].item()) print(\"Problem: \", variant_names[idx])
Cost:  17.503389358520508\nProblem:  OVRPLTW\n
Cost:  18.86773109436035\nProblem:  CVRP\n
Cost:  15.39835262298584\nProblem:  VRPB\n
In\u00a0[7]: Copied!
from rl4co.utils.trainer import RL4COTrainer\nfrom rl4co.models.zoo import MVMoE_POMO\n\ndevice_id = 0\ndevice = torch.device(f\"cuda:{device_id}\" if torch.cuda.is_available() else \"cpu\")\ngenerator = MTVRPGenerator(num_loc=50, variant_preset=\"single_feat\")\nenv = MTVRPEnv(generator, check_solution=False)\n
from rl4co.utils.trainer import RL4COTrainer from rl4co.models.zoo import MVMoE_POMO device_id = 0 device = torch.device(f\"cuda:{device_id}\" if torch.cuda.is_available() else \"cpu\") generator = MTVRPGenerator(num_loc=50, variant_preset=\"single_feat\") env = MTVRPEnv(generator, check_solution=False)
single_feat selected. Will not use feature combination!\n
In\u00a0[8]: Copied!
moe_kwargs = {\"encoder\": {\"hidden_act\": \"ReLU\", \"num_experts\": 4, \"k\": 2, \"noisy_gating\": True},\n              \"decoder\": {\"light_version\": False, \"num_experts\": 4, \"k\": 2, \"noisy_gating\": True}}\nmodel = MVMoE_POMO(\n    env,\n    moe_kwargs=moe_kwargs,\n    batch_size=128,\n    train_data_size=10000,  # each epoch,\n    val_batch_size=100,\n    val_data_size=1000,\n    optimizer=\"Adam\",\n    optimizer_kwargs={\"lr\": 1e-4, \"weight_decay\": 1e-6},\n    lr_scheduler=\"MultiStepLR\",\n    lr_scheduler_kwargs={\"milestones\": [451, ], \"gamma\": 0.1},\n)\n\ntrainer = RL4COTrainer(\n        max_epochs=3,\n        accelerator=\"gpu\",\n        devices=[device_id],\n        logger=None\n    )\n\ntrainer.fit(model)\n
moe_kwargs = {\"encoder\": {\"hidden_act\": \"ReLU\", \"num_experts\": 4, \"k\": 2, \"noisy_gating\": True}, \"decoder\": {\"light_version\": False, \"num_experts\": 4, \"k\": 2, \"noisy_gating\": True}} model = MVMoE_POMO( env, moe_kwargs=moe_kwargs, batch_size=128, train_data_size=10000, # each epoch, val_batch_size=100, val_data_size=1000, optimizer=\"Adam\", optimizer_kwargs={\"lr\": 1e-4, \"weight_decay\": 1e-6}, lr_scheduler=\"MultiStepLR\", lr_scheduler_kwargs={\"milestones\": [451, ], \"gamma\": 0.1}, ) trainer = RL4COTrainer( max_epochs=3, accelerator=\"gpu\", devices=[device_id], logger=None ) trainer.fit(model)
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/utilities/parsing.py:199: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\nUsing 16bit Automatic Mixed Precision (AMP)\nGPU available: True (cuda), used: True\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:75: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\nMissing logger folder: /home/botu/Dev/rl4co/examples/other/lightning_logs\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\nLOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [0,1]\n\n  | Name     | Type                 | Params\n--------------------------------------------------\n0 | env      | MTVRPEnv             | 0     \n1 | policy   | AttentionModelPolicy | 3.7 M \n2 | baseline | SharedBaseline       | 0     \n--------------------------------------------------\n3.7 M     Trainable params\n0         Non-trainable params\n3.7 M     Total params\n14.868    Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n/home/botu/mambaforge/envs/rl4co/lib/python3.11/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=31` in the `DataLoader` to improve performance.\n
Training: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
Validation: |          | 0/? [00:00<?, ?it/s]
`Trainer.fit` stopped: `max_epochs=3` reached.\n
In\u00a0[34]: Copied!
# Greedy rollouts over trained model (same states as previous plot)\npolicy = model.policy.to(device)\nout = policy(td.to(device).clone(), env, phase=\"test\", decode_type=\"greedy\")\nactions_mvmoe = out['actions'].cpu().detach()\nrewards_mvmoe = out['reward'].cpu().detach()\n\nfor idx in [0, 1, 2]:\n    env.render(td[idx], actions_mvmoe[idx])\n    print(\"Cost: \", -rewards_mvmoe[idx].item())\n    print(\"Problem: \", variant_names[idx])\n
# Greedy rollouts over trained model (same states as previous plot) policy = model.policy.to(device) out = policy(td.to(device).clone(), env, phase=\"test\", decode_type=\"greedy\") actions_mvmoe = out['actions'].cpu().detach() rewards_mvmoe = out['reward'].cpu().detach() for idx in [0, 1, 2]: env.render(td[idx], actions_mvmoe[idx]) print(\"Cost: \", -rewards_mvmoe[idx].item()) print(\"Problem: \", variant_names[idx])
Cost:  17.188127517700195\nProblem:  OVRPLTW\n
Cost:  14.578388214111328\nProblem:  CVRP\n
Cost:  12.24499797821045\nProblem:  VRPB\n
In\u00a0[31]: Copied!
# PyVRP - HGS\npyvrp_actions, pyvrp_costs = env.solve(td, max_runtime=5, num_procs=10, solver=\"pyvrp\")\nrewards_pyvrp = env.get_reward(td, pyvrp_actions)\n
# PyVRP - HGS pyvrp_actions, pyvrp_costs = env.solve(td, max_runtime=5, num_procs=10, solver=\"pyvrp\") rewards_pyvrp = env.get_reward(td, pyvrp_actions) In\u00a0[36]: Copied!
def calculate_gap(cost, bks):   \n    gaps = (cost - bks) / bks\n    return gaps.mean() * 100\n\n# Nearest insertion\nactions = rollout(env, td.clone(), greedy_policy)\nrewards_ni = env.get_reward(td, actions)\n\nprint(rewards_mvmoe, rewards_ni, rewards_pyvrp)   \nprint(f\"Gap to HGS (NI): {calculate_gap(-rewards_ni, -rewards_pyvrp):.2f}%\")\nprint(f\"Gap to HGS (MVMoE): {calculate_gap(-rewards_mvmoe, -rewards_pyvrp):.2f}%\")\n
def calculate_gap(cost, bks): gaps = (cost - bks) / bks return gaps.mean() * 100 # Nearest insertion actions = rollout(env, td.clone(), greedy_policy) rewards_ni = env.get_reward(td, actions) print(rewards_mvmoe, rewards_ni, rewards_pyvrp) print(f\"Gap to HGS (NI): {calculate_gap(-rewards_ni, -rewards_pyvrp):.2f}%\") print(f\"Gap to HGS (MVMoE): {calculate_gap(-rewards_mvmoe, -rewards_pyvrp):.2f}%\")
tensor([-17.1881, -14.5784, -12.2450]) tensor([-17.5034, -18.8677, -15.3984]) tensor([-12.6954, -11.9107,  -9.9261])\nGap to HGS (NI): 50.47%\nGap to HGS (MVMoE): 27.05%\n

With only three short epochs, we can already do better than NI!

"},{"location":"examples/other/1-mtvrp/#mtvrp-multi-task-vrp-environment","title":"MTVRP: Multi-task VRP environment\u00b6","text":"

This environment can handle any of the following variants:

VRP Variant Capacity (C) Open Route (O) Backhaul (B) Duration Limit (L) Time Window (TW) CVRP \u2714 OVRP \u2714 \u2714 VRPB \u2714 \u2714 VRPL \u2714 \u2714 VRPTW \u2714 \u2714 OVRPTW \u2714 \u2714 \u2714 OVRPB \u2714 \u2714 \u2714 OVRPL \u2714 \u2714 \u2714 VRPBL \u2714 \u2714 \u2714 VRPBTW \u2714 \u2714 \u2714 VRPLTW \u2714 \u2714 \u2714 OVRPBL \u2714 \u2714 \u2714 \u2714 OVRPBTW \u2714 \u2714 \u2714 \u2714 OVRPLTW \u2714 \u2714 \u2714 \u2714 VRPBLTW \u2714 \u2714 \u2714 \u2714 OVRPBLTW \u2714 \u2714 \u2714 \u2714 \u2714

It is fully batched, meaning that different variants can be in the same batch too!

"},{"location":"examples/other/1-mtvrp/#greedy-rollout-and-plot","title":"Greedy rollout and plot\u00b6","text":""},{"location":"examples/other/1-mtvrp/#train-mvmoe-on-multiple-problems","title":"Train MVMoE on Multiple Problems\u00b6","text":""},{"location":"examples/other/1-mtvrp/#getting-gaps-to-classical-solvers","title":"Getting gaps to classical solvers\u00b6","text":"

We additionally offer an optional solve API to get solutions from classical solvers. We can use this to compute the gaps to the best-known solutions found by these solvers.

"},{"location":"examples/other/2-scheduling/","title":"Solving the Flexible Job-Shop Scheduling Problem (FJSP)","text":"In\u00a0[1]: Copied!
! pip install torch_geometric\n
! pip install torch_geometric
Requirement already satisfied: torch_geometric in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (2.5.0)\nRequirement already satisfied: tqdm in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (4.66.1)\nRequirement already satisfied: numpy in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (1.26.3)\nRequirement already satisfied: scipy in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (1.11.4)\nRequirement already satisfied: fsspec in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (2023.12.2)\nRequirement already satisfied: jinja2 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (3.1.3)\nRequirement already satisfied: aiohttp in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (3.9.1)\nRequirement already satisfied: requests in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (2.31.0)\nRequirement already satisfied: pyparsing in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (3.1.1)\nRequirement already satisfied: scikit-learn in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (1.4.1.post1)\nRequirement already satisfied: psutil>=5.8.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from torch_geometric) (5.9.7)\nRequirement already satisfied: attrs>=17.3.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (23.2.0)\nRequirement already satisfied: multidict<7.0,>=4.5 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (6.0.4)\nRequirement already satisfied: yarl<2.0,>=1.0 in 
/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (1.9.4)\nRequirement already satisfied: frozenlist>=1.1.1 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (1.4.1)\nRequirement already satisfied: aiosignal>=1.1.2 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (1.3.1)\nRequirement already satisfied: async-timeout<5.0,>=4.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from aiohttp->torch_geometric) (4.0.3)\nRequirement already satisfied: MarkupSafe>=2.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from jinja2->torch_geometric) (2.1.3)\nRequirement already satisfied: charset-normalizer<4,>=2 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) (3.3.2)\nRequirement already satisfied: idna<4,>=2.5 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) (3.6)\nRequirement already satisfied: urllib3<3,>=1.21.1 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) (1.26.18)\nRequirement already satisfied: certifi>=2017.4.17 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from requests->torch_geometric) (2023.11.17)\nRequirement already satisfied: joblib>=1.2.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from scikit-learn->torch_geometric) (1.3.2)\nRequirement already satisfied: threadpoolctl>=2.0.0 in /Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages (from scikit-learn->torch_geometric) (3.3.0)\n
In\u00a0[2]: Copied!
%load_ext autoreload\n%autoreload 2\n\nimport torch\nimport numpy as np\nimport matplotlib.pyplot as plt\nimport numpy as np\nfrom IPython.display import display, clear_output\nimport time\nimport networkx as nx\nimport matplotlib.pyplot as plt\nfrom rl4co.envs import FJSPEnv\nfrom rl4co.models.zoo.l2d import L2DModel\nfrom rl4co.models.zoo.l2d.policy import L2DPolicy\nfrom rl4co.models.zoo.l2d.decoder import L2DDecoder\nfrom rl4co.models.nn.graph.hgnn import HetGNNEncoder\nfrom rl4co.utils.trainer import RL4COTrainer\n
%load_ext autoreload %autoreload 2 import torch import numpy as np import matplotlib.pyplot as plt import numpy as np from IPython.display import display, clear_output import time import networkx as nx import matplotlib.pyplot as plt from rl4co.envs import FJSPEnv from rl4co.models.zoo.l2d import L2DModel from rl4co.models.zoo.l2d.policy import L2DPolicy from rl4co.models.zoo.l2d.decoder import L2DDecoder from rl4co.models.nn.graph.hgnn import HetGNNEncoder from rl4co.utils.trainer import RL4COTrainer In\u00a0[3]: Copied!
generator_params = {\n  \"num_jobs\": 5,  # the total number of jobs\n  \"num_machines\": 5,  # the total number of machines that can process operations\n  \"min_ops_per_job\": 1,  # minimum number of operatios per job\n  \"max_ops_per_job\": 2,  # maximum number of operations per job\n  \"min_processing_time\": 1,  # the minimum time required for a machine to process an operation\n  \"max_processing_time\": 20,  # the maximum time required for a machine to process an operation\n  \"min_eligible_ma_per_op\": 1,  # the minimum number of machines capable to process an operation\n  \"max_eligible_ma_per_op\": 2,  # the maximum number of machines capable to process an operation\n}\n
generator_params = { \"num_jobs\": 5, # the total number of jobs \"num_machines\": 5, # the total number of machines that can process operations \"min_ops_per_job\": 1, # minimum number of operatios per job \"max_ops_per_job\": 2, # maximum number of operations per job \"min_processing_time\": 1, # the minimum time required for a machine to process an operation \"max_processing_time\": 20, # the maximum time required for a machine to process an operation \"min_eligible_ma_per_op\": 1, # the minimum number of machines capable to process an operation \"max_eligible_ma_per_op\": 2, # the maximum number of machines capable to process an operation } In\u00a0[4]: Copied!
env = FJSPEnv(generator_params=generator_params)\ntd = env.reset(batch_size=[1])\n
env = FJSPEnv(generator_params=generator_params) td = env.reset(batch_size=[1]) In\u00a0[5]: Copied!
# Create a bipartite graph from the adjacency matrix\nG = nx.Graph()\nproc_times = td[\"proc_times\"].squeeze(0)\njob_ops_adj = td[\"job_ops_adj\"].squeeze(0)\norder = td[\"ops_sequence_order\"].squeeze(0) + 1\n\nnum_machines, num_operations = proc_times.shape\nnum_jobs = job_ops_adj.size(0)\n\njobs = [f\"j{i+1}\" for i in range(num_jobs)]\nmachines = [f\"m{i+1}\" for i in range(num_machines)]\noperations = [f\"o{i+1}\" for i in range(num_operations)]\n\n# Add nodes from each set\nG.add_nodes_from(machines, bipartite=0)\nG.add_nodes_from(operations, bipartite=1)\nG.add_nodes_from(jobs, bipartite=2)\n\n# Add edges based on the adjacency matrix\nfor i in range(num_machines):\n    for j in range(num_operations):\n        edge_weigth = proc_times[i][j]\n        if edge_weigth != 0:\n            G.add_edge(f\"m{i+1}\", f\"o{j+1}\", weight=edge_weigth)\n\n\n# Add edges based on the adjacency matrix\nfor i in range(num_jobs):\n    for j in range(num_operations):\n        edge_weigth = job_ops_adj[i][j]\n        if edge_weigth != 0:\n            G.add_edge(f\"j{i+1}\", f\"o{j+1}\", weight=3, label=order[j])\n\n\nwidths = [x / 3 for x in nx.get_edge_attributes(G, 'weight').values()]\n\nplt.figure(figsize=(10,6))\n# Plot the graph\n\nmachines = [n for n, d in G.nodes(data=True) if d['bipartite'] == 0]\noperations = [n for n, d in G.nodes(data=True) if d['bipartite'] == 1]\njobs = [n for n, d in G.nodes(data=True) if d['bipartite'] == 2]\n\npos = {}\npos.update((node, (1, index)) for index, node in enumerate(machines))\npos.update((node, (2, index)) for index, node in enumerate(operations))\npos.update((node, (3, index)) for index, node in enumerate(jobs))\n\nedge_labels = {(u, v): d['label'].item() for u, v, d in G.edges(data=True) if d.get(\"label\") is not None}\nnx.draw_networkx_edge_labels(G, {k: (v[0]+.12, v[1]) for k,v in pos.items()}, edge_labels=edge_labels, rotate=False)\n\nnx.draw_networkx_nodes(G, pos, nodelist=machines, node_color='b', 
label=\"Machine\")\nnx.draw_networkx_nodes(G, pos, nodelist=operations, node_color='r', label=\"Operation\")\nnx.draw_networkx_nodes(G, pos, nodelist=jobs, node_color='y', label=\"jobs\")\nnx.draw_networkx_edges(G, pos, width=widths, alpha=0.6)\n\nplt.title('Visualization of the FJSP')\nplt.legend(bbox_to_anchor=(.95, 1.05))\nplt.axis('off')\nplt.show()\n
# Create a bipartite graph from the adjacency matrix G = nx.Graph() proc_times = td[\"proc_times\"].squeeze(0) job_ops_adj = td[\"job_ops_adj\"].squeeze(0) order = td[\"ops_sequence_order\"].squeeze(0) + 1 num_machines, num_operations = proc_times.shape num_jobs = job_ops_adj.size(0) jobs = [f\"j{i+1}\" for i in range(num_jobs)] machines = [f\"m{i+1}\" for i in range(num_machines)] operations = [f\"o{i+1}\" for i in range(num_operations)] # Add nodes from each set G.add_nodes_from(machines, bipartite=0) G.add_nodes_from(operations, bipartite=1) G.add_nodes_from(jobs, bipartite=2) # Add edges based on the adjacency matrix for i in range(num_machines): for j in range(num_operations): edge_weigth = proc_times[i][j] if edge_weigth != 0: G.add_edge(f\"m{i+1}\", f\"o{j+1}\", weight=edge_weigth) # Add edges based on the adjacency matrix for i in range(num_jobs): for j in range(num_operations): edge_weigth = job_ops_adj[i][j] if edge_weigth != 0: G.add_edge(f\"j{i+1}\", f\"o{j+1}\", weight=3, label=order[j]) widths = [x / 3 for x in nx.get_edge_attributes(G, 'weight').values()] plt.figure(figsize=(10,6)) # Plot the graph machines = [n for n, d in G.nodes(data=True) if d['bipartite'] == 0] operations = [n for n, d in G.nodes(data=True) if d['bipartite'] == 1] jobs = [n for n, d in G.nodes(data=True) if d['bipartite'] == 2] pos = {} pos.update((node, (1, index)) for index, node in enumerate(machines)) pos.update((node, (2, index)) for index, node in enumerate(operations)) pos.update((node, (3, index)) for index, node in enumerate(jobs)) edge_labels = {(u, v): d['label'].item() for u, v, d in G.edges(data=True) if d.get(\"label\") is not None} nx.draw_networkx_edge_labels(G, {k: (v[0]+.12, v[1]) for k,v in pos.items()}, edge_labels=edge_labels, rotate=False) nx.draw_networkx_nodes(G, pos, nodelist=machines, node_color='b', label=\"Machine\") nx.draw_networkx_nodes(G, pos, nodelist=operations, node_color='r', label=\"Operation\") nx.draw_networkx_nodes(G, pos, nodelist=jobs, 
node_color='y', label=\"jobs\") nx.draw_networkx_edges(G, pos, width=widths, alpha=0.6) plt.title('Visualization of the FJSP') plt.legend(bbox_to_anchor=(.95, 1.05)) plt.axis('off') plt.show() In\u00a0[6]: Copied!
# Lets generate a more complex instance\n\ngenerator_params = {\n  \"num_jobs\": 10,  # the total number of jobs\n  \"num_machines\": 5,  # the total number of machines that can process operations\n  \"min_ops_per_job\": 4,  # minimum number of operatios per job\n  \"max_ops_per_job\": 6,  # maximum number of operations per job\n  \"min_processing_time\": 1,  # the minimum time required for a machine to process an operation\n  \"max_processing_time\": 20,  # the maximum time required for a machine to process an operation\n  \"min_eligible_ma_per_op\": 1,  # the minimum number of machines capable to process an operation\n  \"max_eligible_ma_per_op\": 5,  # the maximum number of machines capable to process an operation\n}\n\nenv = FJSPEnv(generator_params=generator_params)\ntd = env.reset(batch_size=[1])\n
# Lets generate a more complex instance generator_params = { \"num_jobs\": 10, # the total number of jobs \"num_machines\": 5, # the total number of machines that can process operations \"min_ops_per_job\": 4, # minimum number of operatios per job \"max_ops_per_job\": 6, # maximum number of operations per job \"min_processing_time\": 1, # the minimum time required for a machine to process an operation \"max_processing_time\": 20, # the maximum time required for a machine to process an operation \"min_eligible_ma_per_op\": 1, # the minimum number of machines capable to process an operation \"max_eligible_ma_per_op\": 5, # the maximum number of machines capable to process an operation } env = FJSPEnv(generator_params=generator_params) td = env.reset(batch_size=[1]) In\u00a0[7]: Copied!
encoder = HetGNNEncoder(embed_dim=32, num_layers=2)\n(ma_emb, op_emb), init = encoder(td)\nprint(ma_emb.shape)\nprint(op_emb.shape)\n
encoder = HetGNNEncoder(embed_dim=32, num_layers=2) (ma_emb, op_emb), init = encoder(td) print(ma_emb.shape) print(op_emb.shape)
torch.Size([1, 60, 32])\ntorch.Size([1, 5, 32])\n

The decoder returns logits over a composite action space of size (1 + num_jobs * num_machines), where each entry corresponds to a machine-job combination, plus one entry for the waiting operation. The selected action specifies which job is processed next by which machine. To be more precise, the next operation of the selected job is processed. This operation can be retrieved from td[\"next_op\"].

In\u00a0[8]: Copied!
# next operation per job\ntd[\"next_op\"]\n
# next operation per job td[\"next_op\"] Out[8]:
tensor([[ 0,  4, 10, 15, 21, 27, 33, 39, 45, 49]])
In\u00a0[9]: Copied!
decoder = L2DDecoder(env_name=env.name, embed_dim=32)\nlogits, mask = decoder(td, (ma_emb, op_emb), num_starts=0)\n# (1 + num_jobs * num_machines)\nprint(logits.shape)\n
decoder = L2DDecoder(env_name=env.name, embed_dim=32) logits, mask = decoder(td, (ma_emb, op_emb), num_starts=0) # (1 + num_jobs * num_machines) print(logits.shape)
torch.Size([1, 51])\n
In\u00a0[10]: Copied!
def make_step(td):\n    logits, mask = decoder(td, (ma_emb, op_emb), num_starts=0)\n    action = logits.masked_fill(~mask, -torch.inf).argmax(1)\n    td[\"action\"] = action\n    td = env.step(td)[\"next\"]\n    return td\n
def make_step(td): logits, mask = decoder(td, (ma_emb, op_emb), num_starts=0) action = logits.masked_fill(~mask, -torch.inf).argmax(1) td[\"action\"] = action td = env.step(td)[\"next\"] return td In\u00a0[11]: Copied!
env.render(td, 0)\n# Update plot within a for loop\nwhile not td[\"done\"].all():\n    # Clear the previous output for the next iteration\n    clear_output(wait=True)\n\n    td = make_step(td)\n    env.render(td, 0)\n    # Display updated plot\n    display(plt.gcf())\n    \n    # Pause for a moment to see the changes\n    time.sleep(.4)\n
env.render(td, 0) # Update plot within a for loop while not td[\"done\"].all(): # Clear the previous output for the next iteration clear_output(wait=True) td = make_step(td) env.render(td, 0) # Display updated plot display(plt.gcf()) # Pause for a moment to see the changes time.sleep(.4)
<Figure size 640x480 with 0 Axes>
<Figure size 640x480 with 0 Axes>
<Figure size 640x480 with 0 Axes>
In\u00a0[12]: Copied!
if torch.cuda.is_available():\n    accelerator = \"gpu\"\n    batch_size = 256\n    train_data_size = 2_000\n    embed_dim = 128\n    num_encoder_layers = 4\nelse:\n    accelerator = \"cpu\"\n    batch_size = 32\n    train_data_size = 1_000\n    embed_dim = 64\n    num_encoder_layers = 2\n
if torch.cuda.is_available(): accelerator = \"gpu\" batch_size = 256 train_data_size = 2_000 embed_dim = 128 num_encoder_layers = 4 else: accelerator = \"cpu\" batch_size = 32 train_data_size = 1_000 embed_dim = 64 num_encoder_layers = 2 In\u00a0[13]: Copied!
# Policy: neural network, in this case with encoder-decoder architecture\npolicy = L2DPolicy(embed_dim=embed_dim, num_encoder_layers=num_encoder_layers, env_name=\"fjsp\")\n\n# Model: default is AM with REINFORCE and greedy rollout baseline\nmodel = L2DModel(env,\n                 policy=policy, \n                 baseline=\"rollout\",\n                 batch_size=batch_size,\n                 train_data_size=train_data_size,\n                 val_data_size=1_000,\n                 optimizer_kwargs={\"lr\": 1e-4})\n\ntrainer = RL4COTrainer(\n    max_epochs=3,\n    accelerator=accelerator,\n    devices=1,\n    logger=None,\n)\n\ntrainer.fit(model)\n
# Policy: neural network, in this case with encoder-decoder architecture policy = L2DPolicy(embed_dim=embed_dim, num_encoder_layers=num_encoder_layers, env_name=\"fjsp\") # Model: default is AM with REINFORCE and greedy rollout baseline model = L2DModel(env, policy=policy, baseline=\"rollout\", batch_size=batch_size, train_data_size=train_data_size, val_data_size=1_000, optimizer_kwargs={\"lr\": 1e-4}) trainer = RL4COTrainer( max_epochs=3, accelerator=accelerator, devices=1, logger=None, ) trainer.fit(model)
/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'env' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['env'])`.\n/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/utilities/parsing.py:198: Attribute 'policy' is an instance of `nn.Module` and is already saved during checkpointing. It is recommended to ignore them using `self.save_hyperparameters(ignore=['policy'])`.\n/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/trainer/connectors/accelerator_connector.py:551: You passed `Trainer(accelerator='cpu', precision='16-mixed')` but AMP with fp16 is not supported on CPU. Using `precision='bf16-mixed'` instead.\nUsing bfloat16 Automatic Mixed Precision (AMP)\nGPU available: False, used: False\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\n/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/trainer/connectors/logger_connector/logger_connector.py:67: Starting from v1.9.0, `tensorboardX` has been removed as a dependency of the `lightning.pytorch` package, due to potential conflicts with other packages in the ML ecosystem. For this reason, `logger=True` will use `CSVLogger` as the default logger, unless the `tensorboard` or `tensorboardX` packages are found. Please `pip install lightning[extra]` or one of them to enable TensorBoard support by default\nval_file not set. Generating dataset instead\ntest_file not set. 
Generating dataset instead\n\n  | Name     | Type           | Params\n--------------------------------------------\n0 | env      | FJSPEnv        | 0     \n1 | policy   | L2DPolicy      | 81.2 K\n2 | baseline | WarmupBaseline | 81.2 K\n--------------------------------------------\n162 K     Trainable params\n0         Non-trainable params\n162 K     Total params\n0.649     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'val_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=7` in the `DataLoader` to improve performance.\n/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/trainer/connectors/data_connector.py:441: The 'train_dataloader' does not have many workers which may be a bottleneck. Consider increasing the value of the `num_workers` argument` to `num_workers=7` in the `DataLoader` to improve performance.\n/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/loops/fit_loop.py:293: The number of training batches (32) is smaller than the logging interval Trainer(log_every_n_steps=50). Set a lower value for log_every_n_steps if you want to see logs for the training epoch.\n
Training: |          | 0/? [00:00<?, ?it/s]
/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/trainer/call.py:54: Detected KeyboardInterrupt, attempting graceful shutdown...\n
In\u00a0[14]: Copied!
import gc\nfrom rl4co.envs import JSSPEnv\nfrom rl4co.models.zoo.l2d.model import L2DPPOModel\nfrom rl4co.models.zoo.l2d.policy import L2DPolicy4PPO\nfrom torch.utils.data import DataLoader\n
import gc from rl4co.envs import JSSPEnv from rl4co.models.zoo.l2d.model import L2DPPOModel from rl4co.models.zoo.l2d.policy import L2DPolicy4PPO from torch.utils.data import DataLoader In\u00a0[15]: Copied!
# Lets generate a more complex instance\n\ngenerator_params = {\n  \"num_jobs\": 15,  # the total number of jobs\n  \"num_machines\": 15,  # the total number of machines that can process operations\n  \"min_processing_time\": 1,  # the minimum time required for a machine to process an operation\n  \"max_processing_time\": 99,  # the maximum time required for a machine to process an operation\n}\n\nenv = JSSPEnv(\n    generator_params=generator_params, \n    _torchrl_mode=True, \n    stepwise_reward=True\n)\n
# Lets generate a more complex instance generator_params = { \"num_jobs\": 15, # the total number of jobs \"num_machines\": 15, # the total number of machines that can process operations \"min_processing_time\": 1, # the minimum time required for a machine to process an operation \"max_processing_time\": 99, # the maximum time required for a machine to process an operation } env = JSSPEnv( generator_params=generator_params, _torchrl_mode=True, stepwise_reward=True ) In\u00a0[16]: Copied!
# Policy: neural network, in this case with encoder-decoder architecture\npolicy = L2DPolicy4PPO(\n    embed_dim=embed_dim, \n    num_encoder_layers=num_encoder_layers, \n    env_name=\"jssp\",\n    het_emb=False\n)\n\nmodel = L2DPPOModel(\n    env=env,\n    policy=policy,\n    batch_size=batch_size,\n    train_data_size=train_data_size,\n    val_data_size=1_000,\n    optimizer_kwargs={\"lr\": 1e-4}\n)\n
# Policy: neural network, in this case with encoder-decoder architecture policy = L2DPolicy4PPO( embed_dim=embed_dim, num_encoder_layers=num_encoder_layers, env_name=\"jssp\", het_emb=False ) model = L2DPPOModel( env=env, policy=policy, batch_size=batch_size, train_data_size=train_data_size, val_data_size=1_000, optimizer_kwargs={\"lr\": 1e-4} ) In\u00a0[17]: Copied!
CHECKPOINT_PATH = \"last.ckpt\"\ndevice = \"cuda\" if torch.cuda.is_available() else \"cpu\"\ntry:\n    model = L2DPPOModel.load_from_checkpoint(CHECKPOINT_PATH)\nexcept FileNotFoundError:\n\n    trainer = RL4COTrainer(\n        max_epochs=1,\n        accelerator=accelerator,\n        devices=1,\n        logger=None,\n    )\n\n    trainer.fit(model)\nfinally:\n    model = model.to(device)\n
CHECKPOINT_PATH = \"last.ckpt\" device = \"cuda\" if torch.cuda.is_available() else \"cpu\" try: model = L2DPPOModel.load_from_checkpoint(CHECKPOINT_PATH) except FileNotFoundError: trainer = RL4COTrainer( max_epochs=1, accelerator=accelerator, devices=1, logger=None, ) trainer.fit(model) finally: model = model.to(device)
Using bfloat16 Automatic Mixed Precision (AMP)\nGPU available: False, used: False\nTPU available: False, using: 0 TPU cores\nIPU available: False, using: 0 IPUs\nHPU available: False, using: 0 HPUs\nOverriding gradient_clip_val to None for 'automatic_optimization=False' models\n/Users/luttmann/opt/miniconda3/envs/rl4co/lib/python3.9/site-packages/lightning/pytorch/utilities/parsing.py:43: attribute 'policy' removed from hparams because it cannot be pickled\nval_file not set. Generating dataset instead\ntest_file not set. Generating dataset instead\n\n  | Name       | Type          | Params\n---------------------------------------------\n0 | env        | JSSPEnv       | 0     \n1 | policy     | L2DPolicy4PPO | 25.5 K\n2 | policy_old | L2DPolicy4PPO | 25.5 K\n---------------------------------------------\n51.1 K    Trainable params\n0         Non-trainable params\n51.1 K    Total params\n0.204     Total estimated model params size (MB)\n
Sanity Checking: |          | 0/? [00:00<?, ?it/s]
Training: |          | 0/? [00:00<?, ?it/s]
In\u00a0[8]: Copied!
%%bash\n\n# Define the folder path\nDATA_PATH=\"./taillard\"\n\n# Check if the folder exists\nif [ -d \"$DATA_PATH\" ]; then\n    echo \"Folder already exists.\"\nelse\n    echo \"Folder does not exist. Creating folder and downloading taillard instances...\"\n    mkdir -p \"$DATA_PATH\"\n    ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai20_15.txt -O taillard/tai20_15.txt\n    ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai15_15.txt -O taillard/tai15_15.txt\n    ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai20_20.txt -O taillard/tai20_20.txt\n    ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai30_15.txt -O taillard/tai30_15.txt\n    ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai30_20.txt -O taillard/tai30_20.txt\nfi\n\nexit 0\n
%%bash # Define the folder path DATA_PATH=\"./taillard\" # Check if the folder exists if [ -d \"$DATA_PATH\" ]; then echo \"Folder already exists.\" else echo \"Folder does not exist. Creating folder and downloading taillard instances...\" mkdir -p \"$DATA_PATH\" ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai20_15.txt -O taillard/tai20_15.txt ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai15_15.txt -O taillard/tai15_15.txt ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai20_20.txt -O taillard/tai20_20.txt ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai30_15.txt -O taillard/tai30_15.txt ! wget http://mistic.heig-vd.ch/taillard/problemes.dir/ordonnancement.dir/jobshop.dir/tai30_20.txt -O taillard/tai30_20.txt fi exit 0
Folder does not exist. Creating folder and downloading taillard instances...\n
bash: line 11: wget: command not found\nbash: line 12: wget: command not found\nbash: line 13: wget: command not found\nbash: line 14: wget: command not found\nbash: line 15: wget: command not found\n
In\u00a0[18]: Copied!
# path to taillard instances\nFILE_PATH = \"./taillard/tai{instance_type}.txt\"\n\nresults = {}\ninstance_types = [\"15_15\", \"20_15\", \"20_20\", \"30_15\", \"30_20\"]\n\nfor instance_type in instance_types:\n    \n    dataset = env.dataset(batch_size=[10], phase=\"test\", filename=FILE_PATH.format(instance_type=instance_type))\n    dl = DataLoader(dataset, batch_size=5, collate_fn=dataset.collate_fn)\n    rewards = []\n    \n    for batch in dl:\n        td = env.reset(batch).to(device)\n        # use policy.generate to avoid grad calculations which can lead to oom \n        out = model.policy.generate(td, env=env, phase=\"test\", decode_type=\"multistart_sampling\", num_starts=100, select_best=True)\n        rewards.append(out[\"reward\"])\n\n    reward = torch.cat(rewards, dim=0).mean().item()\n    results[instance_type] = reward\n\n    print(\"Done evaluating instance type %s with reward %s\" % (instance_type, reward))\n\n    # avoid ooms due to cache not being cleared \n    model.rb.empty()\n    gc.collect()\n    torch.cuda.empty_cache()\n
# path to taillard instances FILE_PATH = \"./taillard/tai{instance_type}.txt\" results = {} instance_types = [\"15_15\", \"20_15\", \"20_20\", \"30_15\", \"30_20\"] for instance_type in instance_types: dataset = env.dataset(batch_size=[10], phase=\"test\", filename=FILE_PATH.format(instance_type=instance_type)) dl = DataLoader(dataset, batch_size=5, collate_fn=dataset.collate_fn) rewards = [] for batch in dl: td = env.reset(batch).to(device) # use policy.generate to avoid grad calculations which can lead to oom out = model.policy.generate(td, env=env, phase=\"test\", decode_type=\"multistart_sampling\", num_starts=100, select_best=True) rewards.append(out[\"reward\"]) reward = torch.cat(rewards, dim=0).mean().item() results[instance_type] = reward print(\"Done evaluating instance type %s with reward %s\" % (instance_type, reward)) # avoid ooms due to cache not being cleared model.rb.empty() gc.collect() torch.cuda.empty_cache()
Provided file name ../../ai4co/rl4co/data/jssp/taillard/15j_15m not found. Make sure to provide a file in the right path first or unset test_file to generate data automatically instead\n
Done evaluating instance type 15j_15m with reward -1408.0999755859375\n
Provided file name ../../ai4co/rl4co/data/jssp/taillard/20j_15m not found. Make sure to provide a file in the right path first or unset test_file to generate data automatically instead\nProvided file name ../../ai4co/rl4co/data/jssp/taillard/20j_20m not found. Make sure to provide a file in the right path first or unset test_file to generate data automatically instead\n
Done evaluating instance type 20j_15m with reward -1380.699951171875\n
Provided file name ../../ai4co/rl4co/data/jssp/taillard/30j_15m not found. Make sure to provide a file in the right path first or unset test_file to generate data automatically instead\n
Done evaluating instance type 20j_20m with reward -1349.9000244140625\n
Provided file name ../../ai4co/rl4co/data/jssp/taillard/30j_20m not found. Make sure to provide a file in the right path first or unset test_file to generate data automatically instead\n
Done evaluating instance type 30j_15m with reward -1374.0999755859375\nDone evaluating instance type 30j_20m with reward -1371.699951171875\n
"},{"location":"examples/other/2-scheduling/#solving-the-flexible-job-shop-scheduling-problem-fjsp","title":"Solving the Flexible Job-Shop Scheduling Problem (FJSP)\u00b6","text":"

The following notebook introduces the FJSP and explains the solution construction process using an encoder-decoder architecture based on a Heterogeneous Graph Neural Network (HetGNN).

"},{"location":"examples/other/2-scheduling/#visualize-the-problem","title":"Visualize the Problem\u00b6","text":"

Below we visualize the generated instance of the FJSP. Blue nodes correspond to machines, red nodes to operations and yellow nodes to jobs. A machine may process an operation if there exists an edge between the two.

The thickness of the connection between a machine and an operation node specifies the processing time the respective machine needs to process the operation (thicker line := longer processing).

Each operation belongs to exactly one job, where an edge between a job and an operation node indicates that the respective operation belongs to the job. The number above an operation-job edge specifies the precedence-order in which the operations of a job need to be processed. A job is done when all operations belonging to it are scheduled. The instance is solved when all jobs are fully scheduled.

Also note that some operation nodes are not connected. These operation nodes are padded, so that all instances in a batch have the same number of operations (where we determine the maximum number of operations as num_jobs * max_ops_per_job).

"},{"location":"examples/other/2-scheduling/#build-a-model-to-solve-the-fjsp","title":"Build a Model to Solve the FJSP\u00b6","text":"

In the FJSP we typically encode operations and machines separately, since they are different node types in a k-partite graph. Therefore, the encoder for the FJSP returns two hidden representations, the first containing machine embeddings and the second containing operation embeddings:

"},{"location":"examples/other/2-scheduling/#visualize-solution-construction","title":"Visualize solution construction\u00b6","text":"

Starting at $t=0$, the decoder uses the machine-operation embeddings of the encoder to decide which machine-job combination to schedule next. Note that, due to the precedence relationship, the operations to be scheduled next are fixed per job. Therefore, it is sufficient to determine the next job to be scheduled, which significantly reduces the action space.

After some operations have been scheduled, either all the machines are busy or all the jobs have been scheduled with their currently active operation. In this case, the environment transitions to a new time step $t$. The new $t$ will be equal to the first time step where a machine finishes an operation in the partial schedule. When an operation is finished, the machine that has processed it is immediately ready to process the next operation. Also, the next operation of the respective job can then be scheduled.

The start time of an operation is always equal to the time step in which it is scheduled. The finish time of an operation is equal to its start time plus the processing time required by the machine on which it is being processed.

The figure below visualises this process.

"},{"location":"examples/other/2-scheduling/#solving-the-job-shop-scheduling-problem-jssp","title":"Solving the Job-Shop Scheduling Problem (JSSP)\u00b6","text":""},{"location":"examples/other/2-scheduling/#train-on-synthetic-data-and-test-on-taillard-benchmark","title":"Train on synthetic data and test on Taillard benchmark\u00b6","text":""},{"location":"examples/other/3-data-generator-distributions/","title":"Generating data in RL4CO","text":"In\u00a0[1]: Copied!
import matplotlib.pyplot as plt\nfrom rl4co.envs.routing import TSPEnv, TSPGenerator\nfrom rl4co.envs.common.distribution_utils import Cluster, Mix_Distribution, Mix_Multi_Distributions, Gaussian_Mixture, Mixed\n\n# Instantiate the environment and generator\ngenerator = TSPGenerator(num_loc=100)\nenv = TSPEnv(generator=generator)\n\n# Simple plot\nfig, axs = plt.subplots(1, 3, figsize=(10, 3))\ntd = env.generator(3) # generate 3 instances\nfor i in range(3):\n    axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n    axs[i].set_xticks([]); axs[i].set_yticks([])\nfig.suptitle(\"TSP with 100 locations, uniform distribution\")\n
import matplotlib.pyplot as plt from rl4co.envs.routing import TSPEnv, TSPGenerator from rl4co.envs.common.distribution_utils import Cluster, Mix_Distribution, Mix_Multi_Distributions, Gaussian_Mixture, Mixed # Instantiate the environment and generator generator = TSPGenerator(num_loc=100) env = TSPEnv(generator=generator) # Simple plot fig, axs = plt.subplots(1, 3, figsize=(10, 3)) td = env.generator(3) # generate 3 instances for i in range(3): axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1]) axs[i].set_xticks([]); axs[i].set_yticks([]) fig.suptitle(\"TSP with 100 locations, uniform distribution\")
/home/botu/anaconda3/envs/rl4co/lib/python3.11/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n  from .autonotebook import tqdm as notebook_tqdm\n
Out[1]:
Text(0.5, 0.98, 'TSP with 100 locations, uniform distribution')

Generating data with different sizes

In\u00a0[2]: Copied!
generator = TSPGenerator(num_loc=1000)\nenv.generator = generator\n\nfig, axs = plt.subplots(1, 3, figsize=(10, 3))\ntd = env.generator(3) # generate 3 instances\nfor i in range(3):\n    axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n    axs[i].set_xticks([]); axs[i].set_yticks([])\nfig.suptitle(\"TSP with 1000 locations, uniform distribution\")\n
generator = TSPGenerator(num_loc=1000) env.generator = generator fig, axs = plt.subplots(1, 3, figsize=(10, 3)) td = env.generator(3) # generate 3 instances for i in range(3): axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1]) axs[i].set_xticks([]); axs[i].set_yticks([]) fig.suptitle(\"TSP with 1000 locations, uniform distribution\") Out[2]:
Text(0.5, 0.98, 'TSP with 1000 locations, uniform distribution')

Changing the distribution of the data to a normal distribution. We can select it by passing the distribution name as loc_distribution, and pass its keyword arguments with the loc_ prefix, here the mean and std of the normal distribution.

In\u00a0[3]: Copied!
generator = TSPGenerator(num_loc=100, loc_distribution=\"normal\", loc_mean=0, loc_std=1)\nenv.generator = generator\n\nfig, axs = plt.subplots(1, 3, figsize=(10, 3))\ntd = env.generator(3) # generate 3 instances\nfor i in range(3):\n    axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n    axs[i].set_xticks([]); axs[i].set_yticks([])\nfig.suptitle(\"TSP with 100 locations, normal distribution\")\n
generator = TSPGenerator(num_loc=100, loc_distribution=\"normal\", loc_mean=0, loc_std=1) env.generator = generator fig, axs = plt.subplots(1, 3, figsize=(10, 3)) td = env.generator(3) # generate 3 instances for i in range(3): axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1]) axs[i].set_xticks([]); axs[i].set_yticks([]) fig.suptitle(\"TSP with 100 locations, normal distribution\") Out[3]:
Text(0.5, 0.98, 'TSP with 100 locations, normal distribution')

We can pass a custom loc_sampler to the generator (we can make it ourselves!) to generate data from a custom distribution. In this case we use the mixture of three exemplar distributions in batch-level, i.e. Uniform, Cluster, Mixed following the setting in Bi et al. 2022 (https://arxiv.org/abs/2210.07686)

In\u00a0[4]: Copied!
loc_sampler = Mix_Distribution(n_cluster=3)\ngenerator = TSPGenerator(num_loc=200, loc_sampler=loc_sampler)\nenv.generator = generator\n\nfig, axs = plt.subplots(1, 3, figsize=(10, 3))\ntd = env.generator(3) # generate 3 instances\nfor i in range(3):\n    axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1])\n    axs[i].set_xticks([]); axs[i].set_yticks([])\nfig.suptitle(\"TSP with 200 locations, mixed distribution\")\n
loc_sampler = Mix_Distribution(n_cluster=3) generator = TSPGenerator(num_loc=200, loc_sampler=loc_sampler) env.generator = generator fig, axs = plt.subplots(1, 3, figsize=(10, 3)) td = env.generator(3) # generate 3 instances for i in range(3): axs[i].scatter(td[\"locs\"][i][:, 0], td[\"locs\"][i][:, 1]) axs[i].set_xticks([]); axs[i].set_yticks([]) fig.suptitle(\"TSP with 200 locations, mixed distribution\") Out[4]:
Text(0.5, 0.98, 'TSP with 200 locations, mixed distribution')
In\u00a0[5]: Copied!
from rl4co.envs.graph import MCPEnv, MCPGenerator\nfrom matplotlib import pyplot as plt\nimport torch\nfrom collections import Counter\n\ngenerator = MCPGenerator(size_distribution=\"uniform\", weight_distribution=\"uniform\")\nenv = MCPEnv(generator=generator)\ndata = env.generator(100)\n\nsizes = torch.count_nonzero(data[\"membership\"], dim=-1).flatten().tolist()\nsize2cnt = Counter(sizes)\nweights = data[\"weights\"].flatten().tolist()\nweight2cnt = Counter(weights)\n\n# plot the size distributions and the weight distributions\nplt.figure()\nplt.bar(size2cnt.keys(), size2cnt.values())\nplt.title(\"Size distribution\")\nplt.xlabel(\"Size\")\nplt.ylabel(\"Probability\")\nplt.show()\n\n# Note: the size distributions are not perfectly uniform since there might be repeated items and are removed in post-processing\n\nplt.figure()\nplt.bar(weight2cnt.keys(), weight2cnt.values())\nplt.title(\"Weight distribution\")\nplt.xlabel(\"Weight\")\nplt.ylabel(\"Probability\")\nplt.show()\n
from rl4co.envs.graph import MCPEnv, MCPGenerator from matplotlib import pyplot as plt import torch from collections import Counter generator = MCPGenerator(size_distribution=\"uniform\", weight_distribution=\"uniform\") env = MCPEnv(generator=generator) data = env.generator(100) sizes = torch.count_nonzero(data[\"membership\"], dim=-1).flatten().tolist() size2cnt = Counter(sizes) weights = data[\"weights\"].flatten().tolist() weight2cnt = Counter(weights) # plot the size distributions and the weight distributions plt.figure() plt.bar(size2cnt.keys(), size2cnt.values()) plt.title(\"Size distribution\") plt.xlabel(\"Size\") plt.ylabel(\"Probability\") plt.show() # Note: the size distributions are not perfectly uniform since there might be repeated items and are removed in post-processing plt.figure() plt.bar(weight2cnt.keys(), weight2cnt.values()) plt.title(\"Weight distribution\") plt.xlabel(\"Weight\") plt.ylabel(\"Probability\") plt.show()

We can also pass a custom sampler to generate data:

In\u00a0[6]: Copied!
from collections import Counter\nfrom torch.distributions import Normal\n\nsize_sampler = Normal(10, 2)\nweight_sampler = Normal(5, 1)\n\ngenerator = MCPGenerator(size_sampler=size_sampler, weight_sampler=weight_sampler)\nenv = MCPEnv(generator=generator)\ndata = env.generator(100)\n\nsizes = torch.count_nonzero(data[\"membership\"], dim=-1).flatten().tolist()\nsize2cnt = Counter(sizes)\nweights = data[\"weights\"].flatten().tolist()\nweight2cnt = Counter(weights)\n\n# plot the size distributions and the weight distributions\nplt.figure()\nplt.bar(size2cnt.keys(), size2cnt.values())\nplt.title(\"Size distribution\")\nplt.xlabel(\"Size\")\nplt.ylabel(\"Probability\")\nplt.show()\n\nplt.figure()\nplt.bar(weight2cnt.keys(), weight2cnt.values())\nplt.title(\"Weight distribution\")\nplt.xlabel(\"Weight\")\nplt.ylabel(\"Probability\")\nplt.show()\n
from collections import Counter from torch.distributions import Normal size_sampler = Normal(10, 2) weight_sampler = Normal(5, 1) generator = MCPGenerator(size_sampler=size_sampler, weight_sampler=weight_sampler) env = MCPEnv(generator=generator) data = env.generator(100) sizes = torch.count_nonzero(data[\"membership\"], dim=-1).flatten().tolist() size2cnt = Counter(sizes) weights = data[\"weights\"].flatten().tolist() weight2cnt = Counter(weights) # plot the size distributions and the weight distributions plt.figure() plt.bar(size2cnt.keys(), size2cnt.values()) plt.title(\"Size distribution\") plt.xlabel(\"Size\") plt.ylabel(\"Probability\") plt.show() plt.figure() plt.bar(weight2cnt.keys(), weight2cnt.values()) plt.title(\"Weight distribution\") plt.xlabel(\"Weight\") plt.ylabel(\"Probability\") plt.show()

Tl;dr: RL4CO allows for easily generating data for CO problems! \ud83d\ude80

"},{"location":"examples/other/3-data-generator-distributions/#generating-data-in-rl4co","title":"Generating data in RL4CO\u00b6","text":"

RL4CO allows for easily generating data from different distributions for CO problems

"},{"location":"examples/other/3-data-generator-distributions/#generating-different-distributions-for-tsp","title":"Generating different distributions for TSP\u00b6","text":""},{"location":"examples/other/3-data-generator-distributions/#generating-different-distributions-for-mcp","title":"Generating different distributions for MCP\u00b6","text":"

Here we visualize the different weight and size distributions for MCP by passing the distribution name, which is automatically parsed:

"},{"location":"rl4co/tasks/","title":"Evaluation","text":"

To evaluate your trained model, here are some steps to follow:

Step 1. Prepare your pre-trained model checkpoint and test instances data file. Put them in your preferred place. e.g., we will test the AttentionModel on TSP50:

.\n\u251c\u2500\u2500 rl4co/\n\u2502   \u2514\u2500\u2500 ...\n\u251c\u2500\u2500 checkpoints/\n\u2502   \u2514\u2500\u2500 am-tsp50.ckpt\n\u2514\u2500\u2500 data/\n    \u2514\u2500\u2500 tsp/\n        \u2514\u2500\u2500 tsp50_test_seed1234.npz\n

You can generate the test instances data file by running the following command:

python -c \"from rl4co.data.generate_data import generate_default_datasets; generate_default_datasets('data')\"\n

Step 2. Run the eval.py with your customized setting. e.g., let's use the sampling method with a top_p=0.95 sampling strategy:

python rl4co/tasks/eval.py --problem tsp --data-path data/tsp/tsp50_test_seed1234.npz --model AttentionModel --ckpt-path checkpoints/am-tsp50.ckpt --method sampling --top-p 0.95\n

Arguments guideline:

  • --problem: the problem name, e.g., tsp, cvrp, pdp, etc. This should be consistent with the env.name. Default is tsp.
  • --generator-params: the generator parameters for the test instances. You could specify the num_loc etc. Default is {'num_loc': 50}.
  • --data-path: the path to the test instances data file. Default is data/tsp/tsp50_test_seed1234.npz.
  • --model: the model class name, e.g., AttentionModel, POMO, SymNCO, etc. It will be dynamically imported and instantiated. Default is AttentionModel.
  • --ckpt-path: the path to the pre-trained model checkpoint. Default is checkpoints/am-tsp50.ckpt.
  • --device: the device to run the evaluation, e.g., cuda:0, cpu, etc. Default is cuda:0.
  • --method: the evaluation method, e.g., greedy, sampling, multistart_greedy, augment_dihedral_8, augment, multistart_greedy_augment_dihedral_8, and multistart_greedy_augment. Default is greedy.
  • --save-results: whether to save the evaluation results as a .pkl file. Default is True. The results include actions, rewards, inference_time, and avg_reward.
  • --save-path: the path to save the evaluation results. Default is results/.
  • --num-instances: the number of test instances to evaluate. Default is 1000.

If you use the sampling method, you may need to specify the following parameters:

  • --samples: the number of samples for the sampling method. Default is 1280.
  • --temperature: the temperature for the sampling method. Default is 1.0.
  • --top-p: the top-p for the sampling method. Default is 0.0, i.e. not activated.
  • --top-k: the top-k for the sampling method. Default is 0, i.e. not activated.
  • --select-best: whether to select the best action from the sampling results. If False, the results will include all sampled rewards, i.e., [num_instances * num_samples].

If you use the augment method, you may need to specify the following parameters:

  • --num-augments: the number of augmented instances for the augment method. Default is 8.
  • --force-dihedral-8: whether to force the augmented instances to be dihedral 8. Default is True.

Step 3. If you want to launch several evaluations with various parameters, you may refer to the following examples:

  • Evaluate POMO on TSP50 with a sampling of different Top-p and temperature:
        #!/bin/bash\n\n    top_p_list=(0.5 0.6 0.7 0.8 0.9 0.95 0.98 0.99 0.995 1.0)\n    temp_list=(0.1 0.3 0.5 0.7 0.8 0.9 1.0 1.1 1.2 1.5 1.8 2.0 2.2 2.5 2.8 3.0)\n\n    device=cuda:0\n\n    problem=tsp\n    model=POMO\n    ckpt_path=checkpoints/pomo-tsp50.ckpt\n    data_path=data/tsp/tsp50_test_seed1234.npz\n\n    num_instances=1000\n    save_path=results/tsp50-pomo-topp-1k\n\n    for top_p in ${top_p_list[@]}; do\n        for temp in ${temp_list[@]}; do\n            python rl4co/tasks/eval.py --problem ${problem} --model ${model} --ckpt_path ${ckpt_path} --data_path ${data_path} --save_path ${save_path} --method sampling --temperature=${temp} --top_p=${top_p} --top_k=0 --device ${device}\n        done\n    done\n
  • Evaluate POMO on CVRP50 with a sampling of different Top-k and temperature:
        #!/bin/bash\n\n    top_k_list=(5 10 15 20 25)\n    temp_list=(0.1 0.3 0.5 0.7 0.8 0.9 1.0 1.1 1.2 1.5 1.8 2.0 2.2 2.5 2.8 3.0)\n\n    device=cuda:1\n\n    problem=cvrp\n    model=POMO\n    ckpt_path=checkpoints/pomo-cvrp50.ckpt\n    data_path=data/vrp/vrp50_test_seed1234.npz\n\n    num_instances=1000\n    save_path=results/cvrp50-pomo-topk-1k\n\n    for top_k in ${top_k_list[@]}; do\n        for temp in ${temp_list[@]}; do\n            python rl4co/tasks/eval.py --problem ${problem} --model ${model} --ckpt_path ${ckpt_path} --data_path ${data_path} --save_path ${save_path} --method sampling --temperature=${temp} --top_p=0.0 --top_k=${top_k} --device ${device}\n        done\n    done\n
"}]} \ No newline at end of file diff --git a/sitemap.xml b/sitemap.xml new file mode 100644 index 00000000..a5b91c03 --- /dev/null +++ b/sitemap.xml @@ -0,0 +1,223 @@ + + + + https://ai4co.github.io/rl4co/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/README_backup/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/data/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/decoding/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/tasks/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/train_and_eval/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/envs/base/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/envs/eda/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/envs/graph/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/envs/routing/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/envs/scheduling/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/networks/base_policies/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/networks/env_embeddings/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/networks/improvement_policies/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/networks/nn/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/rl/a2c/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/rl/base/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/rl/ppo/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/rl/reinforce/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/zoo/constructive_ar/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/zoo/constructive_nar/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/api/zoo/improvement/ + 2024-10-24 + + + 
https://ai4co.github.io/rl4co/docs/content/api/zoo/transductive/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/general/ai4co/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/general/contribute/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/general/faq/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/general/licensing/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/general/paper/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/intro/environments/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/intro/intro/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/intro/policies/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/intro/rl/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/start/hydra/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/docs/content/start/installation/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/1-quickstart/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/2-full-training/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/3-creating-new-env-model/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/advanced/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/advanced/1-hydra-config/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/advanced/2-flash-attention-2/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/advanced/3-local-search/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/datasets/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/datasets/1-test-on-tsplib/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/datasets/2-test-on-cvrplib/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/modeling/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/modeling/1-decoding-strategies/ + 2024-10-24 + + + 
https://ai4co.github.io/rl4co/examples/modeling/2-transductive-methods/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/modeling/3-change-encoder/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/other/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/other/1-mtvrp/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/other/2-scheduling/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/examples/other/3-data-generator-distributions/ + 2024-10-24 + + + https://ai4co.github.io/rl4co/rl4co/tasks/ + 2024-10-24 + + \ No newline at end of file diff --git a/sitemap.xml.gz b/sitemap.xml.gz new file mode 100644 index 0000000000000000000000000000000000000000..0298466bc6de5eceb9952a08a548cd6dc381fd12 GIT binary patch literal 678 zcmV;X0$KeZiwFn+ju~eH|8r?{Wo=<_E_iKh0L_`bZrd;rfcHFw;r&cY$ z+h)K1`Qs~mSU(=_c7r#8coiqxuwS>#{U;%=*Xt%|rVjhCalR2jws8=|>rJuUd|V&y zR`Ey+%vaN~Gfp1TDj_a|`a!x)qq!YU8|{QQaV&Ns&3XR_2JW0X)Z6+2sx8zHamwqx zS%z4I{JXgCPoKYhdpe#_UWWeG!j+RDi%jV(lVyRu777{jL(pt{*+Ce?CI35NkJ=v5 zsw0hPvg42)gE(QJGDt{a86b_vzAXdAyMasap9v=A12vcucr5YN`O9p+$KDw&HHC7p zqP~vQok*qVR}h!(dhbT+;vWTS&D!iN-UzH^2^d8L=E%|at^^EE+Mb=4`E~N!xik*! 
z2g!P*Bl_}~Y#~tZ0!|S;u>`Y0%}UA&)Q}|~i@<4W5hQ8s^=aTT6m!PsA~<4_BpY%U zJ#REU_LSGNb+i(f3LNd7O@18;z?skaIf|&MW)z>d!3>O^Mf*#6EPzAD)QH9)Yj^V+ zlU}gv&FyVskz2v@pyg%OL@tOL&Vw;9ZGmJ6rVGbCNKcrWYOr*L7{?$=Ad?LU)reM- z$`4S%&X|!FtQy`oWY7_}P8GlvvqX!wA(+0N z-M->ph#a@srB~2#bfnA_HRRiW{tM+EQmlcwCu8S9=`gp>F-hIrdgt?he&L#aV)Q)x M0Y$I!Ekhmv0N6fFxc~qF literal 0 HcmV?d00001 diff --git a/tests/__init__.py b/tests/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/tests/test_envs.py b/tests/test_envs.py new file mode 100644 index 00000000..aa83d583 --- /dev/null +++ b/tests/test_envs.py @@ -0,0 +1,157 @@ +import warnings + +import matplotlib.pyplot as plt +import pytest +import torch + +from tensordict import TensorDict + +from rl4co.envs import ( + ATSPEnv, + CVRPEnv, + CVRPTWEnv, + DPPEnv, + FFSPEnv, + FJSPEnv, + JSSPEnv, + MDCPDPEnv, + MDPPEnv, + MTSPEnv, + MTVRPEnv, + OPEnv, + PCTSPEnv, + PDPEnv, + SDVRPEnv, + SMTWTPEnv, + SPCTSPEnv, + SVRPEnv, + TSPEnv, + FLPEnv, + MCPEnv, +) +from rl4co.utils.decoding import random_policy, rollout + +# Switch to non-GUI backend for testing +plt.switch_backend("Agg") +warnings.filterwarnings("ignore", "Matplotlib is currently using agg") + + +@pytest.mark.parametrize( + "env_cls", + [ + TSPEnv, + CVRPEnv, + CVRPTWEnv, + SVRPEnv, + SDVRPEnv, + PCTSPEnv, + SPCTSPEnv, + OPEnv, + PDPEnv, + MTSPEnv, + ATSPEnv, + MDCPDPEnv, + ], +) +def test_routing(env_cls, batch_size=2, size=20): + env = env_cls(generator_params=dict(num_loc=size)) + reward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy) + assert reward.shape == (batch_size,) + + +@pytest.mark.parametrize( + "variant", + [ + "all", + "cvrp", + "ovrp", + "vrpb", + "vrpl", + "vrptw", + "ovrptw", + "ovrpb", + "ovrpl", + "vrpbl", + "vrpbtw", + "vrpltw", + "ovrpbl", + "ovrpltw", + "vrpltw", + "ovrpbltw", + ], +) +def test_mtvrp(variant, batch_size=2, size=20): + env = MTVRPEnv(generator_params=dict(num_loc=size, variant_preset=variant)) + reward, td, actions = 
rollout(env, env.reset(batch_size=[batch_size]), random_policy) + assert reward.shape == (batch_size,) + + +@pytest.mark.parametrize("env_cls", [DPPEnv, MDPPEnv]) +def test_eda(env_cls, batch_size=2, max_decaps=5): + env = env_cls(max_decaps=max_decaps) + reward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy) + assert reward.shape == (batch_size,) + + +@pytest.mark.parametrize("env_cls", [FFSPEnv, FJSPEnv, JSSPEnv]) +@pytest.mark.parametrize("mask_no_ops", [True, False]) +def test_scheduling(env_cls, mask_no_ops, batch_size=2): + env = env_cls() + reward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy) + assert reward.shape == (batch_size,) + + +@pytest.mark.parametrize("env_cls", [SMTWTPEnv]) +def test_smtwtp(env_cls, batch_size=2): + env = env_cls(num_job=4) + reward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy) + assert reward.shape == (batch_size,) + + +@pytest.mark.parametrize("env_cls", [JSSPEnv]) +def test_jssp_lb(env_cls): + env = env_cls(generator_params={"num_jobs": 2, "num_machines": 2}) + td = TensorDict( + { + "proc_times": torch.tensor( + [[[1, 0, 0, 4], [0, 2, 3, 0]]], dtype=torch.float32 + ), + "start_op_per_job": torch.tensor([[0, 2]], dtype=torch.long), + "end_op_per_job": torch.tensor([[1, 3]], dtype=torch.long), + "pad_mask": torch.tensor([[0, 0, 0, 0]], dtype=torch.bool), + }, + batch_size=[1], + ) + + td = env.reset(td) + + actions = [0, 1, 1] + for action in actions: + # NOTE add 1 to account for dummy action (waiting) + td.set("action", torch.tensor([action + 1], dtype=torch.long)) + td = env.step(td)["next"] + + lb_expected = torch.tensor([[1, 5, 3, 7]], dtype=torch.float32) + assert torch.allclose(td["lbs"], lb_expected) + + +@pytest.mark.parametrize("env_cls", [FLPEnv, MCPEnv]) +def test_flp_mcp(env_cls, batch_size=2): + env = env_cls() + reward, td, actions = rollout(env, env.reset(batch_size=[batch_size]), random_policy) + assert reward.shape 
== (batch_size,) + + +def test_scheduling_dataloader(): + from tempfile import TemporaryDirectory + + from rl4co.envs.scheduling.fjsp.parser import write + + write_env = FJSPEnv() + + td = write_env.reset(batch_size=[2]) + with TemporaryDirectory() as tmpdirname: + write(tmpdirname, td) + read_env = FJSPEnv(generator_params={"file_path": tmpdirname}) + td = read_env.reset(batch_size=2) + assert td.size(0) == 2 diff --git a/tests/test_policy.py b/tests/test_policy.py new file mode 100644 index 00000000..6b2c21ab --- /dev/null +++ b/tests/test_policy.py @@ -0,0 +1,88 @@ +import pytest + +from rl4co.models import AttentionModelPolicy, N2SPolicy, PointerNetworkPolicy +from rl4co.utils.ops import select_start_nodes +from rl4co.utils.test_utils import generate_env_data + + +# Main autorergressive policy: rollout over multiple envs since it is the base +@pytest.mark.parametrize( + "env_name", + [ + "tsp", + "cvrp", + "cvrptw", + "sdvrp", + "mtsp", + "op", + "pctsp", + "spctsp", + "dpp", + "mdpp", + "smtwtp", + ], +) +def test_am_policy(env_name, size=20, batch_size=2): + env, x = generate_env_data(env_name, size, batch_size) + td = env.reset(x) + policy = AttentionModelPolicy(env_name=env.name) + out = policy(td, env, decode_type="greedy") + assert out["reward"].shape == (batch_size,) + + +@pytest.mark.parametrize( + "env_name", ["tsp", "cvrp", "cvrptw", "pctsp", "spctsp", "sdvrp", "op", "pdp"] +) +@pytest.mark.parametrize("policy_cls", [AttentionModelPolicy]) +def test_policy_multistart(env_name, policy_cls, size=20, batch_size=2): + env, x = generate_env_data(env_name, size, batch_size) + td = env.reset(x) + policy = policy_cls(env_name=env.name) + num_starts = size // 2 if env.name in ["pdp"] else size + out = policy( + td, + env, + decode_type="multistart_greedy", + num_starts=num_starts, + select_start_nodes_fn=select_start_nodes, + ) + assert out["reward"].shape == ( + batch_size * num_starts, + ) # to evaluate, we could just unbatchify + + 
+@pytest.mark.parametrize( + "env_name", + ["tsp", "cvrp", "cvrptw", "pctsp", "spctsp", "sdvrp", "op", "pdp"], +) +@pytest.mark.parametrize("select_best", [True, False]) +def test_beam_search(env_name, select_best, size=20, batch_size=2): + env, x = generate_env_data(env_name, size, batch_size) + td = env.reset(x) + policy = AttentionModelPolicy(env_name=env.name) + beam_width = size // 2 if env.name in ["pdp"] else size + out = policy( + td, env, decode_type="beam_search", beam_width=beam_width, select_best=select_best + ) + + if select_best: + expected_shape = (batch_size,) + else: + expected_shape = (batch_size * beam_width,) + assert out["reward"].shape == expected_shape + + +def test_pointer_network(size=20, batch_size=2): + env, x = generate_env_data("tsp", size, batch_size) + td = env.reset(x) + policy = PointerNetworkPolicy(env_name=env.name) + out = policy(td, env, decode_type="greedy") + assert out["reward"].shape == (batch_size,) + + +def test_N2S(size=20, batch_size=2): + env, x = generate_env_data("pdp_ruin_repair", size, batch_size) + td = env.reset(x) + policy = N2SPolicy(env_name=env.name) + out = policy(td, env, decode_type="greedy") + assert out["cost_bsf"].shape == (batch_size,) diff --git a/tests/test_tasks.py b/tests/test_tasks.py new file mode 100644 index 00000000..385f7734 --- /dev/null +++ b/tests/test_tasks.py @@ -0,0 +1,78 @@ +import sys + +import pyrootutils +import pytest + +from hydra import compose, initialize +from hydra.core.global_hydra import GlobalHydra +from hydra.core.hydra_config import HydraConfig +from omegaconf import DictConfig, open_dict + +from rl4co.envs import TSPEnv +from rl4co.models import AttentionModelPolicy +from rl4co.tasks.eval import evaluate_policy +from rl4co.tasks.train import run + + +@pytest.fixture(scope="package") +def cfg_train_global() -> DictConfig: + with initialize(config_path="../configs"): + cfg = compose(config_name="main.yaml", return_hydra_config=True, overrides=[]) + + # set defaults for all 
tests + with open_dict(cfg): + cfg.paths.root_dir = str(pyrootutils.find_root(indicator=".gitignore")) + cfg.trainer.max_epochs = 1 + cfg.model.train_data_size = 100 + cfg.model.val_data_size = 100 + cfg.model.test_data_size = 100 + cfg.model.batch_size = 2 # faster for CPU (not sure exactly why) + cfg.env.val_file = None # validate on self-generated data + cfg.env.test_file = None # validate on self-generated data + cfg.trainer.accelerator = "cpu" + cfg.trainer.devices = 1 + cfg.extras.print_config = False + cfg.extras.enforce_tags = False + cfg.logger = None + cfg.callbacks.learning_rate_monitor = None + + return cfg + + +@pytest.fixture(scope="function") +def cfg_train(cfg_train_global, tmp_path) -> DictConfig: + cfg = cfg_train_global.copy() + + with open_dict(cfg): + cfg.paths.output_dir = str(tmp_path) + cfg.paths.log_dir = str(tmp_path) + + yield cfg + + GlobalHydra.instance().clear() + + +# Skip if Python < 3.9 due to following error: +# AttributeError: 'OrphanPath' object has no attribute 'exists' +@pytest.mark.skipif( + sys.version_info[1] < 9, + reason="Python<3.9 raises error: 'OrphanPath' object has no attribute 'exists'", +) +def test_train_fast_dev_run(cfg_train): + """Run for 1 train, val and test step.""" + HydraConfig().set_config(cfg_train) + with open_dict(cfg_train): + cfg_train.trainer.fast_dev_run = True + cfg_train.trainer.accelerator = "cpu" + run(cfg_train) + + +@pytest.mark.parametrize( + "method", + ["greedy", "sampling", "multistart_greedy", "augment", "multistart_greedy_augment"], +) +def test_eval(method): + env = TSPEnv(generator_params=dict(num_loc=20)) + policy = AttentionModelPolicy(env_name=env.name) + out = evaluate_policy(env, policy, env.dataset(3), method=method) + assert out["rewards"].shape == (3,) diff --git a/tests/test_training.py b/tests/test_training.py new file mode 100644 index 00000000..07d23a25 --- /dev/null +++ b/tests/test_training.py @@ -0,0 +1,312 @@ +import os +import sys + +import pytest + +from rl4co.envs 
import ( + ATSPEnv, + FJSPEnv, + JSSPEnv, + PDPEnv, + PDPRuinRepairEnv, + TSPEnv, + TSPkoptEnv, +) +from rl4co.models.rl import A2C, PPO, REINFORCE +from rl4co.models.zoo import ( + DACT, + MDAM, + N2S, + POMO, + ActiveSearch, + AttentionModelPolicy, + DeepACO, + EASEmb, + EASLay, + HeterogeneousAttentionModel, + L2DPPOModel, + MatNet, + NARGNNPolicy, + NeuOpt, + PolyNet, + SymNCO, +) +from rl4co.utils import RL4COTrainer +from rl4co.utils.meta_trainer import ReptileCallback + +# Get env variable MAC_OS_GITHUB_RUNNER +if "MAC_OS_GITHUB_RUNNER" in os.environ: + accelerator = "cpu" +else: + accelerator = "auto" + + +# Test out simple training loop and test with multiple baselines +@pytest.mark.parametrize("baseline", ["rollout", "exponential", "mean", "no", "critic"]) +def test_reinforce(baseline): + env = TSPEnv(generator_params=dict(num_loc=20)) + policy = AttentionModelPolicy(env_name=env.name) + model = REINFORCE( + env, + policy, + baseline=baseline, + train_data_size=10, + val_data_size=10, + test_data_size=10, + ) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) + + +def test_a2c(): + env = TSPEnv(generator_params=dict(num_loc=20)) + policy = AttentionModelPolicy(env_name=env.name) + model = A2C(env, policy, train_data_size=10, val_data_size=10, test_data_size=10) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) + + +def test_ppo(): + env = TSPEnv(generator_params=dict(num_loc=20)) + policy = AttentionModelPolicy(env_name=env.name) + model = PPO(env, policy, train_data_size=10, val_data_size=10, test_data_size=10) + trainer = RL4COTrainer( + max_epochs=1, gradient_clip_val=None, devices=1, accelerator=accelerator + ) + trainer.fit(model) + trainer.test(model) + + +def test_symnco(): + env = TSPEnv(generator_params=dict(num_loc=20)) + model = SymNCO( + env, + train_data_size=10, + val_data_size=10, + test_data_size=10, + 
num_augment=2, + num_starts=20, + ) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) + + +def test_ham(): + env = PDPEnv(generator_params=dict(num_loc=20)) + model = HeterogeneousAttentionModel( + env, train_data_size=10, val_data_size=10, test_data_size=10 + ) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) + + +def test_matnet(): + env = ATSPEnv(generator_params=dict(num_loc=20)) + model = MatNet( + env, + baseline="shared", + train_data_size=10, + val_data_size=10, + test_data_size=10, + ) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) + + +def test_mdam(): + env = TSPEnv(generator_params=dict(num_loc=20)) + model = MDAM( + env, + train_data_size=10, + val_data_size=10, + test_data_size=10, + ) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) + + +def test_pomo_reptile(): + env = TSPEnv(generator_params=dict(num_loc=20)) + policy = AttentionModelPolicy( + env_name=env.name, + embed_dim=128, + num_encoder_layers=6, + num_heads=8, + normalization="instance", + use_graph_context=False, + ) + model = POMO( + env, + policy, + batch_size=5, + train_data_size=5 * 3, + val_data_size=10, + test_data_size=10, + ) + meta_callback = ReptileCallback( + data_type="size", + sch_bar=0.9, + num_tasks=2, + alpha=0.99, + alpha_decay=0.999, + min_size=20, + max_size=50, + ) + trainer = RL4COTrainer( + max_epochs=2, + callbacks=[meta_callback], + devices=1, + accelerator=accelerator, + limit_train_batches=3, + ) + trainer.fit(model) + trainer.test(model) + + +@pytest.mark.parametrize("SearchMethod", [ActiveSearch, EASEmb, EASLay]) +def test_search_methods(SearchMethod): + env = TSPEnv(generator_params=dict(num_loc=20)) + batch_size = 2 if SearchMethod not in [ActiveSearch] else 1 + dataset = env.dataset(2) + 
policy = AttentionModelPolicy(env_name=env.name) + model = SearchMethod(env, policy, dataset, max_iters=2, batch_size=batch_size) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) + + +@pytest.mark.skipif( + "torch_geometric" not in sys.modules, reason="PyTorch Geometric not installed" +) +def test_nargnn(): + env = TSPEnv(generator_params=dict(num_loc=20)) + policy = NARGNNPolicy(env_name=env.name) + model = REINFORCE( + env, policy=policy, train_data_size=10, val_data_size=10, test_data_size=10 + ) + trainer = RL4COTrainer( + max_epochs=1, gradient_clip_val=None, devices=1, accelerator=accelerator + ) + trainer.fit(model) + trainer.test(model) + + +@pytest.mark.skipif( + "torch_geometric" not in sys.modules, reason="PyTorch Geometric not installed" +) +@pytest.mark.skipfif("numba" not in sys.modules, reason="Numba not installed") +def test_deepaco(): + env = TSPEnv(generator_params=dict(num_loc=20)) + model = DeepACO( + env, + train_data_size=10, + val_data_size=10, + test_data_size=10, + policy_kwargs={"n_ants": 5}, + ) + trainer = RL4COTrainer( + max_epochs=1, gradient_clip_val=1, devices=1, accelerator=accelerator + ) + trainer.fit(model) + trainer.test(model) + + +def test_n2s(): + env = PDPRuinRepairEnv(generator_params=dict(num_loc=20)) + model = N2S( + env, + train_data_size=10, + val_data_size=10, + test_data_size=10, + n_step=2, + T_train=4, + T_test=4, + ) + trainer = RL4COTrainer( + max_epochs=1, + gradient_clip_val=0.05, + devices=1, + accelerator=accelerator, + ) + trainer.fit(model) + trainer.test(model) + + +def test_dact(): + env = TSPkoptEnv(generator_params=dict(num_loc=20), k_max=2) + model = DACT( + env, + train_data_size=10, + val_data_size=10, + test_data_size=10, + n_step=2, + T_train=4, + T_test=4, + CL_best=True, + ) + trainer = RL4COTrainer( + max_epochs=1, + gradient_clip_val=0.05, + devices=1, + accelerator=accelerator, + ) + trainer.fit(model) + trainer.test(model) + 
+ +def test_neuopt(): + env = TSPkoptEnv(generator_params=dict(num_loc=20), k_max=4) + model = NeuOpt( + env, + train_data_size=10, + val_data_size=10, + test_data_size=10, + n_step=2, + T_train=4, + T_test=4, + CL_best=True, + ) + trainer = RL4COTrainer( + max_epochs=1, + gradient_clip_val=0.05, + devices=1, + accelerator=accelerator, + ) + trainer.fit(model) + trainer.test(model) + + +@pytest.mark.parametrize("env_cls", [FJSPEnv, JSSPEnv]) +def test_l2d_ppo(env_cls): + env = env_cls(stepwise_reward=True, _torchrl_mode=True) + model = L2DPPOModel( + env, train_data_size=10, val_data_size=10, test_data_size=10, buffer_size=1000 + ) + trainer = RL4COTrainer( + max_epochs=1, + gradient_clip_val=0.05, + devices=1, + accelerator=accelerator, + ) + trainer.fit(model) + trainer.test(model) + + +def test_polynet(): + env = TSPEnv(generator_params=dict(num_loc=20)) + model = PolyNet( + env, + k=10, + train_data_size=10, + val_data_size=10, + test_data_size=10, + ) + trainer = RL4COTrainer(max_epochs=1, devices=1, accelerator=accelerator) + trainer.fit(model) + trainer.test(model) diff --git a/tests/test_utils.py b/tests/test_utils.py new file mode 100644 index 00000000..c0f6041a --- /dev/null +++ b/tests/test_utils.py @@ -0,0 +1,52 @@ +import pytest +import torch + +from tensordict import TensorDict +from torch.nn.functional import scaled_dot_product_attention + +from rl4co.models.nn.attention import scaled_dot_product_attention_simple +from rl4co.utils.decoding import process_logits +from rl4co.utils.ops import batchify, unbatchify + + +@pytest.mark.parametrize( + "a", + [ + torch.randn(10, 20, 2), + TensorDict( + {"a": torch.randn(10, 20, 2), "b": torch.randn(10, 20, 2)}, batch_size=10 + ), + ], +) +@pytest.mark.parametrize("shape", [(2,), (2, 2), (2, 2, 2)]) +def test_batchify(a, shape): + # batchify: [b, ...] -> [b * prod(shape), ...] + # unbatchify: [b * prod(shape), ...] -> [b, shape[0], shape[1], ...] 
+ a_batch = batchify(a, shape) + a_unbatch = unbatchify(a_batch, shape) + if isinstance(a, TensorDict): + a, a_unbatch = a["a"], a_unbatch["a"] + index = (slice(None),) + (0,) * len(shape) # (slice(None), 0, 0, ..., 0) + assert torch.allclose(a, a_unbatch[index]) + + +@pytest.mark.parametrize("top_p", [0.0, 0.5, 1.0]) +@pytest.mark.parametrize("top_k", [0, 5, 10]) +def test_top_k_top_p_sampling(top_p, top_k): + logits = torch.randn(8, 10) + mask = torch.ones(8, 10).bool() + logprobs = process_logits(logits, mask, top_p=top_p, top_k=top_k) + assert len(logprobs) == logits.size(0) + + +def test_scaled_dot_product_attention(): + bs, ns, ds = 2, 3, 4 + q = torch.rand(bs, ns, ds) + k = torch.rand(bs, ns, ds) + v = torch.rand(bs, ns, ds) + attn_mask = torch.rand(bs, ns, ns) > 0.5 + attn_mask[:, 0, :] = True # at least one row element is True + attn_mask[:, :, 0] = True # at least one column element is True + attn_torch = scaled_dot_product_attention(q, k, v, attn_mask) + attn_rl4co = scaled_dot_product_attention_simple(q, k, v, attn_mask) + assert torch.allclose(attn_torch, attn_rl4co)