From 9f7d81806dbbe8b959b593a8ad388113c706d45c Mon Sep 17 00:00:00 2001 From: Max Lucassen <74817215+maximilianluc@users.noreply.github.com> Date: Tue, 19 Jul 2022 13:31:41 +0200 Subject: [PATCH 01/10] Create README.md add readme --- samples/self-avoiding-path/README.md | 66 ++++++++++++++++++++++++++++ 1 file changed, 66 insertions(+) create mode 100644 samples/self-avoiding-path/README.md diff --git a/samples/self-avoiding-path/README.md b/samples/self-avoiding-path/README.md new file mode 100644 index 0000000..d8e3f34 --- /dev/null +++ b/samples/self-avoiding-path/README.md @@ -0,0 +1,66 @@ +--- +page_type: sample +languages: +- python +author: Maximilian Lucassen +ms.author: maxlucassen@microsoft.com +ms.date: 4/22/2022 +products: +- azure-quantum +- azure-qio +description: "Solve the self-avoiding path problem with Azure Quantum optimization service" +urlFragment: azure-quantum.self-avoiding-path +--- + +# Solving self-avoiding path problems with the Azure Quantum optimization service + +## Introduction + +This sample provides a walkthrough on how to solve the self-avoiding path problem with Azure QIO solvers, from problem definition to formulation of constraints to submitting the problem to the Azure QIO Service. + +By working through this sample, you will learn: + +- Model the problem mathematically to design objective and penalty functions +- Coding of the optimization problem using the Azure Quantum Optimization Python SDK +- Verifying results returned by the solver. + +## Prerequisites + +1. [Create an Azure Quantum Workspace](https://docs.microsoft.com/azure/quantum/how-to-create-quantum-workspaces-with-the-azure-portal) +2. [Install the `azure-quantum` Python module](https://docs.microsoft.com/azure/quantum/optimization-install-sdk) +3. (If you want to run the Jupyter notebook) [Install Jupyter Notebook](https://jupyter.org/install) +4. 
(Optional / Recommended learning) [Run and understand the basic ship loading sample](../ship-loading/) + +## Running the sample + +There are two ways to run the sample (.ipynb and .py): + +- [Jupyter Notebook (step-by-step walkthrough)](./self-avoiding-path.ipynb) +- [Python script (barebones annotations)](./self-avoiding-path.py) + +A html file of the Jupyter notebook is attached for improved readability: + +- [Html page (more readable format than Jupyter Notebook)](./self-avoiding-path.html) + +### Running the Jupyter Notebook + +To run this sample, use the commandline to navigate to the `self-avoiding-path` folder and run `jupyter notebook` + +Your web browser should automatically open a new window. + +If this doesn't happen, copy the localhost link shown in the terminal window and paste it into your browser's address bar. + +Once you see the page above, simply click on the `self-avoiding-path.ipynb` link to open the sample notebook. + +### Running the Python script + +- Open up the `self-avoiding-path.py` script using your favorite IDE or a text editor. +- Fill in your Azure Quantum workspace details at the beginning of the script. +- Run the script through your IDE or use the commandline to navigate to the `self-avoiding-path` folder and then run `python ./self-avoiding-path.py` or `python3 ./self-avoiding-path.py` (depending on how your environment is set up). + +### Manifest + +- **[self-avoiding-path.ipynb](https://github.com/microsoft/qio-samples/blob/main/samples/self-avoiding-path/self-avoiding-path.ipynb)**: Jupyter Notebook version of this sample. +- **[self-avoiding-path.py](https://github.com/microsoft/qio-samples/blob/main/samples/self-avoiding-path/self-avoiding-path.py)**: Standalone Python version of this sample. +- **[self-avoiding-path.html](https://github.com/microsoft/qio-samples/blob/main/samples/self-avoiding-path/self-avoiding-path.html)**: HTML version of this sample. 
+ From 099803f53c1c5b4464938119ef1aab60ecf0d1fc Mon Sep 17 00:00:00 2001 From: Max Lucassen <74817215+maximilianluc@users.noreply.github.com> Date: Tue, 19 Jul 2022 13:32:13 +0200 Subject: [PATCH 02/10] Update README.md adjust date --- samples/self-avoiding-path/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/samples/self-avoiding-path/README.md b/samples/self-avoiding-path/README.md index d8e3f34..d1c1db0 100644 --- a/samples/self-avoiding-path/README.md +++ b/samples/self-avoiding-path/README.md @@ -4,7 +4,7 @@ languages: - python author: Maximilian Lucassen ms.author: maxlucassen@microsoft.com -ms.date: 4/22/2022 +ms.date: 7/19/2022 products: - azure-quantum - azure-qio From 89c05a1baae26e02ba21a98840d663d426914ea7 Mon Sep 17 00:00:00 2001 From: Max Lucassen <74817215+maximilianluc@users.noreply.github.com> Date: Tue, 19 Jul 2022 13:38:12 +0200 Subject: [PATCH 03/10] Update README.md --- samples/self-avoiding-path/README.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/samples/self-avoiding-path/README.md b/samples/self-avoiding-path/README.md index d1c1db0..5eb99aa 100644 --- a/samples/self-avoiding-path/README.md +++ b/samples/self-avoiding-path/README.md @@ -24,6 +24,8 @@ By working through this sample, you will learn: - Coding of the optimization problem using the Azure Quantum Optimization Python SDK - Verifying results returned by the solver. +The work presented in this folder is based on the following [paper](https://arxiv.org/abs/1811.00713). + ## Prerequisites 1. 
[Create an Azure Quantum Workspace](https://docs.microsoft.com/azure/quantum/how-to-create-quantum-workspaces-with-the-azure-portal) From 20dfdd9720918932e6cd59af2d259b0584bfdeb1 Mon Sep 17 00:00:00 2001 From: Max Lucassen <74817215+maximilianluc@users.noreply.github.com> Date: Tue, 19 Jul 2022 13:38:39 +0200 Subject: [PATCH 04/10] Update README.md --- samples/self-avoiding-path/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/samples/self-avoiding-path/README.md b/samples/self-avoiding-path/README.md index 5eb99aa..5217135 100644 --- a/samples/self-avoiding-path/README.md +++ b/samples/self-avoiding-path/README.md @@ -24,7 +24,7 @@ By working through this sample, you will learn: - Coding of the optimization problem using the Azure Quantum Optimization Python SDK - Verifying results returned by the solver. -The work presented in this folder is based on the following [paper](https://arxiv.org/abs/1811.00713). +The work presented in this folder is based on the following [paper - https://arxiv.org/abs/1811.00713](https://arxiv.org/abs/1811.00713). 
## Prerequisites From 916e72c7a37b2099819fd92b25145bc039203ba2 Mon Sep 17 00:00:00 2001 From: Max Lucassen <74817215+maximilianluc@users.noreply.github.com> Date: Tue, 19 Jul 2022 13:39:20 +0200 Subject: [PATCH 05/10] Update README.md --- samples/self-avoiding-path/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/samples/self-avoiding-path/README.md b/samples/self-avoiding-path/README.md index 5217135..3c89df7 100644 --- a/samples/self-avoiding-path/README.md +++ b/samples/self-avoiding-path/README.md @@ -40,7 +40,7 @@ There are two ways to run the sample (.ipynb and .py): - [Jupyter Notebook (step-by-step walkthrough)](./self-avoiding-path.ipynb) - [Python script (barebones annotations)](./self-avoiding-path.py) -A html file of the Jupyter notebook is attached for improved readability: +A html file of the Jupyter notebook is attached for improved readability of the equations (tables aren't rendered correctly, however): - [Html page (more readable format than Jupyter Notebook)](./self-avoiding-path.html) From 22a75dc5d0e7a7c61c1a171781a501f43cd94d65 Mon Sep 17 00:00:00 2001 From: Max Lucassen <74817215+maximilianluc@users.noreply.github.com> Date: Tue, 19 Jul 2022 13:40:33 +0200 Subject: [PATCH 06/10] Add files via upload --- .../self-avoiding-walk.html | 15645 ++++++++++++++++ .../self-avoiding-walk.ipynb | 1086 ++ .../self-avoiding-path/self-avoiding-walk.py | 485 + 3 files changed, 17216 insertions(+) create mode 100644 samples/self-avoiding-path/self-avoiding-walk.html create mode 100644 samples/self-avoiding-path/self-avoiding-walk.ipynb create mode 100644 samples/self-avoiding-path/self-avoiding-walk.py diff --git a/samples/self-avoiding-path/self-avoiding-walk.html b/samples/self-avoiding-path/self-avoiding-walk.html new file mode 100644 index 0000000..5b3d7e4 --- /dev/null +++ b/samples/self-avoiding-path/self-avoiding-walk.html @@ -0,0 +1,15645 @@ + + + + + +self-avoiding-walk + + + + + + + + + + + + + + + + + + + + + +
+
+ + +
+
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+
+
+ + +
+
+
+ + +
+ +
+ + + + + + + + + diff --git a/samples/self-avoiding-path/self-avoiding-walk.ipynb b/samples/self-avoiding-path/self-avoiding-walk.ipynb new file mode 100644 index 0000000..be93700 --- /dev/null +++ b/samples/self-avoiding-path/self-avoiding-walk.ipynb @@ -0,0 +1,1086 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Self Avoiding Walk with Azure Quantum Inspired Optimization\n", + "\n", + "In this notebook we'll cover how to formulate an optimization problem to find a path through a 3D lattice that does not cross itself (self-avoiding). The optimization problem is solved with the Azure Quantum service which contains numerous heuristic (non-linear) optimization solvers. Finding a self-avoiding path in a 3D lattice can be considered a difficult problem, in the sense that it has suffers from exponential scaling conditioned on the number of turns and the number of dimensions (2D vs 3D, etc.). \n", + "\n", + "In this notebook, a step by step approach is taken to explain the function definitions to are necessary to create the optimization problem.\n", + "\n", + "Goal: To find a path in a 3D lattice that does not cross itself.\n", + "\n", + "To clarify some vocab and assumptions used in the notebook:\n", + "1. The number of dimensions is 3 (3D), meaning the path can be represented in a $x$-$y$-$z$ plane.\n", + "2. The position represents the location in the x-y-z plane, thus given by ($x$,$y$,$z$).\n", + "3. A direction describes the orientation of within in the x-y-z plane, thus in {$+x$,$-x$,$+y$,$-y$,$+z$,$-z$}.\n", + "4. \"Turns\" are equivalent to \"steps\". After each turn a new position is acquired that must be unique (not visited before). \n", + "5. The total number of turns is equivalent to the number of positions that needs to be visited minus one ($N-1$). \n", + "6. 
The decision variables for the optimization function are denoted by \"q\" because \"x\" is already associated with a direction, and are referred to as \"optimization variables\".\n", + "\n", + "Note: Because the number of terms for this optimization problem grows explosively with the number of turns, you might want to try running this in the Azure Quantum notebooks. The more technical reason for this is that expansions of nonlinear terms have to be computed locally, resulting in a massive number of terms needing to be uploaded. Unless you are very patient, a recommendation would be to either check out the online notebook experience or rewrite this notebook's problem class to its streaming counterpart (https://docs.microsoft.com/en-us/azure/quantum/optimization-streaming-problem). \n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Import the necessary dependencies for the notebook" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import time\n", + "from math import floor, log2\n", + "from azure.quantum import Workspace\n", + "from azure.quantum.optimization import Problem, ProblemType, Term, ParallelTempering, Tabu, SimulatedAnnealing\n", + "from azure.identity import ClientSecretCredential\n", + "from mpl_toolkits import mplot3d\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Connect to your Azure Quantum workspace\n", + "\n", + "To run the sample, you'll need to have a quantum workspace. Check out this module if you don't have one yet: https://docs.microsoft.com/en-us/learn/modules/get-started-azure-quantum/.\n", + "Fill in the variables below." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "workspace = Workspace(\n", + " subscription_id = \"\",\n", + " resource_group = \"\",\n", + " name = \"\",\n", + " location = \"\",\n", + " credential = ClientSecretCredential(tenant_id=\"\",\n", + " client_id=\"\",\n", + " client_secret=\"\")\n", + ")\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Print readable cost functions\n", + "\n", + "Throughout the notebook you'll probably realize that printing the \"terms\" isn't going to provide much help, mainly because there will be too many of them and their dictionary format. A term is the way a mathematical term is expressed in terms of a dictionary for the SDK (see examples). Below a function is defined that prints the term(s) dictionaries that describe the constraint/cost function in terms of \"q\" optimization variables. You can call the function to check if the working is correct, or if you're unsure of what a constraint looks like. Note that for a large problem it nevertheless becomes difficult to understand the entire function output because of the number of terms.\n", + "\n", + "An example:\n", + "{'c': 1, 'ids': [0, 10, 11, 12]} ---> $1q_0q_{10}q_{11}q_{12}$\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def print_function(terms: list):\n", + "\n", + " '''\n", + " Purpose:\n", + " Takes a list of terms and prints it out as a mathematical (cost/constraint) function.\n", + " Example:\n", + " {'c': 1, 'ids': [0, 10, 11, 12]} ---> 1q_0q_10q_11q_12\n", + " Inputs:\n", + " 1. 
terms: the list of terms.\n", + " '''\n", + " \n", + " k = 0\n", + " final_string = ''\n", + " final_string = ''\n", + " for term in terms:\n", + " term = term.to_dict()\n", + " weight = term['c']\n", + " ids = term['ids']\n", + " string = '('\n", + " if weight >= 0:\n", + " if k == 0: \n", + " string = '('+str(weight)\n", + " else:\n", + " string = '+' + '('+str(weight)\n", + " if weight < 0:\n", + " if k == 0:\n", + " string = '(' + str(abs(weight))\n", + " else: \n", + " string = '-' + '(' + str(abs(weight))\n", + " for id_ in ids:\n", + " string = string + f'q_{id_}'\n", + " string = string + ')'\n", + " final_string = final_string + string\n", + " k += 1\n", + "\n", + " print('[ ' + final_string + ' ]')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Expansion of two term lists\n", + "\n", + "Throughout the notebook we will need to cross-multiply nonlinear terms, for computing squares for example. The function below performs the expansion. An important note to keep in mind here, especially if you're looking to optimize the code, is that the function does not assemble identical terms. Since the cost functions dealt with in this notebook are still rather small, reducing the number of terms was left out of the scope. \n", + "\n", + "More clearly stated in terms of equations:\n", + "\n", + "$$ \\text{Current function (see below): } \\hspace{0.2cm} (a+b)^2 = a^2 + ab + ab + b^2 $$\n", + "$$ \\text{Optimal function: } \\hspace{0.2cm} (a+b)^2 = a^2 + 2ab + b^2 $$\n", + "\n", + "Should be a fun programming exercise to reduce the number of terms significantly!" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def cross_multiply(list_a: list, list_b: list) -> list:\n", + "\n", + " '''\n", + " Purpose: Cross multiplies two lists of terms (linear ex. [q_0 + q_1] or non-linear ex. 
[q_0q_1]) to return the expansion.\n", + " Can compute powers of groups this way (^2, ^3,...), like squaring a list of terms.\n", + " Calculates the expansion locally, unlike the SlcTerm class.\n", + " Example: (2q_0q_1+3q_2q_3)^2 => (2q_0q_1)^2 + 6q_0q_1q_2q_3 + 6q_0q_1q_2q_3 + (3q_2q_3)^2\n", + " Input:\n", + " 1. list_a: list which serves as the reference list (first 'for' loop).\n", + " 2. list_b: list which serves as the target list (second 'for' loop).\n", + " Output:\n", + " 1. list of term objects.\n", + " '''\n", + "\n", + " terms = []\n", + " for one in list_a:\n", + " for uno in list_b:\n", + " alpha = one.to_dict()\n", + " beta = uno.to_dict()\n", + " weight = int(alpha['c'])*int(beta['c'])\n", + " ids = list(alpha['ids'])+list(beta['ids'])\n", + " terms += [Term(c = weight, indices = ids)] \n", + " return terms\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Parameters for running through the notebook\n", + "\n", + "While running through the notebook you might want to execute and print some of the constraint functions. To do that, you'll need some variables to be defined. Only 3 turns are considered with the defined parameters below, as that will keep the function outputs small and understandable!" 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "nodes = \"ABCD\" # The four position/node names.\n", + "len_seq = len(nodes) # The length of the node \n", + "num_turns = len(nodes)-1 # The number of turns, which is one less than the number of therefore -1 turns.\n", + "num_dim = 3 # Number of optimization variables required to describe a turn\n", + "lambda_0 = 1 # Penalty weight for the 'distance constraint'\n", + "lambda_1 = 40 # Penalty weight for the 'no return constraint'\n", + "lambda_2 = 25 # Penalty weight for the invalid direction '000' constraint\n", + "lambda_3 = 25 # Penalty weight for the invalid direction '111' constraint" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 1. Encoding the directions \n", + "\n", + "Prior to starting to define our cost function, we have to construct some basic functions and agree on some definitions. In this part, we'll define the 6 directions of the x-y-z plane in terms of the optimization variables (\"q\"). \n", + "\n", + "A common way to encode a turn based optimization problem is through a direction-based string, in which each optimization variable substring (ex. $q_0q_1q_2$) denotes some kind of decision of which direction was taken. For example, take a car that can only move backward or forward. The decision of the driver at some time $t$ can be described as $q_t \\in \\{0, 1\\}$, where 0 represents going backward and 1 forward, respectively. Over multiple time steps, say 3, one can then describe the movement of the car by:\n", + "\n", + "$$ \\text{Movements:} \\hspace{0.25cm} q_0q_1q_2 $$\n", + "\n", + "The sequence of movements, \"forward, backward, backward\", can then be represented as:\n", + "\n", + "$$ \\text{Sequence of movements:} \\hspace{0.25cm} q_0q_1q_2 = 100$$\n", + "\n", + "Alright, if that is clear to you, then the next step is to represent the 6 directions of the x-y-z plane in such a fashion. 
Regrettably, a \"q\" can only be either 0 or 1, not 2, 3, 4, 5 to represent the six directions. But what can be done is to use multiple optimization variables to describe a direction! For example:\n", + "\n", + "$$ \\text{Sequence of movements:} \\hspace{0.25cm} q_0q_1q_2q_3q_4q_5q_6q_7q_8 $$\n", + "$$ \\text{First move:} \\hspace{0.25cm} q_0q_1q_2 $$\n", + "$$ \\text{Second move:} \\hspace{0.25cm} q_3q_4q_5 $$\n", + "$$ \\text{Third move:} \\hspace{0.25cm} q_6q_7q_8 $$\n", + "\n", + "Because we need to encode 6 directions, we need at least 3 optimization variables to form unique substrings. The table explains this: we need to have enough possible combinations to encode the 6 directions:\n", + "\n", + "
\n", + "\n", + "| Opt. var. substring | Combinations | \n", + "| ----------------------------- | -------------------------- |\n", + "| $q_0 \\cdot q_1$ | $2\\cdot 2 = 4 < 6$ |\n", + "| $q_0 \\cdot q_1 \\cdot q_2$ | $2\\cdot 2\\cdot 2 = 8 > 6$ |\n", + "\n", + "
\n", + "\n", + "Note, for later, you should keep in mind that 2 of the 8 combinations become irrelevant. It is important that the solver does not return those strings!\n", + "\n", + "Perfect! Now we just need to assign each direction a unique substring. Below you can find my choices, feel free to change these if you're starting from scratch.\n", + "\n", + "
\n", + "\n", + "| Direction | Opt. var. substring | \n", + "| --------- | ----------------- |\n", + "| +x | 100 |\n", + "| -x | 010 |\n", + "| +y | 001 |\n", + "| -y | 110 |\n", + "| +z | 101 |\n", + "| -z | 011 |\n", + "| N/A | 000 |\n", + "| N/A | 111 |\n", + "\n", + "
\n", + "\n", + "Now we just need to define direction variables. These are as defined in the above table. These variables should take a value 1 if a movement is made in that direction, while the other directions must all be zero. This can be achieved by the following scheme, where $k$ denotes the turn, and $\\gamma = 3(k-1)$ (3 because 3 dimensions):\n", + "\n", + "
\n", + "\n", + "| Direction | Opt. var. substring | Formula | \n", + "| ------------- | ---------------- | -------------------------------------------------- |\n", + "| $d_{+x}^{k}$ | 100 | $ q_{0+\\gamma} (1-q_{1+\\gamma}) (1-q_{2+\\gamma})$ |\n", + "| $d_{-x}^{k}$ | 010 | $ (1-q_{0+\\gamma}) q_{1+\\gamma} (1-q_{2+\\gamma})$ |\n", + "| $d_{+y}^{k}$ | 001 | $ (1-q_{0+\\gamma}) (1-q_{1+\\gamma}) q_{2+\\gamma}$ | \n", + "| $d_{-y}^{k}$ | 110 | $ q_{0+\\gamma} q_{1+\\gamma} (1-q_{2+\\gamma}) $ |\n", + "| $d_{+z}^{k}$ | 101 | $ q_{0+\\gamma} (1-q_{1+\\gamma}) q_{2+\\gamma} $ |\n", + "| $d_{-z}^{k}$ | 011 | $ (1-q_{0+\\gamma}) q_{1+\\gamma} q_{2+\\gamma} $ |\n", + "\n", + "
\n", + "\n", + "To clarify a bit further through an example:\n", + "If in the first turn (k=1) the solver returns $q_0=1$, $q_1=0$, $q_2=0$, and in the second turn (k=2) returns $q_3=0$, $q_4=0$, $q_5=1$, then a \"+x\" and a \"+y\" move were taken, respectively.\n", + "\n", + "These direction variables will help understand some difficult constraints later on. Defining these direction variables additionally makes the code much more readable, since we can define everything in terms of the direction variables instead of the individual optimization variables.\n", + "\n", + "Below you can find the function for the direction variables. The formulas have been expanded (mathematically) to easily declare them in a number of terms, however it is hard-coded this way. Some inputs to the function (\"sign_dir\", \"sign_pos\", \"lambda_\") are relevant for building constraints later in the notebook, but have to be defined in this function. Further information can be found in the function docstring. \n", + " " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def direction_variables(direction: str, offset: int, sign_dir: int, sign_pos: int, lambda_: int) -> list:\n", + "\n", + " '''\n", + " Purpose:\n", + " Translates the direction (+x,-x,+y,-y,+z,-z) of turn 'i' as a function of three optimization variables. (Three q's because of the defined coordinate system).\n", + " Example:\n", + " Direction \"+z\" in the first turn (turn = 1) is translated to: q_{0+offset}q_{2+offset}-q_{0+offset}q_{1+offset}q_{2+offset}.\n", + " Inputs:\n", + " 1. direction: A direction from an x-y-z coordinate system, one of the following: ('+x','-x','+y','-y','+z','-z').\n", + " 2. offset: Offset gives the turn number expressed in the first \"q\" of that turn. Equal to gamma in the explanation.\n", + " Example: Turn 1 starts with \"q\" q_0, offset=0. Turn 2 starts with q_3, offset = 3.\n", + " 3. 
sign_dir: Changes the sign of the weights corresponding to negative directions \"-x\", \"-y\", \"-z\" -> necessary for finding the positions, for exmaple (+x) \"-\" (-x).\n", + " 4. sign_pos: Changes the sign of the weights corresponding to negative positions \"-(x,y,z)\" -> necessary for finding the distances between node \"i\" and node \"j\".\n", + " 5. lambda_: The weight term associated with a constraint.\n", + " Output:\n", + " 1. A list of term objects.\n", + " '''\n", + "\n", + " terms = []\n", + " if direction == \"+x\":\n", + " term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset])\n", + " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", + " term_2 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", + " term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1, term_2, term_3]\n", + " elif direction == \"-x\":\n", + " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset])\n", + " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", + " term_2 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", + " term_3 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1, term_2, term_3]\n", + " elif direction == \"+y\":\n", + " term_0 = Term(c= 1*sign_pos*lambda_, indices=[2+offset])\n", + " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", + " term_2 = Term(c=-1*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", + " term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1, term_2, term_3]\n", + " elif direction == \"-y\":\n", + " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", + " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1]\n", + " elif direction == \"+z\":\n", + " term_0 = Term(c= 
1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", + " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1]\n", + " elif direction == \"-z\":\n", + " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", + " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1]\n", + " return terms\n", + "\n", + "\n", + "##### ----- Test the function and print output:\n", + "turn = 1 # play with this value! \n", + "dir_var = direction_variables(\"+x\",(turn-1)*num_dim,1,1,lambda_0) \n", + "print('dir_var term dictionary \"+x\": ', dir_var)\n", + "print_function(dir_var)\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 2. Finding the difference in positions\n", + "\n", + "Great that we have the directions defined! Now let's use them and define a function that calculates the difference in positions, which we will need later. After each turn, a direction that appends to the path. A valid path is defined as a one that does not cross itself, meaning that we need to compare the positions over the turns. In other words, every new position appended to the path needs to be checked with all previously held positions, to verify that a position hasn't been visited twice. \n", + "\n", + "So how do we go about this?\n", + "\n", + "First we need a way to know the positions after choosing to go in a certain direction, so let's tackle that first. Consider the fact that the directions are recorded for each turn, which already gives some sort of log of the positions in the path. By summing the direction variables respective to their dimension (x/y/z) acoomplishes this, but only if a negative move can compensate a positive one. 
For example, after two turns the $x$-location can be expressed as:\n", + "\n", + "$$ x_2 = ( d^{1}_{+x} - d^{1}_{-x} ) + ( d^{2}_{+x} - d^{2}_{-x} )$$\n", + "\n", + "**_NOTE:_** In the above function (\"direction_variables\"), the negative sign for the negative direction variables is controlled through \"sign_dir\". \"sign_dir\" must be set to -1 to assign a negative sign to it as required in these position formulas!\n", + "\n", + "\n", + "Remember that for a turn only one direction variable can be set to 1! Thus if two moves in the $-x$ direction are taken, then:\n", + "\n", + "$$ x_2 = ( d^{1}_{+x} - d^{1}_{-x} ) + ( d^{2}_{+x} - d^{2}_{-x} ) = ( 0 - 1 ) + ( 0 - 1 ) = -2 $$\n", + "\n", + "As with the simple example for the x-dimension, the same can be applied to the $y$ and $z$ directions. The formulas below describe the position after $n$ turns through a summation (for the maths/physics enthusiasts, these are integrals of the velocities to derive the positions :) ).\n", + "\n", + "$$ x_n = \\sum_{k=1}^{n} ( d^{k}_{+x} - d^{k}_{-x} ) $$\n", + "$$ y_n = \\sum_{k=1}^{n} ( d^{k}_{+y} - d^{k}_{-y} ) $$\n", + "$$ z_n = \\sum_{k=1}^{n} ( d^{k}_{+z} - d^{k}_{-z} ) $$\n", + "\n", + "Great stuff! Now we have a method to find the positions along the path. 
To find the differences in position, for example between turn 2 and turn 1, it is only necessary to apply a subtraction: \n", + "\n", + "$$ x_2 - x_1 = \\sum_{k=1}^{2} ( d^{k}_{+x} - d^{k}_{-x} ) - \\sum_{k=1}^{1} ( d^{k}_{+x} - d^{k}_{-x}) = ( d^{2}_{+x} - d^{2}_{-x} ) $$\n", + "$$ y_2 - y_1 = \\sum_{k=1}^{2} ( d^{k}_{+y} - d^{k}_{-y} ) - \\sum_{k=1}^{1} ( d^{k}_{+y} - d^{k}_{-y}) = ( d^{2}_{+y} - d^{2}_{-y} ) $$\n", + "$$ z_2 - z_1 = \\sum_{k=1}^{2} ( d^{k}_{+z} - d^{k}_{-z} ) - \\sum_{k=1}^{1} ( d^{k}_{+z} - d^{k}_{-z}) = ( d^{2}_{+z} - d^{2}_{-z} ) $$\n", + "\n", + "Generalizing this to any difference between two positions (with $i < j$; the sum starts at $i+1$ because the turns up to $i$ cancel out):\n", + "\n", + "$$ x_j - x_i = \\sum_{k=i+1}^{j} ( d^{k}_{+x} - d^{k}_{-x} ) $$\n", + "$$ y_j - y_i = \\sum_{k=i+1}^{j} ( d^{k}_{+y} - d^{k}_{-y} ) $$\n", + "$$ z_j - z_i = \\sum_{k=i+1}^{j} ( d^{k}_{+z} - d^{k}_{-z} ) $$\n", + "\n", + "Fantastic! Now on to the function code for the difference in positions. Do read the function and its docstring to understand the implementation, because it references the previously defined function to make use of direction variables. \n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def diff_in_pos(start_turn: int, end_turn: int, num_dim: int, lamda_: int):\n", + "\n", + " '''\n", + " Purpose:\n", + " Expresses the difference in position (x,y,z) between two turns as a function of the q's encoding of the directions.\n", + " In other words, expresses the difference in the position after the start_turn and position after the end_turn.\n", + " Example:\n", + " Difference between turn 0 (no turns yet, initial position = (0,0,0)) and turn 2:\n", + " x(2) = [ move(+x, turn 1) - move(-x, turn 1) ] + [ move(+x, turn 2) - move(-x, turn 2) ]\n", + " Note: only one 'move' per turn gets activated as they are represented by the same q's (ex. turn 1 is represented by q_0, q_1, and q_2).\n", + " Inputs:\n", + " 1. 
start_turn: the initial (reference) turn.\n", + " 2. end_turn: the final (target) turn.\n", + " 3. num_dim: the number of dimensions (3, x-y-z coordinate system).\n", + " Outputs:\n", + " 1. The difference in the x direction.\n", + " 2. The difference in the y direction.\n", + " 3. The difference in the z direction. \n", + " '''\n", + "\n", + " x_diff = y_diff = z_diff = []\n", + " if start_turn < end_turn and start_turn >= 0 and end_turn >= 1:\n", + " for turn in range(start_turn,end_turn+1):\n", + " x_diff += direction_variables(\"+x\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-x\",(turn-1)*num_dim,-1,1,lamda_)\n", + " y_diff += direction_variables(\"+y\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-y\",(turn-1)*num_dim,-1,1,lamda_)\n", + " z_diff += direction_variables(\"+z\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-z\",(turn-1)*num_dim,-1,1,lamda_)\n", + " return x_diff, y_diff, z_diff\n", + "\n", + "\n", + "##### ----- Test the function and print output: \n", + "start_turn = 1 # play with this value! \n", + "end_turn = 2 # play with this value! \n", + "x_diff, y_diff, z_diff = diff_in_pos(start_turn, end_turn, num_dim, lambda_0)\n", + "print('Difference in x described as term list: \\n', x_diff)\n", + "print('\\nDifference in x described as mathematical function:')\n", + "print_function(x_diff)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 3. The distance constraint\n", + "\n", + "Fantastic that you've made it this far! With all the above functions defined we can start solving the problem. \n", + "\n", + "The distance constraint enforces that after each turn, the difference in positions after turns $i$ and $j$ must be larger or equal to 1 (distance between lattice points in the same dimension). 
\n", + "To visualize the scenario this constraint tries to penalize, consider a 2D example with 4 turns, starting in $(0,0)$:\n", + "\n", + "$$ \\text{Turn 1, go right: } \\hspace{0.3cm} (0,0) => (0,1) $$ \n", + "$$ \\text{Turn 2, go up: } \\hspace{0.3cm} (0,1) => (1,1) $$ \n", + "$$ \\text{Turn 3, go left: } \\hspace{0.3cm} (1,1) => (1,0) $$ \n", + "$$ \\text{Turn 4, go down: } \\hspace{0.3cm} (1,0) => (0,0) $$ \n", + "\n", + "As you can see, the last step conflicts with our constraint. It is not permitted to return to a position where we've already been, namely $(0,0)$. Turns 1-3 are all valid, since they remain a distance of at least 1 away from all other previously held positions.\n", + "\n", + "Let's define what we want mathematically. The distance between the positions after turn $i$ and turn $j$ must be larger or equal to 1. For this we'll need some basic geometry, the 3D variant of the Pythagorean theorem. From the theorem, it can be understood that the hypotenuse ($C_{i,j}$) must always be larger or equal to one, since that is what defines the distance between two points. Mathematically speaking, working this out:\n", + "\n", + "$$ C_{i,j} \\geq 1 $$\n", + "$$ \\sqrt{(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} \\geq 1 $$\n", + "\n", + "The square-root is a bit of a headache when writing out a cost function, it would require an approximation or some sort of factorization, not fun if you're dealing with many terms. To avoid that, we're simply going to square both sides, which in our case is fine (for maths people), since we aren't dealing with negative numbers here:\n", + "\n", + "$$ C_{i,j}^2 \\geq 1 $$\n", + "$$ {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} \\geq 1 $$\n", + "\n", + "Nice! If you're sharp, you'll start seeing where the previous functions might come in handy now. 
The function that computes the difference between the respective positions (\"diff_in_pos\") in each dimension was defined above, and the function that computes an expansion (\"cross_multiply\") was defined at the beginning of the notebook. Writing those function calls out in order:\n", + "\n", + "1. We call \"diff_in_pos\" to calculate the difference in positions for each dimension (x,y,z).\n", + "2. For each dimension, the square is calculated by calling \"cross_multiply\". \n", + "\n", + "Alright, you might be wondering how to deal with the $\\geq$, since it is necessary to have an equation that equals zero in order to integrate it into the cost function. \n", + "This is where slack variables come in. The purpose of slack variables is to convert an inequality constraint into an equality constraint. Or in other words, for this equation, we need to compensate some values (explained further below) in order to convert the equation to an equality constraint. Consider the constraint in its simplest form:\n", + "\n", + "$$ C_{i,j}^2 \\geq 1 $$\n", + "\n", + "It is clear that we would need to add some number $V_{i,j}$ on the right hand side of the equation in order to make this an equality constraint. $V_{i,j}$ can be any non-negative value and is conditioned on $i$ and $j$: \n", + "\n", + "$$ C_{i,j}^2 = 1+V_{i,j}$$\n", + "\n", + "Let's say that instead of representing a single value we want $V_{i,j}$ to represent a range of values $[0-4]$. This is where slack variables can be introduced. By introducing additional optimization variables, which have nothing to do with the path encoding, the range can be described as follows:\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+q_{s3}+q_{s4} $$\n", + "\n", + "Or more compactly:\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+2q_{s3} $$\n", + "\n", + "So any value in the range $[0-4]$ is described through these q's. You can derive 1 by assigning a single \"q\", which has weight 1, the value 1. 
Likewise, you can get the value 4 by assigning all optimization variables the value 1. \n", + "\n", + "Alright, so how do we know which range of values we need to represent? That is revealed by the turn numbers, $i$ and $j$. Over these turns, the maximum squared distance that can be achieved is when moves are only made in a single direction, the \"+x\" direction for example. The maximum distance is then equal to the number of moves squared $(j-i)^2$.\n", + "\n", + "$$ C_{i,j}^2 = (j-i)^2 $$\n", + "\n", + "Then writing out the maths gives us the necessary upper bound for the range that the optimization variables need to represent, where $S$ stands for the number of slack variables necessary:\n", + "\n", + "$$ \\text{Upper bound: } \\hspace{0.5cm} C_{i,j}^2 = (j-i)^2 = 1 + \\sum_{s=0}^{S}q_s$$\n", + "$$ \\text{Upper bound: } \\hspace{0.5cm} \\sum_{s=0}^{S}q_s = (j-i)^2 - 1 $$\n", + "\n", + "For the lower bound of the range, the value is 0. The reason for that is we want to be able to represent any number equal to or larger than 1 for the inequality constraint through the addition of the slack variables. Concluding, the range the q's must represent is $[0,((j-i)^2-1)]$. More on how to calculate the number of slack variables necessary to define this range later, as you don't need ((j-i)^2-1) optimization variables!\n", + "\n", + "\n", + "Piecing all the parts together we find the following equation for a $i$-$j$ combination:\n", + "\n", + "$$ {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} = 1 + \\sum_{s=0}^{S}q_s $$ \n", + "\n", + "Because constants are irrelevant for the optimization landscape the value 1 can be neglected. The reason being that constants only introduce linear offsets, thus impacting the entire optimization equally. 
def distance_constraint(num_turns: int, num_dim: int, lambda_0: int) -> list:

    '''
    Purpose:
        Build the distance constraint from the helper functions 'diff_in_pos', 'cross_multiply'
        and 'generate_slack_coefficients'.
        Constraint: Distance squared between i and j must be larger or equal to 1.
        Constraint: L_{i,j}^2 >= 1  =>  L_{i,j}^2 = 1+q_{slacker} (converting the inequality constraint to an equality constraint.)
    How it is assembled (per pair start_turn < end_turn):
        1. 'diff_in_pos' gives the positional difference per dimension as a term list.
        2. Each difference is squared by cross-multiplying the list with itself.
        3. One slack term per weight from 'generate_slack_coefficients(end_turn - start_turn)' is
           appended with the negated weight as coefficient. Slack variables are indexed
           consecutively, starting at num_turns*num_dim.
    Inputs:
        1. num_turns: the number of turns.
        2. num_dim: the number of dimensions.
        3. lambda_0: the constraint weight for the distance constraint (forwarded to 'diff_in_pos').
    Output:
        1. List of term objects describing the distance constraint.
    '''

    constraint_terms = []
    # Index of the next unused slack variable.
    next_slack_index = num_turns*num_dim
    for turn_i in range(1, num_turns+1):
        for turn_j in range(turn_i+1, num_turns+2):
            # Positional differences, in the order x, y, z.
            differences = diff_in_pos(turn_i, turn_j, num_dim, lambda_0)
            # Squared expansion of every difference (Pythagorean theorem without the root).
            squares = [cross_multiply(difference, difference) for difference in differences]
            # Slack variables turn the inequality into an equality.
            weights = generate_slack_coefficients(turn_j-turn_i)
            slack_terms = [
                Term(c=-weight, indices=[next_slack_index+position])
                for position, weight in enumerate(weights)
            ]
            constraint_terms += squares[0] + squares[1] + squares[2] + slack_terms
            next_slack_index += len(weights)
    return constraint_terms
Recall that the range $[0,4]$ can be defined by the following two equations with slack variables (s):\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+q_{s3}+q_{s4} $$\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+2q_{s3} $$\n", + "\n", + "The bottom equation is more compact because the last variables carries a weight-2. In Lucas' paper (see 2.4 of arxiv:1302.5843) the algorithm to find such weights is presented, which is based on calculating all $2^{x}$, where $x$ iterates from zero to the log_2 of maximum value in the range (4 in this example). \n", + "\n", + "Below are two examples that may help visualize why and how the slack variables represent the ranges of values. \n", + "\\\n", + " \n", + "\n", + "\n", + "
\n", + "\n", + "Example for range $[0,4]$:\n", + "| $q_{s1}$ | $2q_{s2}$ | $q_{s3}$ | Value |\n", + "| ------ | -------- | -------- | ---------------- |\n", + "| 0 | 0 | 0 | 0 + 2(0) + 0 = 0 |\n", + "| 1 | 0 | 0 | 1 + 2(0) + 0 = 1 |\n", + "| 0 | 1 | 0 | 0 + 2(1) + 0 = 2 |\n", + "| 1 | 1 | 0 | 1 + 2(1) + 0 = 3 |\n", + "| 1 | 1 | 1 | 1 + 2(1) + 1 = 4 | \n", + "\n", + "
\n", + "\n", + "\\\n", + " \n", + "\n", + "
\n", + "\n", + "Example for range $[0,20]$:\n", + "Rather than using twenty optimization variables, five with weights can achieve the same!\n", + "| $q_{s1}$ | $2q_{s2}$ | $4q_{s3}$ | $8q_{s4}$ | $5q_{s5}$ | Value |\n", + "| ------ | ------- | --------- | ----------- | --------- | ------------------- |\n", + "| 0 | 0 | 0 | 0 | 0 | 0 + 2(0) + 4(0) + 8(0) + 5(0) = 0 |\n", + "| 1 | 0 | 0 | 0 | 0 | 1 + 2(0) + 4(0) + 8(0) + 5(0) = 1 |\n", + "| 0 | 1 | 0 | 0 | 0 | 0 + 2(1) + 4(0) + 8(0) + 5(0) = 2 |\n", + "| 1 | 1 | 0 | 0 | 0 | 1 + 2(1) + 4(0) + 8(0) + 5(0) = 3 |\n", + "| 0 | 0 | 1 | 0 | 0 | 0 + 2(0) + 4(1) + 8(0) + 5(0) = 4 |\n", + "| ... | ... | ... | ... | ... | ... |\n", + "| 0 | 1 | 0 | 1 | 1 |0 + 2(1) + 4(0) + 8(1) + 5(1)= 15 |\n", + "| 1 | 1 | 0 | 1 | 1 |1 + 2(1) + 4(0) + 8(1) + 5(1)= 16 |\n", + "| 0 | 0 | 1 | 1 | 1 |0 + 2(0) + 4(1) + 8(1) + 5(1)= 17 |\n", + "| 1 | 0 | 1 | 1 | 1 |1 + 2(0) + 4(1) + 8(1) + 5(1)= 18 |\n", + "| 0 | 1 | 1 | 1 | 1 |0 + 2(1) + 4(1) + 8(1) + 5(1)= 19 |\n", + "| 1 | 1 | 1 | 1 | 1 |1 + 2(1) + 4(1) + 8(1) + 5(1)= 20 |\n", + "\n", + "
def generate_slack_coefficients(turn_diff: int):

    '''
    Purpose:
        Calculates the number of slack variables and their (positive) weights, such that the weighted
        sum of the binary slack variables can take every integer value in [0, turn_diff**2 - 1].
    Method:
        With D = turn_diff**2 - 1 and M = floor(log2(D)), the weights are 2**0, ..., 2**(M-1)
        followed by the remainder D + 1 - 2**M. All weights together sum to D.
    Example:
        turn_diff = 3  ->  D = 8  ->  weights [1, 2, 4, 1].
        turn_diff = 1  ->  D = 0  ->  no slack variables, [].
    Reference:
        Lucas' paper (see 2.4 of arxiv:1302.5843)
    Input:
        1. turn_diff: the differences in turns (end_turn - start_turn).
    Output:
        1. y: the weights of the slack variables. The weights are returned positive; the caller
              decides with which sign they enter the cost function.
    Raises:
        ValueError if turn_diff**2 - 1 is negative (turn_diff == 0), because no range exists then.
    '''

    dist_diff = (turn_diff**2)-1
    if dist_diff < 0:
        # Without this guard 'y' would never be assigned and the return would fail obscurely.
        raise ValueError('turn_diff must be non-zero, got ' + str(turn_diff))
    if dist_diff == 0:
        return []  # no slack variables needed
    M = floor(log2(dist_diff))
    y = [2**n for n in range(M)]
    y.append(dist_diff + 1 - 2**M)
    return y
A simplified explanation for this is that the distance constraint is described through the positional differences in $x$, $y$, and $z$. Additionally, for consecutive turns, the number of slack variables is zero ($(j-i)^2-1 = 0$ for consecutive turns) - thus there is no auxiliary benefit introduced by slack variables to compensate for being in a different position after the turn. Therefore, the solver will try to keep the positions as close to each other as possible, which leads to overlapping positions, especially in consecutive turns. To overcome this, a penalization needs to be introduced that stops returning to the previous position held in the turn before. For example, what we want to stop is the following:\n", + "\n", + "$$ \\text{Turn 1: A to B.} $$\n", + "$$ \\text{Turn 2: B to A.} $$\n", + "\n", + "This can be equivalently described as moving in opposite directions over the consecutive turns. For example, first going in the \"+y\" direction, and following that moving in the \"-y\" direction. \n", + "\n", + "Designing such a constraint is straightforward: the opposite direction variables need to be multiplied. \n", + "Preventing a revisit of a position for the \"x\" direction over the first and second turn can be described by the following constraint:\n", + "\n", + "$$ {\\lambda}_1(d^{1}_{+x} d^{2}_{-x} + d^{1}_{-x}d^{2}_{+x}) $$ \n", + "\n", + "If a move is made in the \"+x\" direction first, $d^{1}_{+x}$ takes value 1. If afterwards a move is made in the \"-x\" direction, $d^{2}_{-x}$ also takes value 1, meaning that the combined term\n", + "$d^{1}_{+x} d^{2}_{-x}$ also becomes 1, enforcing the constraint with penalty value ${\\lambda}_1$. 
def no_return_constraint(num_turns: int, num_dim: int, lamda_4: int)-> list:

    '''
    Purpose:
        Build the constraint that penalizes stepping straight back: a move in one direction that is
        followed, in the next turn, by the move in the opposite direction of the same dimension.
    Example:
        Node A ---> Node B ---> Node A  => erroneous as we've been there already.
        Penalized pairs: (+x then -x), (-x then +x), (+y then -y), (-y then +y), (+z then -z), (-z then +z).
    Inputs:
        1. num_turns: the number of turns.
        2. num_dim : the number of dimensions, which is 3 for this sample.
        3. lamda_4 : the penalty weight for this constraint (forwarded to 'direction_variables').
    Outputs:
        1. List of term objects.
    '''

    # (direction in the current turn, direction in the following turn)
    opposite_moves = (
        ("+x", "-x"), ("-x", "+x"),
        ("+y", "-y"), ("-y", "+y"),
        ("+z", "-z"), ("-z", "+z"),
    )
    penalty_terms = []
    for turn in range(num_turns):
        current_offset = turn*num_dim
        # NOTE(review): for the last iteration this offset equals num_turns*num_dim - confirm that
        # these indices belong to a turn and are not shared with other variables.
        following_offset = (turn+1)*num_dim
        for first_move, second_move in opposite_moves:
            penalty_terms += cross_multiply(
                direction_variables(first_move, current_offset, 1, 1, lamda_4),
                direction_variables(second_move, following_offset, 1, 1, lamda_4),
            )
    return penalty_terms
Each constraint is specific to an invalid direction, and because we're working directly with the substring we don't need the abstraction layers used in previous constraints, like directional and positional variables. \n", + "\n", + "Let's first work out the constraint for preventing substring $000$. $ q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma} $ may not equal $000$, where $\\gamma = 3(k-1)$ and $k$ is the turn number. If we were to design the constraint as $ q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma} $ there won't be any penalty, because all $q$'s will equal and multiply to zero. Therefore, if all these $q$'s equal zero, we need the expression to multiply to 1. This is achieved by the following, which multiplies to one if all optimization variables take the value zero (and to zero otherwise):\n", + "\n", + "$$ {\\lambda}_2(1-q_{0+\\gamma}) (1-q_{1+\\gamma}) (1-q_{2+\\gamma}) $$\n", + "$$ \\text{If } \\hspace{0.1cm} q_{0+\\gamma} = q_{1+\\gamma} = q_{2+\\gamma} = 0, \\hspace{0.1cm} \\text{then: } $$ \n", + "$$ {\\lambda}_2(1-q_{0+\\gamma}) (1-q_{1+\\gamma}) (1-q_{2+\\gamma}) = {\\lambda}_2 \\cdot 1 $$\n", + "\n", + "\n", + "Nice! By expanding the equation and neglecting constant terms a constraint is found that can be implemented:\n", + "\n", + "$$\\text{Constraint for 000: }{\\lambda}_2(-q_{0+\\gamma}-q_{1+\\gamma}-q_{2+\\gamma}+q_{0+\\gamma}q_{1+\\gamma}+q_{0+\\gamma}q_{2+\\gamma}+q_{1+\\gamma}q_{2+\\gamma}-q_{0+\\gamma}q_{1+\\gamma}q_{2+\\gamma})$$\n", + "\n", + "Before going to the function definition, let's first look at penalizing the substring $111$. Luckily this is much easier as the substring multiplies to 1 if all the $q$'s have the value one. 
def penalize_000(len_seq: int, num_dim: int, lambda_2: int) -> list:

    '''
    Purpose:
        Build the constraint that penalizes the invalid moves associated with the 3 q's string: '000'.
        For every k in 0..len_seq-1 the seven non-constant terms of the expansion of
        (1-q_0)(1-q_1)(1-q_2) are generated on the three q's starting at index k*num_dim,
        each multiplied by lambda_2.
    Example:
        If turn 2 (q_3q_4q_5) equals '000', assign a large penalty.
    Inputs:
        1. len_seq: the number nodes to consider.
        2. num_dim: the number of dimensions (which is 3).
        3. lambda_2: the penalty weight for this constraint.
    Outputs:
        1. List of term objects.
    '''

    # (sign, positions of the q's relative to the first q of the turn)
    expansion = (
        (-1, (0,)),
        (-1, (1,)),
        (-1, (2,)),
        ( 1, (0, 1)),
        ( 1, (0, 2)),
        ( 1, (1, 2)),
        (-1, (0, 1, 2)),
    )
    penalty_terms = []
    for k in range(len_seq):
        first_q = k*num_dim
        penalty_terms.extend(
            Term(c=sign*lambda_2, indices=[position+first_q for position in positions])
            for sign, positions in expansion
        )
    return penalty_terms
List of term objects.\n", + " '''\n", + "\n", + " terms = []\n", + " for k in range(0,len_seq):\n", + " offset = k*num_dim \n", + " terms += [Term(c=1*lambda_3,indices=[0+offset,1+offset,2+offset])]\n", + " return terms\n", + "\n", + "\n", + "##### ----- Test the function and print output: \n", + "term_000 = penalize_000(len_seq, num_dim, lambda_2) \n", + "term_111 = penalize_111(len_seq, num_dim, lambda_3) \n", + "print('Term dictionary penalty constraint for 000:', term_000, '\\n')\n", + "print('Term dictionary penalty constraint for 111:', term_111, '\\n')\n", + "print('Function for penality 000: ')\n", + "print_function(term_000)\n", + "print('Function for penality 111: ')\n", + "print_function(term_111)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 7. Parsing and validating the solution\n", + "\n", + "We've finished defining the optimization function. The next step is to start looking at how we're going to submit it to the solvers and analyze the returned results. \n", + "First let's look at how to parse, validate, and visualize the results, since that will make tuning the solvers easier!\n", + "\n", + "Below you can find the function definition that reads the solution and validates it. The solution dictionary is first read out to the optimiation variable string that describes the path. Afterward, the substrings that represent the directions are translated to linguistic terms, such that the solution can be printed in a human-readable format. Based on these two steps, the validation process checks if any constraints are violated. If constraints are violated warnings will be shown in the output with some tuning suggestions.\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def read_validate_solution(solution: dict, num_turns: int, num_dim: int):\n", + " \n", + " '''\n", + " Purpose:\n", + " To validate the solution returned by the solver. 
Make it readable, and analyze if it makes sense.\n", + " Inputs:\n", + " 1. solution: The solution results dictionary which is returned by the solver (results[\"configuration\"]).\n", + " 2. num_turns: The number of turns for the simulation.\n", + " 3. num_dim: The number of dimensions, which is 3 for this sample (3D).\n", + " Outputs:\n", + " 1. valid: A boolean variable that specifies the validity of the solution.\n", + " 2. pos_dit: Layered position dictionary that contains all of the nodes' locations per turn {turn: {x: x_pos, y:y_pos, z:z_pos}}.\n", + " 3. dir_dict: Dictionary containing the linguistic interpretation of the 6 directions.\n", + " 4. var_dict: Dictionary containing the spin per optimization variable.\n", + " 5. x_arr: Array of x positions.\n", + " 6. y_arr: Array of y positions.\n", + " 7. z_arr: Array of z positions. \n", + " '''\n", + "\n", + " print('\\n')\n", + " valid = True\n", + " move = ''\n", + " sol_str = ''\n", + " x_arr = [0]\n", + " y_arr = [0]\n", + " z_arr = [0]\n", + " dir_dict = {'100':'out','010':'in','001':'right','110':'left','101':'up','011':'down'}\n", + " pos_dict = {0:{\"x\":0, \"y\":0, \"z\":0}}\n", + " var_dict = {}\n", + " for key,val in solution:\n", + " if key<(num_turns*num_dim):\n", + " turn = floor(key/num_dim)+1\n", + " print(\"Turn: \"+str(turn),\"var: \"+str(key),\"spin: \"+str(val))\n", + " var_dict |= {str(key): val}\n", + " if key%3 list: + + ''' + Purpose: + Translates the direction (+x,-x,+y,-y,+z,-z) of turn 'i' as a function of three q's. (Three optimization variables because of the defined coordinate system). + Example: + Direction "+z" in the first turn (turn = 1) is translated to: q_{0+offset}q_{2+offset}-q_{0+offset}q_{1+offset}q_{2+offset}. + Inputs: + 1. direction: A direction from an x-y-z coordinate system, one of the following: ('+x','-x','+y','-y','+z','-z'). + 2. offset: Offset gives the turn number expressed in the first q of that turn. + Example: Turn 1 starts with q_0, offset=0. 
Turn 2 starts with q_3, offset = 3. + 3. sign_dir: Changes the sign of the weights corresponding to negative directions "-x", "-y", "-z" -> necessary for finding the positions, for exmaple (+x) "-" (-x). + 4. sign_pos: Changes the sign of the weights corresponding to negative positions "-(x,y,z)" -> necessary for finding the distances between node "i" and node "j". + 5. lambda_: The weight term associated with a constraint. + Output: + 1. A list of term objects. + ''' + + terms = [] + if direction == "+x": + term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset]) + term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset]) + term_2 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset]) + term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1, term_2, term_3] + elif direction == "-x": + term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset]) + term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset]) + term_2 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset]) + term_3 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1, term_2, term_3] + elif direction == "+y": + term_0 = Term(c= 1*sign_pos*lambda_, indices=[2+offset]) + term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset]) + term_2 = Term(c=-1*sign_pos*lambda_, indices=[1+offset, 2+offset]) + term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1, term_2, term_3] + elif direction == "-y": + term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset]) + term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1] + elif direction == "+z": + term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 2+offset]) + term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1] + elif direction == 
def print_cost_function(terms: list):

    '''
    Purpose:
        Prints a list of terms as one (mathematical) cost function string, wrapped in square brackets.
        Every term becomes a sign, an opening bracket, the absolute weight, one 'q_<id>' per index
        and a closing bracket.
    Example:
        {'c': 1, 'ids': [0, 10, 11, 12]}  --->  +(1q_0q_10q_11q_12)
        {'c': -2, 'ids': [3]}             --->  -(2q_3)
    Inputs:
        1. terms: the list of terms; every element must offer 'to_dict()' with the keys 'c' and 'ids'.
    '''

    rendered = []
    for term in terms:
        as_dict = term.to_dict()
        coefficient = as_dict['c']
        indices = as_dict['ids']
        if coefficient >= 0:
            prefix = '+' + '(' + str(coefficient)
        elif coefficient < 0:
            prefix = '-' + '(' + str(abs(coefficient))
        else:
            # Neither comparison holds (e.g. NaN): only the opening bracket is emitted.
            prefix = '('
        variables = ''.join(f'q_{index}' for index in indices)
        rendered.append(prefix + variables + ')')
    print('[' + ''.join(rendered) + ']')
+ ''' + + dist_diff = (turn_diff**2)-1 + if dist_diff == 0: + y = [] + elif dist_diff > 0: + M = floor(log2(dist_diff)) + y = [2**n for n in range(M)] + y.append(dist_diff + 1 - 2**M) + return y + + +def simplify_every_iter_function(term_list: list[Term], ref_term:Term) -> list[Term]: + terms = [] + same_ids_list = [] + diff_ids_list = [] + if term_list: + for term_in_list in term_list: + if sorted(ref_term.ids) == sorted(term_in_list.ids): + same_ids_list += [term_in_list] + else: + diff_ids_list += [term_in_list] + if same_ids_list: + new_weight = ref_term.c + ids = sorted(ref_term.ids) + for same_ids_term in same_ids_list: + new_weight += same_ids_term.c + terms += [Term(c=new_weight, indices=ids)] + else: + terms += [ref_term] + if diff_ids_list: + terms += diff_ids_list + return terms + + +def diff_in_pos(start_turn: int, end_turn: int, num_dim: int, lamda_: int): + + ''' + Purpose: + Expresses the difference in position (x,y,z) between two turns as a function of the encoding of the directions. + In other words, expresses the difference in the position after the start_turn and position after the end_turn. + Example: + Difference between turn 0 (no turns yet, initial position = (0,0,0)) and turn 2: + x(2) = [ move(+x, turn 1) - move(-x, turn 1) ] + [ move(+x, turn 2) - move(-x, turn 2) ] + Note: only one 'move' per turn gets activated as they are represented by the same q's (ex. turn 1 is represented by q_0, q_1, and q_2). + Inputs: + 1. start_turn: the initial (reference) turn. + 2. end_turn: the final (target) turn. + 3. num_dim: the number of dimensions (3, x-y-z coordinate system). + Outputs: + 1. The difference in the x direction. + 2. The difference in the y direction. + 3. The difference in the z direction. 
def cross_multiply(list_a: list[Term], list_b: list[Term]) -> list:

    '''
    Purpose:
        Multiplies every term of list_a with every term of list_b and returns all products, i.e. the
        expansion of (sum of list_a) * (sum of list_b). Passing the same list twice squares it.
        A product term carries the product of both weights and the concatenation of both index lists;
        products with equal indices are not merged.
    Example:
        (2q_0q_1+3q_2q_3)^2  =>  4q_0q_1q_0q_1 + 6q_0q_1q_2q_3 + 6q_2q_3q_0q_1 + 9q_2q_3q_2q_3
    Input:
        1. list_a: list which serves as the reference list (outer iteration).
        2. list_b: list which serves as the target list (inner iteration).
    Output:
        1. list of term objects, ordered by list_a first and list_b second.
    '''

    return [
        Term(c=left.c * right.c, indices=left.ids + right.ids)
        for left in list_a
        for right in list_b
    ]
+ Example/Explanation: + L{1,2}^2 = (x1-x2)^2 + (y1-y2)^2 + (z1-z2)^2 + x1 = [move(+x1)-move(-x1)] + x2 = [move(+x1)-move(-x1)] + [move(+x2)-move(-x2)] + < same for other dimensions > + < fill into first line > + L{1,2}^2 = [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2 + [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2 - q_{slacker} = 0 ---> expressed in q's == cost function + Inputs: + 1. num_turns: the number of turns. + 2. num_dum: the number of dimensions. + 3. lambda_0: the constraint weight for the distance constraint. + Output: + 1. List of term objects describing the distance constraint. + ''' + + terms = [] + slack_indexer = 0 + for start_turn in range(1,num_turns+1): + for end_turn in range(start_turn+1,num_turns+2): + # Calculate the differences in positions for each dimension. + x_diff_i_j, y_diff_i_j, z_diff_i_j = diff_in_pos(start_turn, end_turn, num_dim, lambda_0) + # Compute the squared distance (Pythagorean theorem) by calculating the squared expansion. + x_diff_i_j_2, y_diff_i_j_2, z_diff_i_j_2 = cross_multiply(x_diff_i_j,x_diff_i_j), cross_multiply(y_diff_i_j,y_diff_i_j), cross_multiply(z_diff_i_j,z_diff_i_j) + # Add slack variables due to inequality constraint. + slack_var_terms = [] + slack_coefficients = generate_slack_coefficients(end_turn-start_turn) + for s in range(0,len(slack_coefficients)): + slack_var_terms += [Term(c=-slack_coefficients[s], indices=[num_turns*num_dim+slack_indexer+s])] + + terms += x_diff_i_j_2 + y_diff_i_j_2 + z_diff_i_j_2 + slack_var_terms + slack_indexer+=len(slack_coefficients) + return terms + +def penalize_000(len_seq: int, num_dim: int, lambda_2: int) -> list: + + ''' + Purpose: + Build the constraint that penalizes the invalid moves associated with the substring: '000'. + The constraint needs to be defined over the set of all turns, as defined by the 'for' loop. + Example: + If turn 2 (q_3q_4q_5) equals '000', assign a large penalty. + Inputs: + 1. 
len_seq: the number nodes to consider. + 2. num_dim: the number of dimensions (which is 3). + 3. lambda_2: the penalty weight for this constraint. + Outputs: + 1. List of term objects. + ''' + + terms = [] + for k in range(0,len_seq): + offset = k*num_dim + term_0 = Term(c=-1*lambda_2,indices=[0+offset]) + term_1 = Term(c=-1*lambda_2,indices=[1+offset]) + term_2 = Term(c=-1*lambda_2,indices=[2+offset]) + term_3 = Term(c= 1*lambda_2,indices=[0+offset,1+offset]) + term_4 = Term(c= 1*lambda_2,indices=[0+offset,2+offset]) + term_5 = Term(c= 1*lambda_2,indices=[1+offset,2+offset]) + term_6 = Term(c=-1*lambda_2,indices=[0+offset,1+offset,2+offset]) + terms += [term_0, term_1, term_2, term_3, term_4, term_5, term_6] + return terms + +def penalize_111(len_seq: int, num_dim: int, lambda_3: int) -> list: + + ''' + Purpose: + Build the constraint that penalizes the invalid moves associated with the substring: '111'. + The constraint needs to be defined over the set of all turns, as defined by the 'for' loop. + Example: + If turn 2 (q_3q_4q_5) equals '111', assign a large penalty. + Inputs: + 1. len_seq: the number nodes to consider. + 2. num_dim: the number of dimensions (which is 3 in this sample). + 3. lambda_3: the penalty weight for this constraint. + Outputs: + 1. List of term objects. + ''' + + terms = [] + for k in range(0,len_seq): + offset = k*num_dim + terms += [Term(c=1*lambda_3,indices=[0+offset,1+offset,2+offset])] + return terms + +def no_return_constraint(num_turns: int, num_dim: int, lamda_4: int)-> list: + + ''' + Purpose: + Build the constraint that penalizes going back to the same position/node two turns later. + Example: + Node A ---> ---> Node B ---> ---> Node A => erroneous as we've been there already. + Two sequential moves may not be in the same dimension and in opposite directions: (+x then -x), (-x then +x), (+y then -y) etc. + Inputs: + 1. num_turns: the number of turns. + 2. num_dim : the number of dimensions, which is 3 for this sample. + 3. 
lambda_4 : the penalty weight for this constraint. + Outputs: + 1. List of term objects. + ''' + + terms = [] + for i in range(0,num_turns): + x_out_in = cross_multiply(direction_variables("+x",i*num_dim,1,1,lamda_4), direction_variables("-x",(i+1)*num_dim,1,1,lamda_4)) + x_in_out = cross_multiply(direction_variables("-x",i*num_dim,1,1,lamda_4), direction_variables("+x",(i+1)*num_dim,1,1,lamda_4)) + y_right_left = cross_multiply(direction_variables("+y",i*num_dim,1,1,lamda_4), direction_variables("-y",(i+1)*num_dim,1,1,lamda_4)) + y_left_right = cross_multiply(direction_variables("-y",i*num_dim,1,1,lamda_4), direction_variables("+y",(i+1)*num_dim,1,1,lamda_4)) + z_up_down = cross_multiply(direction_variables("+z",i*num_dim,1,1,lamda_4), direction_variables("-z",(i+1)*num_dim,1,1,lamda_4)) + z_down_up = cross_multiply(direction_variables("-z",i*num_dim,1,1,lamda_4), direction_variables("+z",(i+1)*num_dim,1,1,lamda_4)) + terms += x_out_in + x_in_out + y_right_left + y_left_right + z_up_down + z_down_up + return terms + + + +def read_validate_solution(solution: dict, num_turns: int, num_dim: int): + + ''' + Purpose: + To validate the solution returned by the solver. Make it readable, and analyze if it makes sense. + Inputs: + 1. solution: The solution results dictionary which is returned by the solver (results["configuration"]). + 2. num_turns: The number of turns for the simulation. + 3. num_dim: The number of dimensions, which is 3 for this sample (3D). + Outputs: + 1. valid: A boolean variable that specifies the validity of the solution. + 2. pos_dit: Layered position dictionary that contains all of the nodes' locations per turn {turn: {x: x_pos, y:y_pos, z:z_pos}}. + 3. dir_dict: Dictionary containing the linguistic interpretation of the 3-substring directions. + 4. var_dict: Dictionary containing the spin per optimized variable + 5. x_arr: Array of x positions. + 6. y_arr: Array of y positions. + 7. z_arr: Array of z positions. 
+ ''' + + print('\n') + valid = True + move = '' + sol_str = '' + x_arr = [0] + y_arr = [0] + z_arr = [0] + dir_dict = {'100':'out','010':'in','001':'right','110':'left','101':'up','011':'down'} + pos_dict = {0:{"x":0, "y":0, "z":0}} + var_dict = {} + for key,val in solution: + if key<(num_turns*num_dim): + turn = floor(key/num_dim)+1 + print("Turn: "+str(turn),"var: "+str(key),"spin: "+str(val)) + var_dict |= {str(key): val} + if key%3 Date: Tue, 19 Jul 2022 13:45:00 +0200 Subject: [PATCH 07/10] Delete self-avoiding-walk.html --- .../self-avoiding-walk.html | 15645 ---------------- 1 file changed, 15645 deletions(-) delete mode 100644 samples/self-avoiding-path/self-avoiding-walk.html diff --git a/samples/self-avoiding-path/self-avoiding-walk.html b/samples/self-avoiding-path/self-avoiding-walk.html deleted file mode 100644 index 5b3d7e4..0000000 --- a/samples/self-avoiding-path/self-avoiding-walk.html +++ /dev/null @@ -1,15645 +0,0 @@ - - - - - -self-avoiding-walk - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - From 26fe2bc4eb22a3afe5d49305b381e338c52b3e49 Mon Sep 17 00:00:00 2001 From: Max Lucassen <74817215+maximilianluc@users.noreply.github.com> Date: Tue, 19 Jul 2022 13:45:08 +0200 Subject: [PATCH 08/10] Delete self-avoiding-walk.ipynb --- .../self-avoiding-walk.ipynb | 1086 ----------------- 1 file changed, 1086 deletions(-) delete mode 100644 samples/self-avoiding-path/self-avoiding-walk.ipynb diff --git a/samples/self-avoiding-path/self-avoiding-walk.ipynb b/samples/self-avoiding-path/self-avoiding-walk.ipynb deleted file mode 100644 index be93700..0000000 --- a/samples/self-avoiding-path/self-avoiding-walk.ipynb +++ /dev/null @@ -1,1086 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Self Avoiding Walk with Azure Quantum Inspired Optimization\n", - "\n", - "In this notebook we'll cover how to formulate an optimization problem to find a path through a 3D lattice that does 
not cross itself (self-avoiding). The optimization problem is solved with the Azure Quantum service which contains numerous heuristic (non-linear) optimization solvers. Finding a self-avoiding path in a 3D lattice can be considered a difficult problem, in the sense that it suffers from exponential scaling conditioned on the number of turns and the number of dimensions (2D vs 3D, etc.). \n", - "\n", - "In this notebook, a step-by-step approach is taken to explain the function definitions that are necessary to create the optimization problem.\n", - "\n", - "Goal: To find a path in a 3D lattice that does not cross itself.\n", - "\n", - "To clarify some vocab and assumptions used in the notebook:\n", - "1. The number of dimensions is 3 (3D), meaning the path can be represented in a $x$-$y$-$z$ plane.\n", - "2. The position represents the location in the x-y-z plane, thus given by ($x$,$y$,$z$).\n", - "3. A direction describes the orientation within the x-y-z plane, thus in {$+x$,$-x$,$+y$,$-y$,$+z$,$-z$}.\n", - "4. \"Turns\" are equivalent to \"steps\". After each turn a new position is acquired that must be unique (not visited before). \n", - "5. The total number of turns is equivalent to the number of positions that need to be visited minus one ($N-1$). \n", - "6. The decision variables for the optimization function are denoted by \"q\" because \"x\" is already associated with a direction, and are referred to as \"optimization variables\".\n", - "\n", - "Note: Because the number of terms for this optimization problem grows explosively with the number of turns, you might want to try running this in the Azure Quantum notebooks. The more technical reason for this is that expansions of nonlinear terms have to be computed locally, resulting in a massive number of terms needing to be uploaded. 
Unless you are very patient, a recommendation would be to either check out the online notebook experience or rewrite this notebook's problem class to its streaming counterpart (https://docs.microsoft.com/en-us/azure/quantum/optimization-streaming-problem). \n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Import the necessary dependencies for the notebook" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "import time\n", - "from math import floor, log2\n", - "from azure.quantum import Workspace\n", - "from azure.quantum.optimization import Problem, ProblemType, Term, ParallelTempering, Tabu, SimulatedAnnealing\n", - "from azure.identity import ClientSecretCredential\n", - "from mpl_toolkits import mplot3d\n", - "import numpy as np\n", - "import matplotlib.pyplot as plt" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "## Connect to your Azure Quantum workspace\n", - "\n", - "To run the sample, you'll need to have a quantum workspace. Check out this module if you don't have one yet: https://docs.microsoft.com/en-us/learn/modules/get-started-azure-quantum/.\n", - "Fill in the variables below." - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "workspace = Workspace(\n", - " subscription_id = \"\",\n", - " resource_group = \"\",\n", - " name = \"\",\n", - " location = \"\",\n", - " credential = ClientSecretCredential(tenant_id=\"\",\n", - " client_id=\"\",\n", - " client_secret=\"\")\n", - ")\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Print readable cost functions\n", - "\n", - "Throughout the notebook you'll probably realize that printing the \"terms\" isn't going to provide much help, mainly because there will be too many of them and their dictionary format. 
A term is the way a mathematical term is expressed in terms of a dictionary for the SDK (see examples). Below a function is defined that prints the term(s) dictionaries that describe the constraint/cost function in terms of \"q\" optimization variables. You can call the function to check if the working is correct, or if you're unsure of what a constraint looks like. Note that for a large problem it nevertheless becomes difficult to understand the entire function output because of the number of terms.\n", - "\n", - "An example:\n", - "{'c': 1, 'ids': [0, 10, 11, 12]} ---> $1q_0q_{10}q_{11}q_{12}$\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def print_function(terms: list):\n", - "\n", - " '''\n", - " Purpose:\n", - " Takes a list of terms and prints it out as a mathematical (cost/constraint) function.\n", - " Example:\n", - " {'c': 1, 'ids': [0, 10, 11, 12]} ---> 1q_0q_10q_11q_12\n", - " Inputs:\n", - " 1. terms: the list of terms.\n", - " '''\n", - " \n", - " k = 0\n", - " final_string = ''\n", - " final_string = ''\n", - " for term in terms:\n", - " term = term.to_dict()\n", - " weight = term['c']\n", - " ids = term['ids']\n", - " string = '('\n", - " if weight >= 0:\n", - " if k == 0: \n", - " string = '('+str(weight)\n", - " else:\n", - " string = '+' + '('+str(weight)\n", - " if weight < 0:\n", - " if k == 0:\n", - " string = '(' + str(abs(weight))\n", - " else: \n", - " string = '-' + '(' + str(abs(weight))\n", - " for id_ in ids:\n", - " string = string + f'q_{id_}'\n", - " string = string + ')'\n", - " final_string = final_string + string\n", - " k += 1\n", - "\n", - " print('[ ' + final_string + ' ]')" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Expansion of two term lists\n", - "\n", - "Throughout the notebook we will need to cross-multiply nonlinear terms, for computing squares for example. The function below performs the expansion. 
An important note to keep in mind here, especially if you're looking to optimize the code, is that the function does not assemble identical terms. Since the cost functions dealt with in this notebook are still rather small, reducing the number of terms was left out of the scope. \n", - "\n", - "More clearly stated in terms of equations:\n", - "\n", - "$$ \\text{Current function (see below): } \\hspace{0.2cm} (a+b)^2 = a^2 + ab + ab + b^2 $$\n", - "$$ \\text{Optimal function: } \\hspace{0.2cm} (a+b)^2 = a^2 + 2ab + b^2 $$\n", - "\n", - "Should be a fun programming exercise to reduce the number of terms significantly!" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def cross_multiply(list_a: list, list_b: list) -> list:\n", - "\n", - " '''\n", - " Purpose: Cross multiplies two lists of terms (linear ex. [q_0 + q_1] or non-linear ex. [q_0q_1]) to return the expansion.\n", - " Can compute powers of groups this way (^2, ^3,...), like squaring a list of terms.\n", - " Calculates the expansion locally, unlike the SlcTerm class.\n", - " Example: (2q_0q_1+3q_2q_3)^2 => (2q_0q_1)^2 + 6q_0q_1q_2q_3 + 6q_0q_1q_2q_3 + (3q_2q_3)^2\n", - " Input:\n", - " 1. list_a: list which serves as the reference list (first 'for' loop).\n", - " 2. list_b: list which serves as the target list (second 'for' loop).\n", - " Output:\n", - " 1. list of term objects.\n", - " '''\n", - "\n", - " terms = []\n", - " for one in list_a:\n", - " for uno in list_b:\n", - " alpha = one.to_dict()\n", - " beta = uno.to_dict()\n", - " weight = int(alpha['c'])*int(beta['c'])\n", - " ids = list(alpha['ids'])+list(beta['ids'])\n", - " terms += [Term(c = weight, indices = ids)] \n", - " return terms\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Parameters for running through the notebook\n", - "\n", - "While running through the notebook you might want to execute and print some of the constraint functions. 
To do that, you'll need some variables to be defined. Only 3 turns are considered with the defined parameters below, as that will keep the function outputs small and understandable!" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "nodes = \"ABCD\" # The four position/node names.\n", - "len_seq = len(nodes) # The length of the node \n", - "num_turns = len(nodes)-1 # The number of turns, which is one less than the number of therefore -1 turns.\n", - "num_dim = 3 # Number of optimization variables required to describe a turn\n", - "lambda_0 = 1 # Penalty weight for the 'distance constraint'\n", - "lambda_1 = 40 # Penalty weight for the 'no return constraint'\n", - "lambda_2 = 25 # Penalty weight for the invalid direction '000' constraint\n", - "lambda_3 = 25 # Penalty weight for the invalid direction '111' constraint" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Part 1. Encoding the directions \n", - "\n", - "Prior to starting to define our cost function, we have to construct some basic functions and agree on some definitions. In this part, we'll define the 6 directions of the x-y-z plane in terms of the optimization variables (\"q\"). \n", - "\n", - "A common way to encode a turn based optimization problem is through a direction-based string, in which each optimization variable substring (ex. $q_0q_1q_2$) denotes some kind of decision of which direction was takn. For example, take a car take can only move backward or forward. The decision of the driver at some time $t$ can be described as $q_t \\in \\{0, 1\\}$, where 0 represents going backward and 1 forward, respectively. 
Over multiple time steps, say 3, one can then describe the movement of the car by:\n", - "\n", - "$$ \\text{Movements:} \\hspace{0.25cm} q_0q_1q_2 $$\n", - "\n", - "The sequence of movements, \"forward, backward, backward\", can then be represented as:\n", - "\n", - "$$ \\text{Sequence of movements:} \\hspace{0.25cm} q_0q_1q_2 = 100$$\n", - "\n", - "Alright, if that is clear to you, then the next step is to represent the 6 directions of the x-y-z plane in such a fashion. Regrettably, a \"q\" can only be either 0 or 1, not 2, 3, 4, 5 to represent the six directions. But what can be done is to use multiple optimization variables to describe a direction! For example:\n", - "\n", - "$$ \\text{Sequence of movements:} \\hspace{0.25cm} q_0q_1q_2q_3q_4q_5q_6q_7q_8 $$\n", - "$$ \\text{First move:} \\hspace{0.25cm} q_0q_1q_2 $$\n", - "$$ \\text{Second move:} \\hspace{0.25cm} q_3q_4q_5 $$\n", - "$$ \\text{Third move:} \\hspace{0.25cm} q_6q_7q_8 $$\n", - "\n", - "Because we need to encode 6 directions, we need at least 3 optimization variables to form unique substrings. The table explains this: we need to have enough possible combinations to encode the 6 directions:\n", - "\n", - "
\n", - "\n", - "| Opt. var. substring | Combinations | \n", - "| ----------------------------- | -------------------------- |\n", - "| $q_0 \\cdot q_1$ | $2\\cdot 2 = 4 < 6$ |\n", - "| $q_0 \\cdot q_1 \\cdot q_2$ | $2\\cdot 2\\cdot 2 = 8 > 6$ |\n", - "\n", - "
\n", - "\n", - "Note, for later, you should keep in mind that 2 of the 8 combinations become irrelevant. It is important that the solver does not return those strings!\n", - "\n", - "Perfect! Now we just need to assign each direction a unique substring. Below you can find my choices, feel free to change these if you're starting from scratch.\n", - "\n", - "
\n", - "\n", - "| Direction | Opt. var. substring | \n", - "| --------- | ----------------- |\n", - "| +x | 100 |\n", - "| -x | 010 |\n", - "| +y | 001 |\n", - "| -y | 110 |\n", - "| +z | 101 |\n", - "| -z | 011 |\n", - "| N/A | 000 |\n", - "| N/A | 111 |\n", - "\n", - "
\n", - "\n", - "Now we just need to define direction variables. These are as defined in the above table. These variables should take a value 1 if a movement is made in that direction, while the other directions must all be zero. This can be achieved by the following scheme, where $k$ denotes the turn, and $\\gamma = 3(k-1)$ (3 because 3 dimensions):\n", - "\n", - "
\n", - "\n", - "| Direction | Opt. var. substring | Formula | \n", - "| ------------- | ---------------- | -------------------------------------------------- |\n", - "| $d_{+x}^{k}$ | 100 | $ q_{0+\\gamma} (1-q_{1+\\gamma}) (1-q_{2+\\gamma})$ |\n", - "| $d_{-x}^{k}$ | 010 | $ (1-q_{0+\\gamma}) q_{1+\\gamma} (1-q_{2+\\gamma})$ |\n", - "| $d_{+y}^{k}$ | 001 | $ (1-q_{0+\\gamma}) (1-q_{1+\\gamma}) q_{2+\\gamma}$ | \n", - "| $d_{-y}^{k}$ | 110 | $ q_{0+\\gamma} q_{1+\\gamma} (1-q_{2+\\gamma}) $ |\n", - "| $d_{+z}^{k}$ | 101 | $ q_{0+\\gamma} (1-q_{1+\\gamma}) q_{2+\\gamma} $ |\n", - "| $d_{-z}^{k}$ | 011 | $ (1-q_{0+\\gamma}) q_{1+\\gamma} q_{2+\\gamma} $ |\n", - "\n", - "
\n", - "\n", - "To clarify a bit further through an example:\n", - "If in the first turn (k=0) the solver returns $q_0=1$, $q_1=0$, $q_2=0$, and in the second turn (k=1) returns $q_3=0$, $q_4=0$, $q_5=1$, then a \"+x and +y\" were taken, respecively.\n", - "\n", - "These direction variables will help understand some difficult constraints later on. Defining these direction variables additionally makes the code much more readable, since we can define everything in terms of the direction variables instead of the individual optimization variables.\n", - "\n", - "Below you can find the function for the direction variables. The formulas have been expanded (mathematically) to easily declare them in a number of terms, however it is hard-coded this way. Some inputs to the function (\"sign_dir\", \"sign_pos\", \"lambda_\") are relevant for building constraints later in the notebook, but have to defined in this function. Further information can be found in the function docstring. \n", - " " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def direction_variables(direction: str, offset: int, sign_dir: int, sign_pos: int, lambda_: int) -> list:\n", - "\n", - " '''\n", - " Purpose:\n", - " Translates the direction (+x,-x,+y,-y,+z,-z) of turn 'i' as a function of three optimization variables. (Three q's because of the defined coordinate system).\n", - " Example:\n", - " Direction \"+z\" in the first turn (turn = 1) is translated to: q_{0+offset}q_{2+offset}-q_{0+offset}q_{1+offset}q_{2+offset}.\n", - " Inputs:\n", - " 1. direction: A direction from an x-y-z coordinate system, one of the following: ('+x','-x','+y','-y','+z','-z').\n", - " 2. offset: Offset gives the turn number expressed in the first \"q\" of that turn. Equal to gamma in the explanation.\n", - " Example: Turn 1 starts with \"q\" q_0, offset=0. Turn 2 starts with q_3, offset = 3.\n", - " 3. 
sign_dir: Changes the sign of the weights corresponding to negative directions \"-x\", \"-y\", \"-z\" -> necessary for finding the positions, for exmaple (+x) \"-\" (-x).\n", - " 4. sign_pos: Changes the sign of the weights corresponding to negative positions \"-(x,y,z)\" -> necessary for finding the distances between node \"i\" and node \"j\".\n", - " 5. lambda_: The weight term associated with a constraint.\n", - " Output:\n", - " 1. A list of term objects.\n", - " '''\n", - "\n", - " terms = []\n", - " if direction == \"+x\":\n", - " term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset])\n", - " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", - " term_2 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", - " term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", - " terms = [term_0, term_1, term_2, term_3]\n", - " elif direction == \"-x\":\n", - " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset])\n", - " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", - " term_2 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", - " term_3 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", - " terms = [term_0, term_1, term_2, term_3]\n", - " elif direction == \"+y\":\n", - " term_0 = Term(c= 1*sign_pos*lambda_, indices=[2+offset])\n", - " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", - " term_2 = Term(c=-1*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", - " term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", - " terms = [term_0, term_1, term_2, term_3]\n", - " elif direction == \"-y\":\n", - " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", - " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", - " terms = [term_0, term_1]\n", - " elif direction == \"+z\":\n", - " term_0 = Term(c= 
1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", - " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", - " terms = [term_0, term_1]\n", - " elif direction == \"-z\":\n", - " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", - " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", - " terms = [term_0, term_1]\n", - " return terms\n", - "\n", - "\n", - "##### ----- Test the function and print output:\n", - "turn = 1 # play with this value! \n", - "dir_var = direction_variables(\"+x\",(turn-1)*num_dim,1,1,lambda_0) \n", - "print('dir_var term dictionary \"+x\": ', dir_var)\n", - "print_function(dir_var)\n", - "\n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Part 2. Finding the difference in positions\n", - "\n", - "Great that we have the directions defined! Now let's use them and define a function that calculates the difference in positions, which we will need later. After each turn, a direction that appends to the path. A valid path is defined as a one that does not cross itself, meaning that we need to compare the positions over the turns. In other words, every new position appended to the path needs to be checked with all previously held positions, to verify that a position hasn't been visited twice. \n", - "\n", - "So how do we go about this?\n", - "\n", - "First we need a way to know the positions after choosing to go in a certain direction, so let's tackle that first. Consider the fact that the directions are recorded for each turn, which already gives some sort of log of the positions in the path. By summing the direction variables respective to their dimension (x/y/z) acoomplishes this, but only if a negative move can compensate a positive one. 
For example, after two turns the $x$-location can be expressed as:\n", - "\n", - "$$ x_2 = ( d^{1}_{+x} - d^{1}_{-x} ) + ( d^{2}_{+x} - d^{2}_{-x} )$$\n", - "\n", - "**_NOTE:_** In the above function (\"direction_variables\"), the negative sign for the negative direction variables is controlled through \"sign_dir\". \"sign_dir\" must be set to -1 to assign a negative sign to it as required in these position formulas!\n", - "\n", - "\n", - "Remember that for a turn only one direction variable can be set to 1! Thus if two moves in the $-x$ direction are taken, then:\n", - "\n", - "$$ x_2 = ( d^{1}_{+x} - d^{1}_{-x} ) + ( d^{2}_{+x} - d^{2}_{-x} ) = ( 0 - 1 ) + ( 0 - 1 ) = -2 $$\n", - "\n", - "As with the simple example for the x-dimension, the same can be applied to the $y$ and $z$ directions. The formulas below describe the position after $n$ turns through a summation (for the maths/physics enthusiasts, these are integrals of the velocities to derive the positions :) ).\n", - "\n", - "$$ x_n = \\sum_{k=1}^{n} ( d^{k}_{+x} - d^{k}_{-x} ) $$\n", - "$$ y_n = \\sum_{k=1}^{n} ( d^{k}_{+y} - d^{k}_{-y} ) $$\n", - "$$ z_n = \\sum_{k=1}^{n} ( d^{k}_{+z} - d^{k}_{-z} ) $$\n", - "\n", - "Great stuff! Now we have a method to find the positions along the path. 
To find the differences in position, for example between turn 2 and turn 1, it is only necessary to apply a subtraction: \n", - "\n", - "$$ x_2 - x_1 = \\sum_{k=1}^{2} ( d^{k}_{+x} - d^{k}_{-x} ) - \\sum_{k=1}^{1} ( d^{k}_{+x} - d^{k}_{-x}) = ( d^{2}_{+x} - d^{2}_{-x} ) $$\n", - "$$ y_2 - y_1 = \\sum_{k=1}^{2} ( d^{k}_{+y} - d^{k}_{-y} ) - \\sum_{k=1}^{1} ( d^{k}_{+y} - d^{k}_{-y}) = ( d^{2}_{+y} - d^{2}_{-y} ) $$\n", - "$$ z_2 - z_1 = \\sum_{k=1}^{2} ( d^{k}_{+z} - d^{k}_{-z} ) - \\sum_{k=1}^{1} ( d^{k}_{+z} - d^{k}_{-z}) = ( d^{2}_{+z} - d^{2}_{-z} ) $$\n", - "\n", - "Generalizing this to any difference between two positions:\n", - "\n", - "$$ x_j - x_i = \\sum_{k=i+1}^{j} ( d^{k}_{+x} - d^{k}_{-x} ) $$\n", - "$$ y_j - y_i = \\sum_{k=i+1}^{j} ( d^{k}_{+y} - d^{k}_{-y} ) $$\n", - "$$ z_j - z_i = \\sum_{k=i+1}^{j} ( d^{k}_{+z} - d^{k}_{-z} ) $$\n", - "\n", - "Fantastic! Now on to the function code for the difference in positions. Do read the function and its docstring to understand the implementation, because it references the previously defined function to make use of direction variables. \n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def diff_in_pos(start_turn: int, end_turn: int, num_dim: int, lamda_: int):\n", - "\n", - " '''\n", - " Purpose:\n", - " Expresses the difference in position (x,y,z) between two turns as a function of the q's encoding of the directions.\n", - " In other words, expresses the difference in the position after the start_turn and position after the end_turn.\n", - " Example:\n", - " Difference between turn 0 (no turns yet, initial position = (0,0,0)) and turn 2:\n", - " x(2) = [ move(+x, turn 1) - move(-x, turn 1) ] + [ move(+x, turn 2) - move(-x, turn 2) ]\n", - " Note: only one 'move' per turn gets activated as they are represented by the same q's (ex. turn 1 is represented by q_0, q_1, and q_2).\n", - " Inputs:\n", - " 1. 
start_turn: the initial (reference) turn.\n", - " 2. end_turn: the final (target) turn.\n", - " 3. num_dim: the number of dimensions (3, x-y-z coordinate system).\n", - " Outputs:\n", - " 1. The difference in the x direction.\n", - " 2. The difference in the y direction.\n", - " 3. The difference in the z direction. \n", - " '''\n", - "\n", - " x_diff = y_diff = z_diff = []\n", - " if start_turn < end_turn and start_turn >= 0 and end_turn >= 1:\n", - " for turn in range(start_turn,end_turn+1):\n", - " x_diff += direction_variables(\"+x\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-x\",(turn-1)*num_dim,-1,1,lamda_)\n", - " y_diff += direction_variables(\"+y\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-y\",(turn-1)*num_dim,-1,1,lamda_)\n", - " z_diff += direction_variables(\"+z\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-z\",(turn-1)*num_dim,-1,1,lamda_)\n", - " return x_diff, y_diff, z_diff\n", - "\n", - "\n", - "##### ----- Test the function and print output: \n", - "start_turn = 1 # play with this value! \n", - "end_turn = 2 # play with this value! \n", - "x_diff, y_diff, z_diff = diff_in_pos(start_turn, end_turn, num_dim, lambda_0)\n", - "print('Difference in x described as term list: \\n', x_diff)\n", - "print('\\nDifference in x described as mathematical function:')\n", - "print_function(x_diff)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Part 3. The distance constraint\n", - "\n", - "Fantastic that you've made it this far! With all the above functions defined we can start solving the problem. \n", - "\n", - "The distance constraint enforces that after each turn, the difference in positions after turns $i$ and $j$ must be larger or equal to 1 (distance between lattice points in the same dimension). 
\n", - "To visualize the scenario this constraint tries to penalize, consider a 2D example with 4 turns, starting in $(0,0)$:\n", - "\n", - "$$ \\text{Turn 1, go right: } \\hspace{0.3cm} (0,0) => (0,1) $$ \n", - "$$ \\text{Turn 2, go up: } \\hspace{0.3cm} (0,1) => (1,1) $$ \n", - "$$ \\text{Turn 3, go left: } \\hspace{0.3cm} (1,1) => (1,0) $$ \n", - "$$ \\text{Turn 4, go down: } \\hspace{0.3cm} (1,0) => (0,0) $$ \n", - "\n", - "As you can see, the last step conflicts with our constraint. It is not permitted to return to a position where we've already been, namely $(0,0)$. Turns 1-3 are all valid, since they remain a distance of at least 1 away from all other previously held positions.\n", - "\n", - "Let's define what we want mathematically. The distance between the positions after turns $i$ and $j$ must be larger than or equal to 1. For this we'll need some basic geometry, the 3D variant of the Pythagorean theorem. From the theorem, it can be understood that the hypotenuse ($C_{i,j}$) must always be larger than or equal to one, since that is what defines the distance between two points. Working this out mathematically:\n", - "\n", - "$$ C_{i,j} \\geq 1 $$\n", - "$$ \\sqrt{(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} \\geq 1 $$\n", - "\n", - "The square-root is a bit of a headache when writing out a cost function, it would require an approximation or some sort of factorization, not fun if you're dealing with many terms. To avoid that, we're simply going to square both sides, which in our case is fine (for maths people), since we aren't dealing with negative numbers here:\n", - "\n", - "$$ C_{i,j}^2 \\geq 1 $$\n", - "$$ {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} \\geq 1 $$\n", - "\n", - "Nice! If you're sharp, you'll start seeing where the previous functions might come in handy now. 
The function that computes the difference between the respective positions (\"diff_in_pos\") in each dimension was defined above, but also the function that computes the an expansion (\"cross_multiply\") was defined at the beginning of the notebook. Writing those function calls out in order :\n", - "\n", - "1. We call \"diff_in_poss\" to calculate the difference in positions for each dimension (x,y,z).\n", - "2. For each dimension, the square is calculated by calling \"cross_multiply\". \n", - "\n", - "Alright, you might be wondering how to deal with the $>=$, since it is necessary to have an equation that equals zero in order to integrate it into the cost function. \n", - "This is where slack variables come in. The purpose of slack variables is to convert an inequality constraint into an equality constraint. Or in other words, for this equation, we need to compensate some values (explained further below) in order to convert the equation to an equality constraint. Consider the constraint in its simplest form:\n", - "\n", - "$$ C_{i,j}^2 \\geq 1 $$\n", - "\n", - "It is clear that we would need to add some number $V_{i,j}$, on the right hand side of the equation in order to make this an equality constraint. $V_{i,j}$ can be any positive value and is conditioned on $i$ and $j$: \n", - "\n", - "$$ C_{i,j}^2 = 1+V_{i,j}$$\n", - "\n", - "Let's say that instead of representing a single value we want V_{i,j} to represent a range of values $[0-4]$. This is where slack variables can be introduced. By introducing additional optimization variables, which have nothing to do with the path encoding, the range can be described as following:\n", - "\n", - "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+q_{s3}+q_{s4} $$\n", - "\n", - "Or more compactly:\n", - "\n", - "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+2q_{s3} $$\n", - "\n", - "So any value in the range $[0-4]$ is described through these q's. You can derive 1 by assigning a single \"q\", which has weight 1, the value 1. 
Likewise, you can get the value 4 by assigning all optimization variables the value 1. \n", - "\n", - "Alright, so how do we know which range of values we need to represent? That is revealed by the turn numbers, $i$ and $j$. Over these turns, the maximum squared distance that can be achieved is when moves are only made in a single direction, the \"+x\" direction for example. The maximum distance is then equal to the number of moves squared $(j-i)^2$.\n", - "\n", - "$$ C_{i,j}^2 = (j-i)^2 $$\n", - "\n", - "Then writing out the maths gives us the necessary upper bound for the range that the optimization variables need to represent, where $S$ stands for the number of slack variables necessary:\n", - "\n", - "$$ \\text{Upper bound: } \\hspace{0.5cm} C_{i,j}^2 = (j-i)^2 = 1 + \\sum_{s=0}^{S}q_s$$\n", - "$$ \\text{Upper bound: } \\hspace{0.5cm} \\sum_{s=0}^{S}q_s = (j-i)^2 - 1 $$\n", - "\n", - "For the lower bound of the range, the value is 0. The reason for that is we want to be able to represent any number equal to or larger than 1 for the inequality constraint through the addition of the slack variables. Concluding, the range the q's must represent is $[0,((j-i)^2-1)]$. More on how to calculate the number of slack variables necessary to define this range later, as you don't need ((j-i)^2-1) optimization variables!\n", - "\n", - "\n", - "Piecing all the parts together we find the following equation for a $i$-$j$ combination:\n", - "\n", - "$$ {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} = 1 + \\sum_{s=0}^{S}q_s $$ \n", - "\n", - "Because constants are irrelevant for the optimization landscape the value 1 can be neglected. The reason being that constants only introduce linear offsets, thus impacting the entire optimization equally. 
The distance constraint which needs to account for all $i$-$j$ combinations, where $j$>$i$ and $N-1$ the number of turns, is summarized as follows:\n", - "\n", - "$$ \\sum_{i=1}^{N-1} \\sum_{j>i}^{N-1} \\lambda_0 ( {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} - \\sum_{s=0}^{S}q_s ) $$ \n", - "\n", - "The function that builds this constraint is presented below. Read the docstring for how it works.\n", - "`Note, to run this function you'll need to run the next function cell to define 'generate_slack_coefficients'.` \n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def distance_constraint(num_turns: int, num_dim: int, lambda_0: int) -> list:\n", - "\n", - " '''\n", - " Purpose:\n", - " Build the distance contraint based on previosly defined functions.\n", - " Constraint: Distance squared between i and j must be larger or equal to 1.\n", - " Constraint: L_{i,j}^2 >= 1 => L_{i,j}^2 = 1+q_{slacker} (converting the inequality constraint to an equality constraint.)\n", - " Example/Explanation:\n", - " L{1,2}^2 = (x1-x2)^2 + (y1-y2)^2 + (z1-z2)^2\n", - " x1 = [move(+x1)-move(-x1)]\n", - " x2 = [move(+x1)-move(-x1)] + [move(+x2)-move(-x2)]\n", - " \n", - " \n", - " L{1,2}^2 = [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2\n", - " [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2 - q_{slacker} = 0 ---> expressed in q's == cost function\n", - " Inputs:\n", - " 1. num_turns: the number of turns.\n", - " 2. num_dum: the number of dimensions.\n", - " 3. lambda_0: the constraint weight for the distance constraint.\n", - " Output:\n", - " 1. List of term objects describing the distance constraint.\n", - " '''\n", - "\n", - " terms = []\n", - " slack_indexer = 0\n", - " for start_turn in range(1,num_turns+1):\n", - " for end_turn in range(start_turn+1,num_turns+2):\n", - " # Calculate the differences in positions for each dimension. 
\n", - " x_diff_i_j, y_diff_i_j, z_diff_i_j = diff_in_pos(start_turn, end_turn, num_dim, lambda_0)\n", - " # Compute the squared distance (Pythagorean theorem) by calculating the squared expansion.\n", - " x_diff_i_j_2, y_diff_i_j_2, z_diff_i_j_2 = cross_multiply(x_diff_i_j,x_diff_i_j), cross_multiply(y_diff_i_j,y_diff_i_j), cross_multiply(z_diff_i_j,z_diff_i_j) \n", - " # Add slack variables due to inequality constraint. \n", - " slack_var_terms = []\n", - " slack_coefficients = generate_slack_coefficients(end_turn-start_turn)\n", - " for s in range(0,len(slack_coefficients)):\n", - " slack_var_terms += [Term(c=-slack_coefficients[s], indices=[num_turns*num_dim+slack_indexer+s])]\n", - " terms += x_diff_i_j_2 + y_diff_i_j_2 + z_diff_i_j_2 + slack_var_terms\n", - " slack_indexer+=len(slack_coefficients)\n", - " return terms\n", - "\n", - "##### ----- Test the function and print output: \n", - "# The output is too large to understand, nevertheless you can run the below statements to view how visualize the term-scaling of the problem.\n", - "number_turns = 2 #play with this value!\n", - "dist_terms = distance_constraint(number_turns, num_dim, lambda_0)\n", - "\n", - "# Only print below statements if you want to get an impression of the number of terms.\n", - "#print('Distance constraint term dictionaries: ', dist_terms) # not readable!\n", - "#print('\\nDistance constraint: ') \n", - "#print_function(dist_terms) # not readable!" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Part 4. Intermezzo: Slack Variables Weights\n", - "\n", - "To remove any human calculations to construct the distance constraint(s), we'll automate the computation of the number of slack variables and their weights. \n", - "\n", - "As you saw in the previous part, certain slack variables can be assigned weights to reduce the number of slack variables necessary. 
Recall that the range $[0,4]$ can be defined by the following two equations with slack variables (s):\n", - "\n", - "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+q_{s3}+q_{s4} $$\n", - "\n", - "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+2q_{s3} $$\n", - "\n", - "The bottom equation is more compact because the last variables carries a weight-2. In Lucas' paper (see 2.4 of arxiv:1302.5843) the algorithm to find such weights is presented, which is based on calculating all $2^{x}$, where $x$ iterates from zero to the log_2 of maximum value in the range (4 in this example). \n", - "\n", - "Below are two examples that may help visualize why and how the slack variables represent the ranges of values. \n", - "\\\n", - " \n", - "\n", - "\n", - "
\n", - "\n", - "Example for range $[0,4]$:\n", - "| $q_{s1}$ | $2q_{s2}$ | $q_{s3}$ | Value |\n", - "| ------ | -------- | -------- | ---------------- |\n", - "| 0 | 0 | 0 | 0 + 2(0) + 0 = 0 |\n", - "| 1 | 0 | 0 | 1 + 2(0) + 0 = 1 |\n", - "| 0 | 1 | 0 | 0 + 2(1) + 0 = 2 |\n", - "| 1 | 1 | 0 | 1 + 2(1) + 0 = 3 |\n", - "| 1 | 1 | 1 | 1 + 2(1) + 1 = 4 | \n", - "\n", - "
\n", - "\n", - "\\\n", - " \n", - "\n", - "
\n", - "\n", - "Example for range $[0,20]$:\n", - "Rather than using twenty optimization variables, five with weights can achieve the same!\n", - "| $q_{s1}$ | $2q_{s2}$ | $4q_{s3}$ | $8q_{s4}$ | $5q_{s5}$ | Value |\n", - "| ------ | ------- | --------- | ----------- | --------- | ------------------- |\n", - "| 0 | 0 | 0 | 0 | 0 | 0 + 2(0) + 4(0) + 8(0) + 5(0) = 0 |\n", - "| 1 | 0 | 0 | 0 | 0 | 1 + 2(0) + 4(0) + 8(0) + 5(0) = 1 |\n", - "| 0 | 1 | 0 | 0 | 0 | 0 + 2(1) + 4(0) + 8(0) + 5(0) = 2 |\n", - "| 1 | 1 | 0 | 0 | 0 | 1 + 2(1) + 4(0) + 8(0) + 5(0) = 3 |\n", - "| 0 | 0 | 1 | 0 | 0 | 0 + 2(0) + 4(1) + 8(0) + 5(0) = 4 |\n", - "| ... | ... | ... | ... | ... | ... |\n", - "| 0 | 1 | 0 | 1 | 1 |0 + 2(1) + 4(0) + 8(1) + 5(1)= 15 |\n", - "| 1 | 1 | 0 | 1 | 1 |1 + 2(1) + 4(0) + 8(1) + 5(1)= 16 |\n", - "| 0 | 0 | 1 | 1 | 1 |0 + 2(0) + 4(1) + 8(1) + 5(1)= 17 |\n", - "| 1 | 0 | 1 | 1 | 1 |1 + 2(0) + 4(1) + 8(1) + 5(1)= 18 |\n", - "| 0 | 1 | 1 | 1 | 1 |0 + 2(1) + 4(1) + 8(1) + 5(1)= 19 |\n", - "| 1 | 1 | 1 | 1 | 1 |1 + 2(1) + 4(1) + 8(1) + 5(1)= 20 |\n", - "\n", - "
\n", - "\n", - "\\\n", - " \n", - "\n", - "The function is given below. In context of the distance constraint, we're still faced with a minor problem. If $(j-i)^2-1$ equals 0, then we don't need any slack variables. The reason for this is that the range becomes $[0,0]$, which can also be represented by no variables at all. " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def generate_slack_coefficients(turn_diff: int):\n", - "\n", - " ''' \n", - " Purpose: \n", - " Calculates the number of slack variables and their weights.\n", - " Example:\n", - " For the constraint: x1 + x2 + x3 + x4 <= 4 which is converted to x1 + x2 + x3 + x4 + s1 + s2 +2*s3 = 4, \n", - " with 's' being slack variables. This function computes the weights of these slack variables ([1,1,2] for the example).\n", - " Reference:\n", - " Lucas' paper (see 2.4 of arxiv:1302.5843)\n", - " Input:\n", - " 1. turn_diff: the differences in turns (end_turn - start_turn).\n", - " Output:\n", - " 1. y: the weights of the slack variables.\n", - " '''\n", - " \n", - " dist_diff = (turn_diff**2)-1\n", - " if dist_diff == 0:\n", - " y = [] # no slack variables needed\n", - " elif dist_diff > 0:\n", - " M = floor(log2(dist_diff))\n", - " y = [-2**n for n in range(M)]\n", - " y.append(-(dist_diff + 1 - 2**M))\n", - " return y\n", - "\n", - "##### ----- Test the function and print output: \n", - "turn_difference = 3 # play with this value!\n", - "slack_weights = generate_slack_coefficients(turn_difference)\n", - "print('Slack weights: ', slack_weights) \n" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Part 5. No Return Constraint\n", - "\n", - "The distance constraint enforces a minimum distance of 1 between the different taken positions. However, for two consecutive turns, it does not completely prevent (to a high enough degree) going to a previous position. 
A simplified explanation for this is that the distance constraint is described through the positional differences in $x$, $y$, and $z$. Additionally, for consecutive turns, the number of slack variables is zero ($(i-j)^2-1 = 0$ for consecutive turns} - thus there is no auxiliary benefit introduced by slack variables to compensate for being in a different position after the turn. Therefore, the solver will try to keep the positions as close to each other as possible, which leads to overlapping positions, especially in consecutive turns. To overcome this, a penalization needs to be introduced that stops returning to the previous position held in the turn before. For example, what we want to stop is the following:\n", - "\n", - "$$ \\text{Turn 1: A to B.} $$\n", - "$$ \\text{Turn 2: B to A.} $$\n", - "\n", - "This can be equivalenty described as moving in opposite directions over the consecutive turns. For example, first going in the \"+y\" direction, and following that moving in the \"-y\" direction. \n", - "\n", - "Designing such a constraint is straightforward, the opposite direction variables need to be multiplied. \n", - "Preventing a revisit of a position for the \"x\" direction over the first and second turn can be described by the following constraint:\n", - "\n", - "$$ {\\lambda}_2(d^{1}_{+x} d^{2}_{-x} + d^{1}_{-x}d^{2}_{+x}) $$ \n", - "\n", - "If a move is made in the \"+x\" direction first, $d^{1}_{+x}$ takes value 1. If afterwards a move is made in the \"-x\" direction, $d^{2}_{-x}$ also takes value 1, meaning that the combined term\n", - "$d^{1}_{+x} d^{2}_{-x}$ also becomes 1, enforcing the constraint with penalty value ${\\lambda}_2$. 
\n", - "\n", - "Generalizing the idea to any direction and for all turns, we find the \"no return constraint\":\n", - "\n", - "$$ {\\lambda}_1 \\left( \\sum_{m}^{\\in \\{x,y,z\\} }\\sum_{t=1}^{N-1} d^{t}_{+m} d^{t+1}_{-m} + d^{t}_{-m}d^{t+1}_{+m} \\right) $$ \n", - "\n", - "In this constraint, iterations are performed over the different dimensions ($m$), and the turn ($t$). The function defintion for the no return constraint is given below. Make sure to read the docstring. In the function the 'cross_multiply' method is used to expand and calculate all the necessary terms of the constraint. The direction variables are dictionaries of polynomials, and therefore have to be expanded before submitting to the Azure QIO solvers.\n", - "\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def no_return_constraint(num_turns: int, num_dim: int, lamda_4: int)-> list:\n", - " \n", - " '''\n", - " Purpose:\n", - " Build the constraint that penalizes going back to the same position/node two turns later.\n", - " Example:\n", - " Node A ---> ---> Node B ---> ---> Node A => erroneous as we've been there already.\n", - " Two sequential moves may not be in the same dimension and in opposite directions: (+x then -x), (-x then +x), (+y then -y) etc.\n", - " Inputs:\n", - " 1. num_turns: the number of turns.\n", - " 2. num_dim : the number of dimensions, which is 3 for this sample.\n", - " 3. lambda_4 : the penalty weight for this constraint.\n", - " Outputs:\n", - " 1. 
List of term objects.\n", - " '''\n", - "\n", - " terms = []\n", - " for i in range(0,num_turns):\n", - " x_out_in = cross_multiply(direction_variables(\"+x\",i*num_dim,1,1,lamda_4), direction_variables(\"-x\",(i+1)*num_dim,1,1,lamda_4))\n", - " x_in_out = cross_multiply(direction_variables(\"-x\",i*num_dim,1,1,lamda_4), direction_variables(\"+x\",(i+1)*num_dim,1,1,lamda_4))\n", - " y_right_left = cross_multiply(direction_variables(\"+y\",i*num_dim,1,1,lamda_4), direction_variables(\"-y\",(i+1)*num_dim,1,1,lamda_4))\n", - " y_left_right = cross_multiply(direction_variables(\"-y\",i*num_dim,1,1,lamda_4), direction_variables(\"+y\",(i+1)*num_dim,1,1,lamda_4))\n", - " z_up_down = cross_multiply(direction_variables(\"+z\",i*num_dim,1,1,lamda_4), direction_variables(\"-z\",(i+1)*num_dim,1,1,lamda_4))\n", - " z_down_up = cross_multiply(direction_variables(\"-z\",i*num_dim,1,1,lamda_4), direction_variables(\"+z\",(i+1)*num_dim,1,1,lamda_4))\n", - " terms += x_out_in + x_in_out + y_right_left + y_left_right + z_up_down + z_down_up\n", - " return terms\n", - "\n", - "\n", - "##### ----- Test the function and print output: \n", - "number_turns = 1 # play with this value!\n", - "nrc_terms = no_return_constraint(number_turns, num_dim, lambda_1)\n", - "print('No return constraint term dictionaries: ', nrc_terms)\n", - "print('\\n No return constraint function:')\n", - "print_function(nrc_terms)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Part 6. Penalize Invalid Moves\n", - "\n", - "Recall that there are two invalid optimization variable substrings that are not associated with any move, $000$ and $111$. A path that includes these substrings is invalid. To prevent the solver from generating these invalid directions we'll need to add two constraints. 
Each constraint is specific to an invalid direction, and because we're working directly with the substring we don't need the abstraction layers used in previous constraints, like directional and positional variables. \n", - "\n", - "Let's first work out the constraint for preventing substring $000$. $ q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma} $ may not equal $000$, where $\\gamma = 3(k-1)$ and $k$ the turn number. If we were to design the constraints as $ q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma} $ there won't be any penalty, because all $q$'s will equal and multiply to zero. Therefore, if all these $q$'s equal zero, we need the substring to multiply to 1. This is achieved by the following, which multiplies to zero if all optimization variables take the value zero:\n", - "\n", - "$$ {\\lambda}_2(1-q_{0+\\gamma}) (1-q_{1+\\gamma}) (1-q_{2+\\gamma}) $$\n", - "$$ \\text{If } \\hspace{0.1cm} q_{0+\\gamma} = q_{1+\\gamma} = q_{2+\\gamma} = 0, \\hspace{0.1cm} \\text{then: } $$ \n", - "$$ {\\lambda}_2(1-q_{0+\\gamma}) (1-q_{1+\\gamma}) (1-q_{2+\\gamma}) = {\\lambda}_2 \\cdot 1 $$\n", - "\n", - "\n", - "Nice! By expanding the equation and neglecting constant terms a constraint is found that can be implemented:\n", - "\n", - "$$\\text{Constraint for 000: }-q_{0+\\gamma}−q_{1+\\gamma}−q_{2+\\gamma}+q_{0+\\gamma}q_{1+\\gamma}+q_{0+\\gamma}q_{2+\\gamma}+q_{1+\\gamma}q_{2+\\gamma}−q_{0+\\gamma}q_{1+\\gamma}q_{2+\\gamma}$$\n", - "\n", - "Before going to the function definition, let's first look at penalizing the substring $111$. Luckily this is much easier as the substring multiplies to 1 if all the $q$'s have the value zero. 
The constraint is therefore simple to derive:\n", - "\n", - "$$ {\\lambda}_3 (q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma}) $$\n", - "$$ \\text{If } \\hspace{0.1cm} q_{0+\\gamma} = q_{1+\\gamma} = q_{2+\\gamma} = 1, \\hspace{0.1cm} \\text{then: } $$ \n", - "$$ {\\lambda}_3 (q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma}) = {\\lambda}_3 \\cdot 1$$\n", - "\n", - "The constraint for the substring $111$ is:\n", - "\n", - "$$ \\text{Constraint for $111$: }\\hspace{0.1cm} {\\lambda}_3 (q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma}) $$\n", - "\n", - "The function definitions for these two constraints are given below. \n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def penalize_000(len_seq: int, num_dim: int, lambda_2: int) -> list:\n", - "\n", - " '''\n", - " Purpose:\n", - " Build the constraint that penalizes the invalid moves associated with the 3 q's string: '000'.\n", - " The constraint needs to be defined over the set of all turns, as defined by the 'for' loop.\n", - " Example:\n", - " If turn 2 (q_3q_4q_5) equals '000', assign a large penalty.\n", - " Inputs:\n", - " 1. len_seq: the number nodes to consider.\n", - " 2. num_dim: the number of dimensions (which is 3).\n", - " 3. lambda_2: the penalty weight for this constraint.\n", - " Outputs:\n", - " 1. 
List of term objects.\n", - " '''\n", - " \n", - " terms = []\n", - " for k in range(0,len_seq):\n", - " offset = k*num_dim\n", - " term_0 = Term(c=-1*lambda_2,indices=[0+offset])\n", - " term_1 = Term(c=-1*lambda_2,indices=[1+offset])\n", - " term_2 = Term(c=-1*lambda_2,indices=[2+offset])\n", - " term_3 = Term(c= 1*lambda_2,indices=[0+offset,1+offset])\n", - " term_4 = Term(c= 1*lambda_2,indices=[0+offset,2+offset])\n", - " term_5 = Term(c= 1*lambda_2,indices=[1+offset,2+offset])\n", - " term_6 = Term(c=-1*lambda_2,indices=[0+offset,1+offset,2+offset])\n", - " terms += [term_0, term_1, term_2, term_3, term_4, term_5, term_6]\n", - " return terms\n", - "\n", - "def penalize_111(len_seq: int, num_dim: int, lambda_3: int) -> list:\n", - "\n", - " '''\n", - " Purpose:\n", - " Build the constraint that penalizes the invalid moves associated with the 3 q's string: '111'.\n", - " The constraint needs to be defined over the set of all turns, as defined by the 'for' loop.\n", - " Example:\n", - " If turn 2 (q_3q_4q_5) equals '111', assign a large penalty.\n", - " Inputs:\n", - " 1. len_seq: the number nodes to consider.\n", - " 2. num_dim: the number of dimensions (which is 3 in this sample).\n", - " 3. lambda_3: the penalty weight for this constraint.\n", - " Outputs:\n", - " 1. 
List of term objects.\n", - " '''\n", - "\n", - " terms = []\n", - " for k in range(0,len_seq):\n", - " offset = k*num_dim \n", - " terms += [Term(c=1*lambda_3,indices=[0+offset,1+offset,2+offset])]\n", - " return terms\n", - "\n", - "\n", - "##### ----- Test the function and print output: \n", - "term_000 = penalize_000(len_seq, num_dim, lambda_2) \n", - "term_111 = penalize_111(len_seq, num_dim, lambda_3) \n", - "print('Term dictionary penalty constraint for 000:', term_000, '\\n')\n", - "print('Term dictionary penalty constraint for 111:', term_111, '\\n')\n", - "print('Function for penality 000: ')\n", - "print_function(term_000)\n", - "print('Function for penality 111: ')\n", - "print_function(term_111)" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# Part 7. Parsing and validating the solution\n", - "\n", - "We've finished defining the optimization function. The next step is to start looking at how we're going to submit it to the solvers and analyze the returned results. \n", - "First let's look at how to parse, validate, and visualize the results, since that will make tuning the solvers easier!\n", - "\n", - "Below you can find the function definition that reads the solution and validates it. The solution dictionary is first read out to the optimiation variable string that describes the path. Afterward, the substrings that represent the directions are translated to linguistic terms, such that the solution can be printed in a human-readable format. Based on these two steps, the validation process checks if any constraints are violated. If constraints are violated warnings will be shown in the output with some tuning suggestions.\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "def read_validate_solution(solution: dict, num_turns: int, num_dim: int):\n", - " \n", - " '''\n", - " Purpose:\n", - " To validate the solution returned by the solver. 
Make it readable, and analyze if it makes sense.\n", - " Inputs:\n", - " 1. solution: The solution results dictionary which is returned by the solver (results[\"configuration\"]).\n", - " 2. num_turns: The number of turns for the simulation.\n", - " 3. num_dim: The number of dimensions, which is 3 for this sample (3D).\n", - " Outputs:\n", - " 1. valid: A boolean variable that specifies the validity of the solution.\n", - " 2. pos_dit: Layered position dictionary that contains all of the nodes' locations per turn {turn: {x: x_pos, y:y_pos, z:z_pos}}.\n", - " 3. dir_dict: Dictionary containing the linguistic interpretation of the 6 directions.\n", - " 4. var_dict: Dictionary containing the spin per optimization variable.\n", - " 5. x_arr: Array of x positions.\n", - " 6. y_arr: Array of y positions.\n", - " 7. z_arr: Array of z positions. \n", - " '''\n", - "\n", - " print('\\n')\n", - " valid = True\n", - " move = ''\n", - " sol_str = ''\n", - " x_arr = [0]\n", - " y_arr = [0]\n", - " z_arr = [0]\n", - " dir_dict = {'100':'out','010':'in','001':'right','110':'left','101':'up','011':'down'}\n", - " pos_dict = {0:{\"x\":0, \"y\":0, \"z\":0}}\n", - " var_dict = {}\n", - " for key,val in solution:\n", - " if key<(num_turns*num_dim):\n", - " turn = floor(key/num_dim)+1\n", - " print(\"Turn: \"+str(turn),\"var: \"+str(key),\"spin: \"+str(val))\n", - " var_dict |= {str(key): val}\n", - " if key%3 Date: Tue, 19 Jul 2022 13:45:20 +0200 Subject: [PATCH 09/10] Delete self-avoiding-walk.py --- .../self-avoiding-path/self-avoiding-walk.py | 485 ------------------ 1 file changed, 485 deletions(-) delete mode 100644 samples/self-avoiding-path/self-avoiding-walk.py diff --git a/samples/self-avoiding-path/self-avoiding-walk.py b/samples/self-avoiding-path/self-avoiding-walk.py deleted file mode 100644 index 142e259..0000000 --- a/samples/self-avoiding-path/self-avoiding-walk.py +++ /dev/null @@ -1,485 +0,0 @@ -import time -from math import log2, floor -from azure.quantum import 
Workspace -from azure.quantum.optimization import Problem, ProblemType, Term, ParallelTempering, Tabu, SimulatedAnnealing -from azure.identity import ClientSecretCredential -from mpl_toolkits import mplot3d -import numpy as np -import matplotlib.pyplot as plt - - -workspace = Workspace( - subscription_id = , - resource_group = , - name = , - location = , - credential = ClientSecretCredential(tenant_id=, - client_id=, - client_secret=) -) - -def direction_variables(direction: str, offset: int, sign_dir: int, sign_pos: int, lambda_: int) -> list: - - ''' - Purpose: - Translates the direction (+x,-x,+y,-y,+z,-z) of turn 'i' as a function of three q's. (Three optimization variables because of the defined coordinate system). - Example: - Direction "+z" in the first turn (turn = 1) is translated to: q_{0+offset}q_{2+offset}-q_{0+offset}q_{1+offset}q_{2+offset}. - Inputs: - 1. direction: A direction from an x-y-z coordinate system, one of the following: ('+x','-x','+y','-y','+z','-z'). - 2. offset: Offset gives the turn number expressed in the first q of that turn. - Example: Turn 1 starts with q_0, offset=0. Turn 2 starts with q_3, offset = 3. - 3. sign_dir: Changes the sign of the weights corresponding to negative directions "-x", "-y", "-z" -> necessary for finding the positions, for exmaple (+x) "-" (-x). - 4. sign_pos: Changes the sign of the weights corresponding to negative positions "-(x,y,z)" -> necessary for finding the distances between node "i" and node "j". - 5. lambda_: The weight term associated with a constraint. - Output: - 1. A list of term objects. 
- ''' - - terms = [] - if direction == "+x": - term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset]) - term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset]) - term_2 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset]) - term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) - terms = [term_0, term_1, term_2, term_3] - elif direction == "-x": - term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset]) - term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset]) - term_2 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset]) - term_3 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) - terms = [term_0, term_1, term_2, term_3] - elif direction == "+y": - term_0 = Term(c= 1*sign_pos*lambda_, indices=[2+offset]) - term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset]) - term_2 = Term(c=-1*sign_pos*lambda_, indices=[1+offset, 2+offset]) - term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) - terms = [term_0, term_1, term_2, term_3] - elif direction == "-y": - term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset]) - term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) - terms = [term_0, term_1] - elif direction == "+z": - term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 2+offset]) - term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) - terms = [term_0, term_1] - elif direction == "-z": - term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset]) - term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) - terms = [term_0, term_1] - return terms - -def print_cost_function(terms: list): - - ''' - Purpose: - Takes a list of terms and prints it out as a (mathematical) cost function. - Example: - {'c': 1, 'ids': [0, 10, 11, 12]} ---> 1q_0q_10q_11q_12 - Inputs: - 1. terms: the list of terms. 
- ''' - - final_string = '' - final_string = '' - for term in terms: - term = term.to_dict() - weight = term['c'] - ids = term['ids'] - string = '(' - if weight >= 0: - string = '+' + '('+str(weight) - if weight < 0: - string = '-' + '(' + str(abs(weight)) - for id_ in ids: - string = string + f'q_{id_}' - string = string + ')' - final_string = final_string + string - print('[' + final_string + ']') - - -def generate_slack_coefficients(turn_diff: int): - - ''' - Purpose: - Calculates the number of slack variables and their weights. - Example: - For the constraint: x1 + x2 + x3 + x4 <= 4 which is converted to x1 + x2 + x3 + x4 + s1 + s2 +2*s3 = 4, - with 's' being slack variables. This function computes the weights of these slack variables ([1,1,2] for the example). - Input: - 1. turn_diff: the differences in turns (end_turn - start_turn). - Output: - 1. y: the weights of the slack variables. - ''' - - dist_diff = (turn_diff**2)-1 - if dist_diff == 0: - y = [] - elif dist_diff > 0: - M = floor(log2(dist_diff)) - y = [2**n for n in range(M)] - y.append(dist_diff + 1 - 2**M) - return y - - -def simplify_every_iter_function(term_list: list[Term], ref_term:Term) -> list[Term]: - terms = [] - same_ids_list = [] - diff_ids_list = [] - if term_list: - for term_in_list in term_list: - if sorted(ref_term.ids) == sorted(term_in_list.ids): - same_ids_list += [term_in_list] - else: - diff_ids_list += [term_in_list] - if same_ids_list: - new_weight = ref_term.c - ids = sorted(ref_term.ids) - for same_ids_term in same_ids_list: - new_weight += same_ids_term.c - terms += [Term(c=new_weight, indices=ids)] - else: - terms += [ref_term] - if diff_ids_list: - terms += diff_ids_list - return terms - - -def diff_in_pos(start_turn: int, end_turn: int, num_dim: int, lamda_: int): - - ''' - Purpose: - Expresses the difference in position (x,y,z) between two turns as a function of the encoding of the directions. 
- In other words, expresses the difference in the position after the start_turn and position after the end_turn. - Example: - Difference between turn 0 (no turns yet, initial position = (0,0,0)) and turn 2: - x(2) = [ move(+x, turn 1) - move(-x, turn 1) ] + [ move(+x, turn 2) - move(-x, turn 2) ] - Note: only one 'move' per turn gets activated as they are represented by the same q's (ex. turn 1 is represented by q_0, q_1, and q_2). - Inputs: - 1. start_turn: the initial (reference) turn. - 2. end_turn: the final (target) turn. - 3. num_dim: the number of dimensions (3, x-y-z coordinate system). - Outputs: - 1. The difference in the x direction. - 2. The difference in the y direction. - 3. The difference in the z direction. - ''' - - x_diff = y_diff = z_diff = [] - if start_turn < end_turn and start_turn >= 0 and end_turn >= 1: - for turn in range(start_turn,end_turn+1): - x_diff += direction_variables("+x",(turn-1)*num_dim,1,1,lamda_)+direction_variables("-x",(turn-1)*num_dim,-1,1,lamda_) - y_diff += direction_variables("+y",(turn-1)*num_dim,1,1,lamda_)+direction_variables("-y",(turn-1)*num_dim,-1,1,lamda_) - z_diff += direction_variables("+z",(turn-1)*num_dim,1,1,lamda_)+direction_variables("-z",(turn-1)*num_dim,-1,1,lamda_) - return x_diff, y_diff, z_diff - -def cross_multiply(list_a: list[Term], list_b: list[Term]) -> list: - - ''' - Purpose: Cross multiplies two lists of terms (linear ex. [q_0 + q_1] or non-linear ex. [q_0q_1]) to return the expansion. - Can compute powers of groups this way (^2, ^3,...), like squaring a list of terms. - Calculates the expansion locally, unlike the SlcTerm class. - Example: (2q_0q_1+3q_2q_3)^2 => (2q_0q_1)^2 + 12q_0q_1q_2q_3 + (3q_2q_3)^2 - Input: - 1. list_a: list which serves as the reference list (first 'for' loop). - 2. list_b: list which serves as the target list (second 'for' loop). - Output: - 1. list of term objects. 
- ''' - - terms = [] - for one in list_a: - for uno in list_b: - weight = one.c * uno.c - ids = one.ids + uno.ids - new_term = Term(c = weight, indices = ids) - terms += [new_term] - #terms = simplify_function(terms, new_term) - return terms - -def distance_constraint(num_turns: int, num_dim: int, lambda_0: int) -> list: - - ''' - Purpose: - Build the distance contraint based on previosly defined functions. - Constraint: Distance squared between i and j must be larger or equal to 1. - Constraint: L_{i,j}^2 >= 1 => L_{i,j}^2 = 1+q_{slacker} (converting the inequality constraint to an equality constraint.) - Example/Explanation: - L{1,2}^2 = (x1-x2)^2 + (y1-y2)^2 + (z1-z2)^2 - x1 = [move(+x1)-move(-x1)] - x2 = [move(+x1)-move(-x1)] + [move(+x2)-move(-x2)] - < same for other dimensions > - < fill into first line > - L{1,2}^2 = [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2 - [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2 - q_{slacker} = 0 ---> expressed in q's == cost function - Inputs: - 1. num_turns: the number of turns. - 2. num_dum: the number of dimensions. - 3. lambda_0: the constraint weight for the distance constraint. - Output: - 1. List of term objects describing the distance constraint. - ''' - - terms = [] - slack_indexer = 0 - for start_turn in range(1,num_turns+1): - for end_turn in range(start_turn+1,num_turns+2): - # Calculate the differences in positions for each dimension. - x_diff_i_j, y_diff_i_j, z_diff_i_j = diff_in_pos(start_turn, end_turn, num_dim, lambda_0) - # Compute the squared distance (Pythagorean theorem) by calculating the squared expansion. - x_diff_i_j_2, y_diff_i_j_2, z_diff_i_j_2 = cross_multiply(x_diff_i_j,x_diff_i_j), cross_multiply(y_diff_i_j,y_diff_i_j), cross_multiply(z_diff_i_j,z_diff_i_j) - # Add slack variables due to inequality constraint. 
- slack_var_terms = [] - slack_coefficients = generate_slack_coefficients(end_turn-start_turn) - for s in range(0,len(slack_coefficients)): - slack_var_terms += [Term(c=-slack_coefficients[s], indices=[num_turns*num_dim+slack_indexer+s])] - - terms += x_diff_i_j_2 + y_diff_i_j_2 + z_diff_i_j_2 + slack_var_terms - slack_indexer+=len(slack_coefficients) - return terms - -def penalize_000(len_seq: int, num_dim: int, lambda_2: int) -> list: - - ''' - Purpose: - Build the constraint that penalizes the invalid moves associated with the substring: '000'. - The constraint needs to be defined over the set of all turns, as defined by the 'for' loop. - Example: - If turn 2 (q_3q_4q_5) equals '000', assign a large penalty. - Inputs: - 1. len_seq: the number nodes to consider. - 2. num_dim: the number of dimensions (which is 3). - 3. lambda_2: the penalty weight for this constraint. - Outputs: - 1. List of term objects. - ''' - - terms = [] - for k in range(0,len_seq): - offset = k*num_dim - term_0 = Term(c=-1*lambda_2,indices=[0+offset]) - term_1 = Term(c=-1*lambda_2,indices=[1+offset]) - term_2 = Term(c=-1*lambda_2,indices=[2+offset]) - term_3 = Term(c= 1*lambda_2,indices=[0+offset,1+offset]) - term_4 = Term(c= 1*lambda_2,indices=[0+offset,2+offset]) - term_5 = Term(c= 1*lambda_2,indices=[1+offset,2+offset]) - term_6 = Term(c=-1*lambda_2,indices=[0+offset,1+offset,2+offset]) - terms += [term_0, term_1, term_2, term_3, term_4, term_5, term_6] - return terms - -def penalize_111(len_seq: int, num_dim: int, lambda_3: int) -> list: - - ''' - Purpose: - Build the constraint that penalizes the invalid moves associated with the substring: '111'. - The constraint needs to be defined over the set of all turns, as defined by the 'for' loop. - Example: - If turn 2 (q_3q_4q_5) equals '111', assign a large penalty. - Inputs: - 1. len_seq: the number nodes to consider. - 2. num_dim: the number of dimensions (which is 3 in this sample). - 3. lambda_3: the penalty weight for this constraint. 
- Outputs: - 1. List of term objects. - ''' - - terms = [] - for k in range(0,len_seq): - offset = k*num_dim - terms += [Term(c=1*lambda_3,indices=[0+offset,1+offset,2+offset])] - return terms - -def no_return_constraint(num_turns: int, num_dim: int, lamda_4: int)-> list: - - ''' - Purpose: - Build the constraint that penalizes going back to the same position/node two turns later. - Example: - Node A ---> ---> Node B ---> ---> Node A => erroneous as we've been there already. - Two sequential moves may not be in the same dimension and in opposite directions: (+x then -x), (-x then +x), (+y then -y) etc. - Inputs: - 1. num_turns: the number of turns. - 2. num_dim : the number of dimensions, which is 3 for this sample. - 3. lambda_4 : the penalty weight for this constraint. - Outputs: - 1. List of term objects. - ''' - - terms = [] - for i in range(0,num_turns): - x_out_in = cross_multiply(direction_variables("+x",i*num_dim,1,1,lamda_4), direction_variables("-x",(i+1)*num_dim,1,1,lamda_4)) - x_in_out = cross_multiply(direction_variables("-x",i*num_dim,1,1,lamda_4), direction_variables("+x",(i+1)*num_dim,1,1,lamda_4)) - y_right_left = cross_multiply(direction_variables("+y",i*num_dim,1,1,lamda_4), direction_variables("-y",(i+1)*num_dim,1,1,lamda_4)) - y_left_right = cross_multiply(direction_variables("-y",i*num_dim,1,1,lamda_4), direction_variables("+y",(i+1)*num_dim,1,1,lamda_4)) - z_up_down = cross_multiply(direction_variables("+z",i*num_dim,1,1,lamda_4), direction_variables("-z",(i+1)*num_dim,1,1,lamda_4)) - z_down_up = cross_multiply(direction_variables("-z",i*num_dim,1,1,lamda_4), direction_variables("+z",(i+1)*num_dim,1,1,lamda_4)) - terms += x_out_in + x_in_out + y_right_left + y_left_right + z_up_down + z_down_up - return terms - - - -def read_validate_solution(solution: dict, num_turns: int, num_dim: int): - - ''' - Purpose: - To validate the solution returned by the solver. Make it readable, and analyze if it makes sense. - Inputs: - 1. 
solution: The solution results dictionary which is returned by the solver (results["configuration"]). - 2. num_turns: The number of turns for the simulation. - 3. num_dim: The number of dimensions, which is 3 for this sample (3D). - Outputs: - 1. valid: A boolean variable that specifies the validity of the solution. - 2. pos_dit: Layered position dictionary that contains all of the nodes' locations per turn {turn: {x: x_pos, y:y_pos, z:z_pos}}. - 3. dir_dict: Dictionary containing the linguistic interpretation of the 3-substring directions. - 4. var_dict: Dictionary containing the spin per optimized variable - 5. x_arr: Array of x positions. - 6. y_arr: Array of y positions. - 7. z_arr: Array of z positions. - ''' - - print('\n') - valid = True - move = '' - sol_str = '' - x_arr = [0] - y_arr = [0] - z_arr = [0] - dir_dict = {'100':'out','010':'in','001':'right','110':'left','101':'up','011':'down'} - pos_dict = {0:{"x":0, "y":0, "z":0}} - var_dict = {} - for key,val in solution: - if key<(num_turns*num_dim): - turn = floor(key/num_dim)+1 - print("Turn: "+str(turn),"var: "+str(key),"spin: "+str(val)) - var_dict |= {str(key): val} - if key%3 Date: Tue, 19 Jul 2022 13:46:24 +0200 Subject: [PATCH 10/10] Add files via upload --- .../self-avoiding-path.html | 15645 ++++++++++++++++ .../self-avoiding-path.ipynb | 1086 ++ .../self-avoiding-path/self-avoiding-path.py | 485 + 3 files changed, 17216 insertions(+) create mode 100644 samples/self-avoiding-path/self-avoiding-path.html create mode 100644 samples/self-avoiding-path/self-avoiding-path.ipynb create mode 100644 samples/self-avoiding-path/self-avoiding-path.py diff --git a/samples/self-avoiding-path/self-avoiding-path.html b/samples/self-avoiding-path/self-avoiding-path.html new file mode 100644 index 0000000..5b3d7e4 --- /dev/null +++ b/samples/self-avoiding-path/self-avoiding-path.html @@ -0,0 +1,15645 @@ + + + + + +self-avoiding-walk + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + diff --git a/samples/self-avoiding-path/self-avoiding-path.ipynb b/samples/self-avoiding-path/self-avoiding-path.ipynb new file mode 100644 index 0000000..16d9bac --- /dev/null +++ b/samples/self-avoiding-path/self-avoiding-path.ipynb @@ -0,0 +1,1086 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Self Avoiding Path with Azure Quantum Inspired Optimization\n", + "\n", + "In this notebook we'll cover how to formulate an optimization problem to find a path through a 3D lattice that does not cross itself (self-avoiding walk/path). The optimization problem is solved with the Azure Quantum service which contains numerous heuristic (non-linear) optimization solvers. Finding a self-avoiding path in a 3D lattice can be considered a difficult problem, in the sense that it suffers from exponential scaling conditioned on the number of turns and the number of dimensions (2D vs 3D, etc.). \n", + "\n", + "In this notebook, a step by step approach is taken to explain the function definitions that are necessary to create the optimization problem.\n", + "\n", + "Goal: To find a path in a 3D lattice that does not cross itself.\n", + "\n", + "To clarify some vocab and assumptions used in the notebook:\n", + "1. The number of dimensions is 3 (3D), meaning the path can be represented in a $x$-$y$-$z$ plane.\n", + "2. The position represents the location in the x-y-z plane, thus given by ($x$,$y$,$z$).\n", + "3. A direction describes the orientation within the x-y-z plane, thus in {$+x$,$-x$,$+y$,$-y$,$+z$,$-z$}.\n", + "4. \"Turns\" are equivalent to \"steps\". After each turn a new position is acquired that must be unique (not visited before). \n", + "5. The total number of turns is equivalent to the number of positions that need to be visited minus one ($N-1$). \n", + "6. 
The decision variables for the optimization function are denoted by \"q\" because \"x\" is already associated with a direction, and are referred to as \"optimization variables\".\n", + "\n", + "Note: Because the number of terms for this optimization problem grows explosively with the number of turns, you might want to try running this in the Azure Quantum notebooks. The more technical reason for this is that expansions of nonlinear terms have to be computed locally, resulting in a massive number of terms needing to be uploaded. Unless you are very patient, a recommendation would be to either check out the online notebook experience or rewrite this notebook's problem class to its streaming counterpart (https://docs.microsoft.com/en-us/azure/quantum/optimization-streaming-problem). \n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Import the necessary dependencies for the notebook" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import time\n", + "from math import floor, log2\n", + "from azure.quantum import Workspace\n", + "from azure.quantum.optimization import Problem, ProblemType, Term, ParallelTempering, Tabu, SimulatedAnnealing\n", + "from azure.identity import ClientSecretCredential\n", + "from mpl_toolkits import mplot3d\n", + "import numpy as np\n", + "import matplotlib.pyplot as plt" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Connect to your Azure Quantum workspace\n", + "\n", + "To run the sample, you'll need to have a quantum workspace. Check out this module if you don't have one yet: https://docs.microsoft.com/en-us/learn/modules/get-started-azure-quantum/.\n", + "Fill in the variables below." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "workspace = Workspace(\n", + " subscription_id = \"\",\n", + " resource_group = \"\",\n", + " name = \"\",\n", + " location = \"\",\n", + " credential = ClientSecretCredential(tenant_id=\"\",\n", + " client_id=\"\",\n", + " client_secret=\"\")\n", + ")\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Print readable cost functions\n", + "\n", + "Throughout the notebook you'll probably realize that printing the \"terms\" isn't going to provide much help, mainly because there will be too many of them and their dictionary format. A term is the way a mathematical term is expressed in terms of a dictionary for the SDK (see examples). Below a function is defined that prints the term(s) dictionaries that describe the constraint/cost function in terms of \"q\" optimization variables. You can call the function to check if the working is correct, or if you're unsure of what a constraint looks like. Note that for a large problem it nevertheless becomes difficult to understand the entire function output because of the number of terms.\n", + "\n", + "An example:\n", + "{'c': 1, 'ids': [0, 10, 11, 12]} ---> $1q_0q_{10}q_{11}q_{12}$\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def print_function(terms: list):\n", + "\n", + " '''\n", + " Purpose:\n", + " Takes a list of terms and prints it out as a mathematical (cost/constraint) function.\n", + " Example:\n", + " {'c': 1, 'ids': [0, 10, 11, 12]} ---> 1q_0q_10q_11q_12\n", + " Inputs:\n", + " 1. 
terms: the list of terms.\n", + " '''\n", + " \n", + " k = 0\n", + " final_string = ''\n", + " final_string = ''\n", + " for term in terms:\n", + " term = term.to_dict()\n", + " weight = term['c']\n", + " ids = term['ids']\n", + " string = '('\n", + " if weight >= 0:\n", + " if k == 0: \n", + " string = '('+str(weight)\n", + " else:\n", + " string = '+' + '('+str(weight)\n", + " if weight < 0:\n", + " if k == 0:\n", + " string = '(' + str(abs(weight))\n", + " else: \n", + " string = '-' + '(' + str(abs(weight))\n", + " for id_ in ids:\n", + " string = string + f'q_{id_}'\n", + " string = string + ')'\n", + " final_string = final_string + string\n", + " k += 1\n", + "\n", + " print('[ ' + final_string + ' ]')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Expansion of two term lists\n", + "\n", + "Throughout the notebook we will need to cross-multiply nonlinear terms, for computing squares for example. The function below performs the expansion. An important note to keep in mind here, especially if you're looking to optimize the code, is that the function does not assemble identical terms. Since the cost functions dealt with in this notebook are still rather small, reducing the number of terms was left out of the scope. \n", + "\n", + "More clearly stated in terms of equations:\n", + "\n", + "$$ \\text{Current function (see below): } \\hspace{0.2cm} (a+b)^2 = a^2 + ab + ab + b^2 $$\n", + "$$ \\text{Optimal function: } \\hspace{0.2cm} (a+b)^2 = a^2 + 2ab + b^2 $$\n", + "\n", + "Should be a fun programming exercise to reduce the number of terms significantly!" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def cross_multiply(list_a: list, list_b: list) -> list:\n", + "\n", + " '''\n", + " Purpose: Cross multiplies two lists of terms (linear ex. [q_0 + q_1] or non-linear ex. 
[q_0q_1]) to return the expansion.\n", + " Can compute powers of groups this way (^2, ^3,...), like squaring a list of terms.\n", + " Calculates the expansion locally, unlike the SlcTerm class.\n", + " Example: (2q_0q_1+3q_2q_3)^2 => (2q_0q_1)^2 + 6q_0q_1q_2q_3 + 6q_0q_1q_2q_3 + (3q_2q_3)^2\n", + " Input:\n", + " 1. list_a: list which serves as the reference list (first 'for' loop).\n", + " 2. list_b: list which serves as the target list (second 'for' loop).\n", + " Output:\n", + " 1. list of term objects.\n", + " '''\n", + "\n", + " terms = []\n", + " for one in list_a:\n", + " for uno in list_b:\n", + " alpha = one.to_dict()\n", + " beta = uno.to_dict()\n", + " weight = int(alpha['c'])*int(beta['c'])\n", + " ids = list(alpha['ids'])+list(beta['ids'])\n", + " terms += [Term(c = weight, indices = ids)] \n", + " return terms\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Parameters for running through the notebook\n", + "\n", + "While running through the notebook you might want to execute and print some of the constraint functions. To do that, you'll need some variables to be defined. Only 3 turns are considered with the defined parameters below, as that will keep the function outputs small and understandable!" 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "nodes = \"ABCD\" # The four position/node names.\n", + "len_seq = len(nodes) # The number of nodes in the sequence.\n", + "num_turns = len(nodes)-1 # The number of turns, which is one less than the number of nodes.\n", + "num_dim = 3 # Number of optimization variables required to describe a turn\n", + "lambda_0 = 1 # Penalty weight for the 'distance constraint'\n", + "lambda_1 = 40 # Penalty weight for the 'no return constraint'\n", + "lambda_2 = 25 # Penalty weight for the invalid direction '000' constraint\n", + "lambda_3 = 25 # Penalty weight for the invalid direction '111' constraint" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 1. Encoding the directions \n", + "\n", + "Prior to starting to define our cost function, we have to construct some basic functions and agree on some definitions. In this part, we'll define the 6 directions of the x-y-z plane in terms of the optimization variables (\"q\"). \n", + "\n", + "A common way to encode a turn based optimization problem is through a direction-based string, in which each optimization variable substring (ex. $q_0q_1q_2$) denotes some kind of decision of which direction was taken. For example, take a car that can only move backward or forward. The decision of the driver at some time $t$ can be described as $q_t \\in \\{0, 1\\}$, where 0 represents going backward and 1 forward, respectively. Over multiple time steps, say 3, one can then describe the movement of the car by:\n", + "\n", + "$$ \\text{Movements:} \\hspace{0.25cm} q_0q_1q_2 $$\n", + "\n", + "The sequence of movements, \"forward, backward, backward\", can then be represented as:\n", + "\n", + "$$ \\text{Sequence of movements:} \\hspace{0.25cm} q_0q_1q_2 = 100$$\n", + "\n", + "Alright, if that is clear to you, then the next step is to represent the 6 directions of the x-y-z plane in such a fashion. 
Regrettably, a \"q\" can only be either 0 or 1, not 2, 3, 4, 5 to represent the six directions. But what can be done is to use multiple optimization variables to describe a direction! For example:\n", + "\n", + "$$ \\text{Sequence of movements:} \\hspace{0.25cm} q_0q_1q_2q_3q_4q_5q_6q_7q_8 $$\n", + "$$ \\text{First move:} \\hspace{0.25cm} q_0q_1q_2 $$\n", + "$$ \\text{Second move:} \\hspace{0.25cm} q_3q_4q_5 $$\n", + "$$ \\text{Third move:} \\hspace{0.25cm} q_6q_7q_8 $$\n", + "\n", + "Because we need to encode 6 directions, we need at least 3 optimization variables to form unique substrings. The table explains this: we need enough possible combinations to encode the 6 directions:\n", + "\n", + "
\n", + "\n", + "| Opt. var. substring | Combinations | \n", + "| ----------------------------- | -------------------------- |\n", + "| $q_0 \\cdot q_1$ | $2\\cdot 2 = 4 < 6$ |\n", + "| $q_0 \\cdot q_1 \\cdot q_2$ | $2\\cdot 2\\cdot 2 = 8 > 6$ |\n", + "\n", + "
\n", + "\n", + "Note, for later, you should keep in mind that 2 of the 8 combinations become irrelevant. It is important that the solver does not return those strings!\n", + "\n", + "Perfect! Now we just need to assign each direction a unique substring. Below you can find my choices, feel free to change these if you're starting from scratch.\n", + "\n", + "
\n", + "\n", + "| Direction | Opt. var. substring | \n", + "| --------- | ----------------- |\n", + "| +x | 100 |\n", + "| -x | 010 |\n", + "| +y | 001 |\n", + "| -y | 110 |\n", + "| +z | 101 |\n", + "| -z | 011 |\n", + "| N/A | 000 |\n", + "| N/A | 111 |\n", + "\n", + "
\n", + "\n", + "Now we just need to define direction variables. These are as defined in the above table. These variables should take a value 1 if a movement is made in that direction, while the other directions must all be zero. This can be achieved by the following scheme, where $k$ denotes the turn, and $\\gamma = 3(k-1)$ (3 because 3 dimensions):\n", + "\n", + "
\n", + "\n", + "| Direction | Opt. var. substring | Formula | \n", + "| ------------- | ---------------- | -------------------------------------------------- |\n", + "| $d_{+x}^{k}$ | 100 | $ q_{0+\\gamma} (1-q_{1+\\gamma}) (1-q_{2+\\gamma})$ |\n", + "| $d_{-x}^{k}$ | 010 | $ (1-q_{0+\\gamma}) q_{1+\\gamma} (1-q_{2+\\gamma})$ |\n", + "| $d_{+y}^{k}$ | 001 | $ (1-q_{0+\\gamma}) (1-q_{1+\\gamma}) q_{2+\\gamma}$ | \n", + "| $d_{-y}^{k}$ | 110 | $ q_{0+\\gamma} q_{1+\\gamma} (1-q_{2+\\gamma}) $ |\n", + "| $d_{+z}^{k}$ | 101 | $ q_{0+\\gamma} (1-q_{1+\\gamma}) q_{2+\\gamma} $ |\n", + "| $d_{-z}^{k}$ | 011 | $ (1-q_{0+\\gamma}) q_{1+\\gamma} q_{2+\\gamma} $ |\n", + "\n", + "
\n", + "\n", + "To clarify a bit further through an example:\n", + "If in the first turn (k=0) the solver returns $q_0=1$, $q_1=0$, $q_2=0$, and in the second turn (k=1) returns $q_3=0$, $q_4=0$, $q_5=1$, then a \"+x and +y\" were taken, respecively.\n", + "\n", + "These direction variables will help understand some difficult constraints later on. Defining these direction variables additionally makes the code much more readable, since we can define everything in terms of the direction variables instead of the individual optimization variables.\n", + "\n", + "Below you can find the function for the direction variables. The formulas have been expanded (mathematically) to easily declare them in a number of terms, however it is hard-coded this way. Some inputs to the function (\"sign_dir\", \"sign_pos\", \"lambda_\") are relevant for building constraints later in the notebook, but have to defined in this function. Further information can be found in the function docstring. \n", + " " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def direction_variables(direction: str, offset: int, sign_dir: int, sign_pos: int, lambda_: int) -> list:\n", + "\n", + " '''\n", + " Purpose:\n", + " Translates the direction (+x,-x,+y,-y,+z,-z) of turn 'i' as a function of three optimization variables. (Three q's because of the defined coordinate system).\n", + " Example:\n", + " Direction \"+z\" in the first turn (turn = 1) is translated to: q_{0+offset}q_{2+offset}-q_{0+offset}q_{1+offset}q_{2+offset}.\n", + " Inputs:\n", + " 1. direction: A direction from an x-y-z coordinate system, one of the following: ('+x','-x','+y','-y','+z','-z').\n", + " 2. offset: Offset gives the turn number expressed in the first \"q\" of that turn. Equal to gamma in the explanation.\n", + " Example: Turn 1 starts with \"q\" q_0, offset=0. Turn 2 starts with q_3, offset = 3.\n", + " 3. 
sign_dir: Changes the sign of the weights corresponding to negative directions \"-x\", \"-y\", \"-z\" -> necessary for finding the positions, for exmaple (+x) \"-\" (-x).\n", + " 4. sign_pos: Changes the sign of the weights corresponding to negative positions \"-(x,y,z)\" -> necessary for finding the distances between node \"i\" and node \"j\".\n", + " 5. lambda_: The weight term associated with a constraint.\n", + " Output:\n", + " 1. A list of term objects.\n", + " '''\n", + "\n", + " terms = []\n", + " if direction == \"+x\":\n", + " term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset])\n", + " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", + " term_2 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", + " term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1, term_2, term_3]\n", + " elif direction == \"-x\":\n", + " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset])\n", + " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", + " term_2 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", + " term_3 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1, term_2, term_3]\n", + " elif direction == \"+y\":\n", + " term_0 = Term(c= 1*sign_pos*lambda_, indices=[2+offset])\n", + " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", + " term_2 = Term(c=-1*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", + " term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1, term_2, term_3]\n", + " elif direction == \"-y\":\n", + " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset])\n", + " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1]\n", + " elif direction == \"+z\":\n", + " term_0 = Term(c= 
1*sign_pos*lambda_, indices=[0+offset, 2+offset])\n", + " term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1]\n", + " elif direction == \"-z\":\n", + " term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset])\n", + " term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset])\n", + " terms = [term_0, term_1]\n", + " return terms\n", + "\n", + "\n", + "##### ----- Test the function and print output:\n", + "turn = 1 # play with this value! \n", + "dir_var = direction_variables(\"+x\",(turn-1)*num_dim,1,1,lambda_0) \n", + "print('dir_var term dictionary \"+x\": ', dir_var)\n", + "print_function(dir_var)\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 2. Finding the difference in positions\n", + "\n", + "Great that we have the directions defined! Now let's use them and define a function that calculates the difference in positions, which we will need later. After each turn, a direction that appends to the path. A valid path is defined as a one that does not cross itself, meaning that we need to compare the positions over the turns. In other words, every new position appended to the path needs to be checked with all previously held positions, to verify that a position hasn't been visited twice. \n", + "\n", + "So how do we go about this?\n", + "\n", + "First we need a way to know the positions after choosing to go in a certain direction, so let's tackle that first. Consider the fact that the directions are recorded for each turn, which already gives some sort of log of the positions in the path. By summing the direction variables respective to their dimension (x/y/z) acoomplishes this, but only if a negative move can compensate a positive one. 
For example, after two turns the $x$-location can be expressed as:\n", + "\n", + "$$ x_2 = ( d^{1}_{+x} - d^{1}_{-x} ) + ( d^{2}_{+x} - d^{2}_{-x} )$$\n", + "\n", + "**_NOTE:_** In the above function (\"direction_variables\"), the negative sign for the negative direction variables is controlled through \"sign_dir\". \"sign_dir\" must be set to -1 to assign a negative sign to it as required in these position formulas!\n", + "\n", + "\n", + "Remember that for a turn only one direction variable can be set to 1! Thus if two moves in the $-x$ direction are taken, then:\n", + "\n", + "$$ x_2 = ( d^{1}_{+x} - d^{1}_{-x} ) + ( d^{2}_{+x} - d^{2}_{-x} ) = ( 0 - 1 ) + ( 0 - 1 ) = -2 $$\n", + "\n", + "As with the simple example for the x-dimension, the same can be applied to the $y$ and $z$ directions. The formulas below describe the position after $k$ turns through a summation (for the maths/physics enthusiasts, these are integrals of the velocities to derive the positions :) ).\n", + "\n", + "$$ x_k = \\sum_{t=1}^{k} ( d^{t}_{+x} - d^{t}_{-x} ) $$\n", + "$$ y_k = \\sum_{t=1}^{k} ( d^{t}_{+y} - d^{t}_{-y} ) $$\n", + "$$ z_k = \\sum_{t=1}^{k} ( d^{t}_{+z} - d^{t}_{-z} ) $$\n", + "\n", + "Great stuff! Now we have a method to find the positions along the path. 
To find the differences in position, for example between turn 2 and turn 1, it is only necessary to apply a subtraction: \n", + "\n", + "$$ x_2 - x_1 = \\sum_{k=1}^{2} ( d^{k}_{+x} - d^{k}_{-x} ) - \\sum_{k=1}^{1} ( d^{k}_{+x} - d^{k}_{-x}) = ( d^{2}_{+x} - d^{2}_{-x} ) $$\n", + "$$ y_2 - y_1 = \\sum_{k=1}^{2} ( d^{k}_{+y} - d^{k}_{-y} ) - \\sum_{k=1}^{1} ( d^{k}_{+y} - d^{k}_{-y}) = ( d^{2}_{+y} - d^{2}_{-y} ) $$\n", + "$$ z_2 - z_1 = \\sum_{k=1}^{2} ( d^{k}_{+z} - d^{k}_{-z} ) - \\sum_{k=1}^{1} ( d^{k}_{+z} - d^{k}_{-z}) = ( d^{2}_{+z} - d^{2}_{-z} ) $$\n", + "\n", + "Generalizing this to any difference between two positions:\n", + "\n", + "$$ x_j - x_i = \\sum_{k=i}^{j} ( d^{k}_{+x} - d^{k}_{-x} ) $$\n", + "$$ y_j - y_i = \\sum_{k=i}^{j} ( d^{k}_{+y} - d^{k}_{-y} ) $$\n", + "$$ z_j - z_i = \\sum_{k=i}^{j} ( d^{k}_{+z} - d^{k}_{-z} ) $$\n", + "\n", + "Fantastic! Now on to the function code for the difference in positions. Do read the function and its docstring to understand the implementation, because it reference the previously defined function to make use of direction variables. \n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def diff_in_pos(start_turn: int, end_turn: int, num_dim: int, lamda_: int):\n", + "\n", + " '''\n", + " Purpose:\n", + " Expresses the difference in position (x,y,z) between two turns as a function of the q's encoding of the directions.\n", + " In other words, expresses the difference in the position after the start_turn and position after the end_turn.\n", + " Example:\n", + " Difference between turn 0 (no turns yet, initial position = (0,0,0)) and turn 2:\n", + " x(2) = [ move(+x, turn 1) - move(-x, turn 1) ] + [ move(+x, turn 2) - move(-x, turn 2) ]\n", + " Note: only one 'move' per turn gets activated as they are represented by the same q's (ex. turn 1 is represented by q_0, q_1, and q_2).\n", + " Inputs:\n", + " 1. 
start_turn: the initial (reference) turn.\n", + " 2. end_turn: the final (target) turn.\n", + " 3. num_dim: the number of dimensions (3, x-y-z coordinate system).\n", + " Outputs:\n", + " 1. The difference in the x direction.\n", + " 2. The difference in the y direction.\n", + " 3. The difference in the z direction. \n", + " '''\n", + "\n", + " x_diff = y_diff = z_diff = []\n", + " if start_turn < end_turn and start_turn >= 0 and end_turn >= 1:\n", + " for turn in range(start_turn,end_turn+1):\n", + " x_diff += direction_variables(\"+x\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-x\",(turn-1)*num_dim,-1,1,lamda_)\n", + " y_diff += direction_variables(\"+y\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-y\",(turn-1)*num_dim,-1,1,lamda_)\n", + " z_diff += direction_variables(\"+z\",(turn-1)*num_dim,1,1,lamda_)+direction_variables(\"-z\",(turn-1)*num_dim,-1,1,lamda_)\n", + " return x_diff, y_diff, z_diff\n", + "\n", + "\n", + "##### ----- Test the function and print output: \n", + "start_turn = 1 # play with this value! \n", + "end_turn = 2 # play with this value! \n", + "x_diff, y_diff, z_diff = diff_in_pos(start_turn, end_turn, num_dim, lambda_0)\n", + "print('Difference in x described as term list: \\n', x_diff)\n", + "print('\\nDifference in x described as mathematical function:')\n", + "print_function(x_diff)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 3. The distance constraint\n", + "\n", + "Fantastic that you've made it this far! With all the above functions defined we can start solving the problem. \n", + "\n", + "The distance constraint enforces that after each turn, the difference in positions after turns $i$ and $j$ must be larger or equal to 1 (distance between lattice points in the same dimension). 
\n", + "To visualize the scenario this constraint tries to penalize, consider a 2D example with 4 turns, starting in $(0,0)$:\n", + "\n", + "$$ \\text{Turn 1, go right: } \\hspace{0.3cm} (0,0) => (0,1) $$ \n", + "$$ \\text{Turn 2, go up: } \\hspace{0.3cm} (0,1) => (1,1) $$ \n", + "$$ \\text{Turn 3, go left: } \\hspace{0.3cm} (1,1) => (1,0) $$ \n", + "$$ \\text{Turn 4, go down: } \\hspace{0.3cm} (1,0) => (0,0) $$ \n", + "\n", + "As you can see, the last step conflicts with our constraint. It is not permitted to return to a position where we've already been, namely $(0,0)$. Turns 1-3 are all valid, since they remain a distance of at least 1 away from all other previously held positions.\n", + "\n", + "Let's define what we want mathematically. The distance between the positions after turns $i$ and $j$ must be larger than or equal to 1. For this we'll need some basic geometry, the 3D variant of the Pythagorean theorem. From the theorem, it can be understood that the hypotenuse ($C_{i,j}$) must always be larger than or equal to one, since that is what defines the distance between two points. Working this out mathematically:\n", + "\n", + "$$ C_{i,j} \\geq 1 $$\n", + "$$ \\sqrt{(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} \\geq 1 $$\n", + "\n", + "The square-root is a bit of a headache when writing out a cost function: it would require an approximation or some sort of factorization, which is not fun if you're dealing with many terms. To avoid that, we're simply going to square both sides, which in our case is fine (for maths people), since we aren't dealing with negative numbers here:\n", + "\n", + "$$ C_{i,j}^2 \\geq 1 $$\n", + "$$ {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} \\geq 1 $$\n", + "\n", + "Nice! If you're sharp, you'll start seeing where the previous functions might come in handy now. 
The function that computes the difference between the respective positions (\"diff_in_pos\") in each dimension was defined above, and the function that computes an expansion (\"cross_multiply\") was defined at the beginning of the notebook. Writing those function calls out in order:\n", + "\n", + "1. We call \"diff_in_pos\" to calculate the difference in positions for each dimension (x,y,z).\n", + "2. For each dimension, the square is calculated by calling \"cross_multiply\". \n", + "\n", + "Alright, you might be wondering how to deal with the $\\geq$, since it is necessary to have an equation that equals zero in order to integrate it into the cost function. \n", + "This is where slack variables come in. The purpose of slack variables is to convert an inequality constraint into an equality constraint. Or in other words, for this equation, we need to compensate some values (explained further below) in order to convert the equation to an equality constraint. Consider the constraint in its simplest form:\n", + "\n", + "$$ C_{i,j}^2 \\geq 1 $$\n", + "\n", + "It is clear that we would need to add some number $V_{i,j}$ on the right hand side of the equation in order to make this an equality constraint. $V_{i,j}$ can be any non-negative value and is conditioned on $i$ and $j$: \n", + "\n", + "$$ C_{i,j}^2 = 1+V_{i,j}$$\n", + "\n", + "Let's say that instead of representing a single value we want $V_{i,j}$ to represent a range of values $[0-4]$. This is where slack variables can be introduced. By introducing additional optimization variables, which have nothing to do with the path encoding, the range can be described as follows:\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+q_{s3}+q_{s4} $$\n", + "\n", + "Or more compactly:\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+2q_{s3} $$\n", + "\n", + "So any value in the range $[0-4]$ is described through these q's. You can derive 1 by assigning a single \"q\", which has weight 1, the value 1. 
Likewise, you can get the value 4 by assigning all optimization variables the value 1. \n", + "\n", + "Alright, so how do we know which range of values we need to represent? That is revealed by the turn numbers, $i$ and $j$. Over these turns, the maximum squared distance that can be achieved is when moves are only made in a single direction, the \"+x\" direction for example. The maximum distance is then equal to the number of moves squared $(j-i)^2$.\n", + "\n", + "$$ C_{i,j}^2 = (j-i)^2 $$\n", + "\n", + "Then writing out the maths gives us the necessary upper bound for the range that the optimization variables need to represent, where $S$ stands for the number of slack variables necessary:\n", + "\n", + "$$ \\text{Upper bound: } \\hspace{0.5cm} C_{i,j}^2 = (j-i)^2 = 1 + \\sum_{s=0}^{S}q_s$$\n", + "$$ \\text{Upper bound: } \\hspace{0.5cm} \\sum_{s=0}^{S}q_s = (j-i)^2 - 1 $$\n", + "\n", + "For the lower bound of the range, the value is 0. The reason for that is we want to be able to represent any number equal to or larger than 1 for the inequality constraint through the addition of the slack variables. Concluding, the range the q's must represent is $[0,((j-i)^2-1)]$. More on how to calculate the number of slack variables necessary to define this range later, as you don't need ((j-i)^2-1) optimization variables!\n", + "\n", + "\n", + "Piecing all the parts together we find the following equation for a $i$-$j$ combination:\n", + "\n", + "$$ {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} = 1 + \\sum_{s=0}^{S}q_s $$ \n", + "\n", + "Because constants are irrelevant for the optimization landscape the value 1 can be neglected. The reason being that constants only introduce linear offsets, thus impacting the entire optimization equally. 
The distance constraint which needs to account for all $i$-$j$ combinations, where $j$>$i$ and $N-1$ the number of turns, is summarized as follows:\n", + "\n", + "$$ \\sum_{i=1}^{N-1} \\sum_{j>i}^{N-1} \\lambda_0 ( {(x_{j} - x_{i})^2 + (y_{j} - y_{i})^2 + (z_{j} - z_{i})^2} - \\sum_{s=0}^{S}q_s ) $$ \n", + "\n", + "The function that builds this constraint is presented below. Read the docstring for how it works.\n", + "`Note, to run this function you'll need to run the next function cell to define 'generate_slack_coefficients'.` \n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def distance_constraint(num_turns: int, num_dim: int, lambda_0: int) -> list:\n", + "\n", + " '''\n", + " Purpose:\n", + " Build the distance contraint based on previosly defined functions.\n", + " Constraint: Distance squared between i and j must be larger or equal to 1.\n", + " Constraint: L_{i,j}^2 >= 1 => L_{i,j}^2 = 1+q_{slacker} (converting the inequality constraint to an equality constraint.)\n", + " Example/Explanation:\n", + " L{1,2}^2 = (x1-x2)^2 + (y1-y2)^2 + (z1-z2)^2\n", + " x1 = [move(+x1)-move(-x1)]\n", + " x2 = [move(+x1)-move(-x1)] + [move(+x2)-move(-x2)]\n", + " \n", + " \n", + " L{1,2}^2 = [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2\n", + " [move(+x2)-move(-x2)]^2 + [move(+y2)-move(-y2)]^2 + [move(+z2)-move(-z2)]^2 - q_{slacker} = 0 ---> expressed in q's == cost function\n", + " Inputs:\n", + " 1. num_turns: the number of turns.\n", + " 2. num_dum: the number of dimensions.\n", + " 3. lambda_0: the constraint weight for the distance constraint.\n", + " Output:\n", + " 1. List of term objects describing the distance constraint.\n", + " '''\n", + "\n", + " terms = []\n", + " slack_indexer = 0\n", + " for start_turn in range(1,num_turns+1):\n", + " for end_turn in range(start_turn+1,num_turns+2):\n", + " # Calculate the differences in positions for each dimension. 
\n", + " x_diff_i_j, y_diff_i_j, z_diff_i_j = diff_in_pos(start_turn, end_turn, num_dim, lambda_0)\n", + " # Compute the squared distance (Pythagorean theorem) by calculating the squared expansion.\n", + " x_diff_i_j_2, y_diff_i_j_2, z_diff_i_j_2 = cross_multiply(x_diff_i_j,x_diff_i_j), cross_multiply(y_diff_i_j,y_diff_i_j), cross_multiply(z_diff_i_j,z_diff_i_j) \n", + " # Add slack variables due to inequality constraint. \n", + " slack_var_terms = []\n", + " slack_coefficients = generate_slack_coefficients(end_turn-start_turn)\n", + " for s in range(0,len(slack_coefficients)):\n", + " slack_var_terms += [Term(c=-slack_coefficients[s], indices=[num_turns*num_dim+slack_indexer+s])]\n", + " terms += x_diff_i_j_2 + y_diff_i_j_2 + z_diff_i_j_2 + slack_var_terms\n", + " slack_indexer+=len(slack_coefficients)\n", + " return terms\n", + "\n", + "##### ----- Test the function and print output: \n", + "# The output is too large to understand, nevertheless you can run the below statements to view how visualize the term-scaling of the problem.\n", + "number_turns = 2 #play with this value!\n", + "dist_terms = distance_constraint(number_turns, num_dim, lambda_0)\n", + "\n", + "# Only print below statements if you want to get an impression of the number of terms.\n", + "#print('Distance constraint term dictionaries: ', dist_terms) # not readable!\n", + "#print('\\nDistance constraint: ') \n", + "#print_function(dist_terms) # not readable!" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 4. Intermezzo: Slack Variables Weights\n", + "\n", + "To remove any human calculations to construct the distance constraint(s), we'll automate the computation of the number of slack variables and their weights. \n", + "\n", + "As you saw in the previous part, certain slack variables can be assigned weights to reduce the number of slack variables necessary. 
Recall that the range $[0,4]$ can be defined by the following two equations with slack variables (s):\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+q_{s3}+q_{s4} $$\n", + "\n", + "$$ V_{i,j} = [0-4] = q_{s1}+q_{s2}+2q_{s3} $$\n", + "\n", + "The bottom equation is more compact because the last variables carries a weight-2. In Lucas' paper (see 2.4 of arxiv:1302.5843) the algorithm to find such weights is presented, which is based on calculating all $2^{x}$, where $x$ iterates from zero to the log_2 of maximum value in the range (4 in this example). \n", + "\n", + "Below are two examples that may help visualize why and how the slack variables represent the ranges of values. \n", + "\\\n", + " \n", + "\n", + "\n", + "
\n", + "\n", + "Example for range $[0,4]$:\n", + "| $q_{s1}$ | $2q_{s2}$ | $q_{s3}$ | Value |\n", + "| ------ | -------- | -------- | ---------------- |\n", + "| 0 | 0 | 0 | 0 + 2(0) + 0 = 0 |\n", + "| 1 | 0 | 0 | 1 + 2(0) + 0 = 1 |\n", + "| 0 | 1 | 0 | 0 + 2(1) + 0 = 2 |\n", + "| 1 | 1 | 0 | 1 + 2(1) + 0 = 3 |\n", + "| 1 | 1 | 1 | 1 + 2(1) + 1 = 4 | \n", + "\n", + "
\n", + "\n", + "\\\n", + " \n", + "\n", + "
\n", + "\n", + "Example for range $[0,20]$:\n", + "Rather than using twenty optimization variables, five with weights can achieve the same!\n", + "| $q_{s1}$ | $2q_{s2}$ | $4q_{s3}$ | $8q_{s4}$ | $5q_{s5}$ | Value |\n", + "| ------ | ------- | --------- | ----------- | --------- | ------------------- |\n", + "| 0 | 0 | 0 | 0 | 0 | 0 + 2(0) + 4(0) + 8(0) + 5(0) = 0 |\n", + "| 1 | 0 | 0 | 0 | 0 | 1 + 2(0) + 4(0) + 8(0) + 5(0) = 1 |\n", + "| 0 | 1 | 0 | 0 | 0 | 0 + 2(1) + 4(0) + 8(0) + 5(0) = 2 |\n", + "| 1 | 1 | 0 | 0 | 0 | 1 + 2(1) + 4(0) + 8(0) + 5(0) = 3 |\n", + "| 0 | 0 | 1 | 0 | 0 | 0 + 2(0) + 4(1) + 8(0) + 5(0) = 4 |\n", + "| ... | ... | ... | ... | ... | ... |\n", + "| 0 | 1 | 0 | 1 | 1 |0 + 2(1) + 4(0) + 8(1) + 5(1)= 15 |\n", + "| 1 | 1 | 0 | 1 | 1 |1 + 2(1) + 4(0) + 8(1) + 5(1)= 16 |\n", + "| 0 | 0 | 1 | 1 | 1 |0 + 2(0) + 4(1) + 8(1) + 5(1)= 17 |\n", + "| 1 | 0 | 1 | 1 | 1 |1 + 2(0) + 4(1) + 8(1) + 5(1)= 18 |\n", + "| 0 | 1 | 1 | 1 | 1 |0 + 2(1) + 4(1) + 8(1) + 5(1)= 19 |\n", + "| 1 | 1 | 1 | 1 | 1 |1 + 2(1) + 4(1) + 8(1) + 5(1)= 20 |\n", + "\n", + "
\n", + "\n", + "\\\n", + " \n", + "\n", + "The function is given below. In context of the distance constraint, we're still faced with a minor problem. If $(j-i)^2-1$ equals 0, then we don't need any slack variables. The reason for this is that the range becomes $[0,0]$, which can also be represented by no variables at all. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def generate_slack_coefficients(turn_diff: int):\n", + "\n", + " ''' \n", + " Purpose: \n", + " Calculates the number of slack variables and their weights.\n", + " Example:\n", + " For the constraint: x1 + x2 + x3 + x4 <= 4 which is converted to x1 + x2 + x3 + x4 + s1 + s2 +2*s3 = 4, \n", + " with 's' being slack variables. This function computes the weights of these slack variables ([1,1,2] for the example).\n", + " Reference:\n", + " Lucas' paper (see 2.4 of arxiv:1302.5843)\n", + " Input:\n", + " 1. turn_diff: the differences in turns (end_turn - start_turn).\n", + " Output:\n", + " 1. y: the weights of the slack variables.\n", + " '''\n", + " \n", + " dist_diff = (turn_diff**2)-1\n", + " if dist_diff == 0:\n", + " y = [] # no slack variables needed\n", + " elif dist_diff > 0:\n", + " M = floor(log2(dist_diff))\n", + " y = [-2**n for n in range(M)]\n", + " y.append(-(dist_diff + 1 - 2**M))\n", + " return y\n", + "\n", + "##### ----- Test the function and print output: \n", + "turn_difference = 3 # play with this value!\n", + "slack_weights = generate_slack_coefficients(turn_difference)\n", + "print('Slack weights: ', slack_weights) \n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 5. No Return Constraint\n", + "\n", + "The distance constraint enforces a minimum distance of 1 between the different taken positions. However, for two consecutive turns, it does not completely prevent (to a high enough degree) going to a previous position. 
A simplified explanation for this is that the distance constraint is described through the positional differences in $x$, $y$, and $z$. Additionally, for consecutive turns, the number of slack variables is zero ($(j-i)^2-1 = 0$ for consecutive turns) - thus there is no auxiliary benefit introduced by slack variables to compensate for being in a different position after the turn. Therefore, the solver will try to keep the positions as close to each other as possible, which leads to overlapping positions, especially in consecutive turns. To overcome this, a penalization needs to be introduced that stops returning to the previous position held in the turn before. For example, what we want to stop is the following:\n", + "\n", + "$$ \\text{Turn 1: A to B.} $$\n", + "$$ \\text{Turn 2: B to A.} $$\n", + "\n", + "This can be equivalently described as moving in opposite directions over the consecutive turns. For example, first going in the \"+y\" direction, and following that moving in the \"-y\" direction. \n", + "\n", + "Designing such a constraint is straightforward: the opposite direction variables need to be multiplied. \n", + "Preventing a revisit of a position for the \"x\" direction over the first and second turn can be described by the following constraint:\n", + "\n", + "$$ {\\lambda}_1(d^{1}_{+x} d^{2}_{-x} + d^{1}_{-x}d^{2}_{+x}) $$ \n", + "\n", + "If a move is made in the \"+x\" direction first, $d^{1}_{+x}$ takes value 1. If afterwards a move is made in the \"-x\" direction, $d^{2}_{-x}$ also takes value 1, meaning that the combined term\n", + "$d^{1}_{+x} d^{2}_{-x}$ also becomes 1, enforcing the constraint with penalty value ${\\lambda}_1$. 
\n", + "\n", + "Generalizing the idea to any direction and for all turns, we find the \"no return constraint\":\n", + "\n", + "$$ {\\lambda}_1 \\left( \\sum_{m}^{\\in \\{x,y,z\\} }\\sum_{t=1}^{N-1} d^{t}_{+m} d^{t+1}_{-m} + d^{t}_{-m}d^{t+1}_{+m} \\right) $$ \n", + "\n", + "In this constraint, iterations are performed over the different dimensions ($m$), and the turn ($t$). The function defintion for the no return constraint is given below. Make sure to read the docstring. In the function the 'cross_multiply' method is used to expand and calculate all the necessary terms of the constraint. The direction variables are dictionaries of polynomials, and therefore have to be expanded before submitting to the Azure QIO solvers.\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def no_return_constraint(num_turns: int, num_dim: int, lamda_4: int)-> list:\n", + " \n", + " '''\n", + " Purpose:\n", + " Build the constraint that penalizes going back to the same position/node two turns later.\n", + " Example:\n", + " Node A ---> ---> Node B ---> ---> Node A => erroneous as we've been there already.\n", + " Two sequential moves may not be in the same dimension and in opposite directions: (+x then -x), (-x then +x), (+y then -y) etc.\n", + " Inputs:\n", + " 1. num_turns: the number of turns.\n", + " 2. num_dim : the number of dimensions, which is 3 for this sample.\n", + " 3. lambda_4 : the penalty weight for this constraint.\n", + " Outputs:\n", + " 1. 
List of term objects.\n", + " '''\n", + "\n", + " terms = []\n", + " for i in range(0,num_turns):\n", + " x_out_in = cross_multiply(direction_variables(\"+x\",i*num_dim,1,1,lamda_4), direction_variables(\"-x\",(i+1)*num_dim,1,1,lamda_4))\n", + " x_in_out = cross_multiply(direction_variables(\"-x\",i*num_dim,1,1,lamda_4), direction_variables(\"+x\",(i+1)*num_dim,1,1,lamda_4))\n", + " y_right_left = cross_multiply(direction_variables(\"+y\",i*num_dim,1,1,lamda_4), direction_variables(\"-y\",(i+1)*num_dim,1,1,lamda_4))\n", + " y_left_right = cross_multiply(direction_variables(\"-y\",i*num_dim,1,1,lamda_4), direction_variables(\"+y\",(i+1)*num_dim,1,1,lamda_4))\n", + " z_up_down = cross_multiply(direction_variables(\"+z\",i*num_dim,1,1,lamda_4), direction_variables(\"-z\",(i+1)*num_dim,1,1,lamda_4))\n", + " z_down_up = cross_multiply(direction_variables(\"-z\",i*num_dim,1,1,lamda_4), direction_variables(\"+z\",(i+1)*num_dim,1,1,lamda_4))\n", + " terms += x_out_in + x_in_out + y_right_left + y_left_right + z_up_down + z_down_up\n", + " return terms\n", + "\n", + "\n", + "##### ----- Test the function and print output: \n", + "number_turns = 1 # play with this value!\n", + "nrc_terms = no_return_constraint(number_turns, num_dim, lambda_1)\n", + "print('No return constraint term dictionaries: ', nrc_terms)\n", + "print('\\n No return constraint function:')\n", + "print_function(nrc_terms)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 6. Penalize Invalid Moves\n", + "\n", + "Recall that there are two invalid optimization variable substrings that are not associated with any move, $000$ and $111$. A path that includes these substrings is invalid. To prevent the solver from generating these invalid directions we'll need to add two constraints. 
Each constraint is specific to an invalid direction, and because we're working directly with the substring we don't need the abstraction layers used in previous constraints, like directional and positional variables. \n", + "\n", + "Let's first work out the constraint for preventing substring $000$. $ q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma} $ may not equal $000$, where $\\gamma = 3(k-1)$ and $k$ is the turn number. If we were to design the constraint as $ q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma} $ there won't be any penalty, because all $q$'s will equal zero and therefore multiply to zero. Therefore, if all these $q$'s equal zero, we need the expression to multiply to 1. This is achieved by the following, which multiplies to one if all optimization variables take the value zero:\n", + "\n", + "$$ {\\lambda}_2(1-q_{0+\\gamma}) (1-q_{1+\\gamma}) (1-q_{2+\\gamma}) $$\n", + "$$ \\text{If } \\hspace{0.1cm} q_{0+\\gamma} = q_{1+\\gamma} = q_{2+\\gamma} = 0, \\hspace{0.1cm} \\text{then: } $$ \n", + "$$ {\\lambda}_2(1-q_{0+\\gamma}) (1-q_{1+\\gamma}) (1-q_{2+\\gamma}) = {\\lambda}_2 \\cdot 1 $$\n", + "\n", + "\n", + "Nice! By expanding the equation and neglecting constant terms a constraint is found that can be implemented:\n", + "\n", + "$$\\text{Constraint for 000: }{\\lambda}_2(-q_{0+\\gamma}-q_{1+\\gamma}-q_{2+\\gamma}+q_{0+\\gamma}q_{1+\\gamma}+q_{0+\\gamma}q_{2+\\gamma}+q_{1+\\gamma}q_{2+\\gamma}-q_{0+\\gamma}q_{1+\\gamma}q_{2+\\gamma})$$\n", + "\n", + "Before going to the function definition, let's first look at penalizing the substring $111$. Luckily this is much easier as the substring multiplies to 1 if all the $q$'s have the value one. 
The constraint is therefore simple to derive:\n", + "\n", + "$$ {\\lambda}_3 (q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma}) $$\n", + "$$ \\text{If } \\hspace{0.1cm} q_{0+\\gamma} = q_{1+\\gamma} = q_{2+\\gamma} = 1, \\hspace{0.1cm} \\text{then: } $$ \n", + "$$ {\\lambda}_3 (q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma}) = {\\lambda}_3 \\cdot 1$$\n", + "\n", + "The constraint for the substring $111$ is:\n", + "\n", + "$$ \\text{Constraint for $111$: }\\hspace{0.1cm} {\\lambda}_3 (q_{0+\\gamma} q_{1+\\gamma} q_{2+\\gamma}) $$\n", + "\n", + "The function definitions for these two constraints are given below. \n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def penalize_000(len_seq: int, num_dim: int, lambda_2: int) -> list:\n", + "\n", + " '''\n", + " Purpose:\n", + " Build the constraint that penalizes the invalid moves associated with the 3 q's string: '000'.\n", + " The constraint needs to be defined over the set of all turns, as defined by the 'for' loop.\n", + " Example:\n", + " If turn 2 (q_3q_4q_5) equals '000', assign a large penalty.\n", + " Inputs:\n", + " 1. len_seq: the number nodes to consider.\n", + " 2. num_dim: the number of dimensions (which is 3).\n", + " 3. lambda_2: the penalty weight for this constraint.\n", + " Outputs:\n", + " 1. 
List of term objects.\n", + " '''\n", + " \n", + " terms = []\n", + " for k in range(0,len_seq):\n", + " offset = k*num_dim\n", + " term_0 = Term(c=-1*lambda_2,indices=[0+offset])\n", + " term_1 = Term(c=-1*lambda_2,indices=[1+offset])\n", + " term_2 = Term(c=-1*lambda_2,indices=[2+offset])\n", + " term_3 = Term(c= 1*lambda_2,indices=[0+offset,1+offset])\n", + " term_4 = Term(c= 1*lambda_2,indices=[0+offset,2+offset])\n", + " term_5 = Term(c= 1*lambda_2,indices=[1+offset,2+offset])\n", + " term_6 = Term(c=-1*lambda_2,indices=[0+offset,1+offset,2+offset])\n", + " terms += [term_0, term_1, term_2, term_3, term_4, term_5, term_6]\n", + " return terms\n", + "\n", + "def penalize_111(len_seq: int, num_dim: int, lambda_3: int) -> list:\n", + "\n", + " '''\n", + " Purpose:\n", + " Build the constraint that penalizes the invalid moves associated with the 3 q's string: '111'.\n", + " The constraint needs to be defined over the set of all turns, as defined by the 'for' loop.\n", + " Example:\n", + " If turn 2 (q_3q_4q_5) equals '111', assign a large penalty.\n", + " Inputs:\n", + " 1. len_seq: the number nodes to consider.\n", + " 2. num_dim: the number of dimensions (which is 3 in this sample).\n", + " 3. lambda_3: the penalty weight for this constraint.\n", + " Outputs:\n", + " 1. 
List of term objects.\n", + " '''\n", + "\n", + " terms = []\n", + " for k in range(0,len_seq):\n", + " offset = k*num_dim \n", + " terms += [Term(c=1*lambda_3,indices=[0+offset,1+offset,2+offset])]\n", + " return terms\n", + "\n", + "\n", + "##### ----- Test the function and print output: \n", + "term_000 = penalize_000(len_seq, num_dim, lambda_2) \n", + "term_111 = penalize_111(len_seq, num_dim, lambda_3) \n", + "print('Term dictionary penalty constraint for 000:', term_000, '\\n')\n", + "print('Term dictionary penalty constraint for 111:', term_111, '\\n')\n", + "print('Function for penality 000: ')\n", + "print_function(term_000)\n", + "print('Function for penality 111: ')\n", + "print_function(term_111)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Part 7. Parsing and validating the solution\n", + "\n", + "We've finished defining the optimization function. The next step is to start looking at how we're going to submit it to the solvers and analyze the returned results. \n", + "First let's look at how to parse, validate, and visualize the results, since that will make tuning the solvers easier!\n", + "\n", + "Below you can find the function definition that reads the solution and validates it. The solution dictionary is first read out to the optimiation variable string that describes the path. Afterward, the substrings that represent the directions are translated to linguistic terms, such that the solution can be printed in a human-readable format. Based on these two steps, the validation process checks if any constraints are violated. If constraints are violated warnings will be shown in the output with some tuning suggestions.\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "def read_validate_solution(solution: dict, num_turns: int, num_dim: int):\n", + " \n", + " '''\n", + " Purpose:\n", + " To validate the solution returned by the solver. 
Make it readable, and analyze if it makes sense.\n", + " Inputs:\n", + " 1. solution: The solution results dictionary which is returned by the solver (results[\"configuration\"]).\n", + " 2. num_turns: The number of turns for the simulation.\n", + " 3. num_dim: The number of dimensions, which is 3 for this sample (3D).\n", + " Outputs:\n", + " 1. valid: A boolean variable that specifies the validity of the solution.\n", + " 2. pos_dit: Layered position dictionary that contains all of the nodes' locations per turn {turn: {x: x_pos, y:y_pos, z:z_pos}}.\n", + " 3. dir_dict: Dictionary containing the linguistic interpretation of the 6 directions.\n", + " 4. var_dict: Dictionary containing the spin per optimization variable.\n", + " 5. x_arr: Array of x positions.\n", + " 6. y_arr: Array of y positions.\n", + " 7. z_arr: Array of z positions. \n", + " '''\n", + "\n", + " print('\\n')\n", + " valid = True\n", + " move = ''\n", + " sol_str = ''\n", + " x_arr = [0]\n", + " y_arr = [0]\n", + " z_arr = [0]\n", + " dir_dict = {'100':'out','010':'in','001':'right','110':'left','101':'up','011':'down'}\n", + " pos_dict = {0:{\"x\":0, \"y\":0, \"z\":0}}\n", + " var_dict = {}\n", + " for key,val in solution:\n", + " if key<(num_turns*num_dim):\n", + " turn = floor(key/num_dim)+1\n", + " print(\"Turn: \"+str(turn),\"var: \"+str(key),\"spin: \"+str(val))\n", + " var_dict |= {str(key): val}\n", + " if key%3 list: + + ''' + Purpose: + Translates the direction (+x,-x,+y,-y,+z,-z) of turn 'i' as a function of three q's. (Three optimization variables because of the defined coordinate system). + Example: + Direction "+z" in the first turn (turn = 1) is translated to: q_{0+offset}q_{2+offset}-q_{0+offset}q_{1+offset}q_{2+offset}. + Inputs: + 1. direction: A direction from an x-y-z coordinate system, one of the following: ('+x','-x','+y','-y','+z','-z'). + 2. offset: Offset gives the turn number expressed in the first q of that turn. + Example: Turn 1 starts with q_0, offset=0. 
Turn 2 starts with q_3, offset = 3. + 3. sign_dir: Changes the sign of the weights corresponding to negative directions "-x", "-y", "-z" -> necessary for finding the positions, for exmaple (+x) "-" (-x). + 4. sign_pos: Changes the sign of the weights corresponding to negative positions "-(x,y,z)" -> necessary for finding the distances between node "i" and node "j". + 5. lambda_: The weight term associated with a constraint. + Output: + 1. A list of term objects. + ''' + + terms = [] + if direction == "+x": + term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset]) + term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset]) + term_2 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset]) + term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1, term_2, term_3] + elif direction == "-x": + term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset]) + term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset]) + term_2 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset]) + term_3 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1, term_2, term_3] + elif direction == "+y": + term_0 = Term(c= 1*sign_pos*lambda_, indices=[2+offset]) + term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 2+offset]) + term_2 = Term(c=-1*sign_pos*lambda_, indices=[1+offset, 2+offset]) + term_3 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1, term_2, term_3] + elif direction == "-y": + term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset]) + term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1] + elif direction == "+z": + term_0 = Term(c= 1*sign_pos*lambda_, indices=[0+offset, 2+offset]) + term_1 = Term(c=-1*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1] + elif direction == 
"-z": + term_0 = Term(c= 1*sign_dir*sign_pos*lambda_, indices=[1+offset, 2+offset]) + term_1 = Term(c=-1*sign_dir*sign_pos*lambda_, indices=[0+offset, 1+offset, 2+offset]) + terms = [term_0, term_1] + return terms + +def print_cost_function(terms: list): + + ''' + Purpose: + Takes a list of terms and prints it out as a (mathematical) cost function. + Example: + {'c': 1, 'ids': [0, 10, 11, 12]} ---> 1q_0q_10q_11q_12 + Inputs: + 1. terms: the list of terms. + ''' + + final_string = '' + final_string = '' + for term in terms: + term = term.to_dict() + weight = term['c'] + ids = term['ids'] + string = '(' + if weight >= 0: + string = '+' + '('+str(weight) + if weight < 0: + string = '-' + '(' + str(abs(weight)) + for id_ in ids: + string = string + f'q_{id_}' + string = string + ')' + final_string = final_string + string + print('[' + final_string + ']') + + +def generate_slack_coefficients(turn_diff: int): + + ''' + Purpose: + Calculates the number of slack variables and their weights. + Example: + For the constraint: x1 + x2 + x3 + x4 <= 4 which is converted to x1 + x2 + x3 + x4 + s1 + s2 +2*s3 = 4, + with 's' being slack variables. This function computes the weights of these slack variables ([1,1,2] for the example). + Input: + 1. turn_diff: the differences in turns (end_turn - start_turn). + Output: + 1. y: the weights of the slack variables. 
def diff_in_pos(start_turn: int, end_turn: int, num_dim: int, lamda_: int):

    '''
    Purpose:
        Expresses the difference in position (x,y,z) between two turns as a function of the encoding of the directions.
        For every turn in the inclusive range [start_turn, end_turn] the "+" and "-" direction terms of each
        dimension are appended, with the "-" direction requested with sign_dir = -1 so that it is subtracted.
    Example:
        start_turn = 1, end_turn = 2, num_dim = 3:
        x_diff = [ move(+x, offset 0) - move(-x, offset 0) ] + [ move(+x, offset 3) - move(-x, offset 3) ]
        Note: only one 'move' per turn gets activated as they are represented by the same q's (ex. turn 1 is represented by q_0, q_1, and q_2).
    Inputs:
        1. start_turn: the initial (reference) turn.
        2. end_turn: the final (target) turn.
        3. num_dim: the number of dimensions (3, x-y-z coordinate system); used as the stride between turns.
        4. lamda_: the weight passed on to every direction term.
    Outputs:
        1. The difference in the x direction (list of terms).
        2. The difference in the y direction (list of terms).
        3. The difference in the z direction (list of terms).
        All three lists are empty when the turn arguments fail the validity check below.
    '''

    # Three independent lists are required here. A chained assignment
    # (x_diff = y_diff = z_diff = []) binds all three names to ONE list, so the
    # in-place '+=' below would mix the x, y and z terms into a single result.
    x_diff, y_diff, z_diff = [], [], []
    if start_turn < end_turn and start_turn >= 0 and end_turn >= 1:
        # NOTE(review): the loop includes start_turn itself and maps turn t to offset (t-1)*num_dim,
        # so start_turn = 0 produces a negative offset - confirm the intended turn indexing with the callers.
        for turn in range(start_turn, end_turn+1):
            offset = (turn-1)*num_dim
            x_diff += direction_variables("+x",offset,1,1,lamda_)+direction_variables("-x",offset,-1,1,lamda_)
            y_diff += direction_variables("+y",offset,1,1,lamda_)+direction_variables("-y",offset,-1,1,lamda_)
            z_diff += direction_variables("+z",offset,1,1,lamda_)+direction_variables("-z",offset,-1,1,lamda_)
    return x_diff, y_diff, z_diff
def penalize_000(len_seq: int, num_dim: int, lambda_2: int) -> list:

    '''
    Purpose:
        Build the constraint that penalizes the invalid move encoded by the substring '000'.
        Per turn the emitted terms are the expansion of (1-q_0)(1-q_1)(1-q_2) without its constant 1,
        each scaled by lambda_2:  -q_0 - q_1 - q_2 + q_0q_1 + q_0q_2 + q_1q_2 - q_0q_1q_2.
    Example:
        If turn 2 (q_3q_4q_5) equals '000', assign a large penalty.
    Inputs:
        1. len_seq: the number of turns to build the penalty for (k = 0 ... len_seq-1).
        2. num_dim: the stride between the first q of consecutive turns (which is 3).
        3. lambda_2: the penalty weight for this constraint.
    Outputs:
        1. List of term objects, seven per turn.
    '''

    # (sign, positions inside the turn) for every monomial of the expansion, in output order.
    monomials = (
        (-1, (0,)),
        (-1, (1,)),
        (-1, (2,)),
        (1, (0, 1)),
        (1, (0, 2)),
        (1, (1, 2)),
        (-1, (0, 1, 2)),
    )

    terms = []
    for turn in range(len_seq):
        base = turn*num_dim
        terms.extend(
            Term(c=sign*lambda_2, indices=[position+base for position in positions])
            for sign, positions in monomials
        )
    return terms
lambda_4 : the penalty weight for this constraint. + Outputs: + 1. List of term objects. + ''' + + terms = [] + for i in range(0,num_turns): + x_out_in = cross_multiply(direction_variables("+x",i*num_dim,1,1,lamda_4), direction_variables("-x",(i+1)*num_dim,1,1,lamda_4)) + x_in_out = cross_multiply(direction_variables("-x",i*num_dim,1,1,lamda_4), direction_variables("+x",(i+1)*num_dim,1,1,lamda_4)) + y_right_left = cross_multiply(direction_variables("+y",i*num_dim,1,1,lamda_4), direction_variables("-y",(i+1)*num_dim,1,1,lamda_4)) + y_left_right = cross_multiply(direction_variables("-y",i*num_dim,1,1,lamda_4), direction_variables("+y",(i+1)*num_dim,1,1,lamda_4)) + z_up_down = cross_multiply(direction_variables("+z",i*num_dim,1,1,lamda_4), direction_variables("-z",(i+1)*num_dim,1,1,lamda_4)) + z_down_up = cross_multiply(direction_variables("-z",i*num_dim,1,1,lamda_4), direction_variables("+z",(i+1)*num_dim,1,1,lamda_4)) + terms += x_out_in + x_in_out + y_right_left + y_left_right + z_up_down + z_down_up + return terms + + + +def read_validate_solution(solution: dict, num_turns: int, num_dim: int): + + ''' + Purpose: + To validate the solution returned by the solver. Make it readable, and analyze if it makes sense. + Inputs: + 1. solution: The solution results dictionary which is returned by the solver (results["configuration"]). + 2. num_turns: The number of turns for the simulation. + 3. num_dim: The number of dimensions, which is 3 for this sample (3D). + Outputs: + 1. valid: A boolean variable that specifies the validity of the solution. + 2. pos_dit: Layered position dictionary that contains all of the nodes' locations per turn {turn: {x: x_pos, y:y_pos, z:z_pos}}. + 3. dir_dict: Dictionary containing the linguistic interpretation of the 3-substring directions. + 4. var_dict: Dictionary containing the spin per optimized variable + 5. x_arr: Array of x positions. + 6. y_arr: Array of y positions. + 7. z_arr: Array of z positions. 
+ ''' + + print('\n') + valid = True + move = '' + sol_str = '' + x_arr = [0] + y_arr = [0] + z_arr = [0] + dir_dict = {'100':'out','010':'in','001':'right','110':'left','101':'up','011':'down'} + pos_dict = {0:{"x":0, "y":0, "z":0}} + var_dict = {} + for key,val in solution: + if key<(num_turns*num_dim): + turn = floor(key/num_dim)+1 + print("Turn: "+str(turn),"var: "+str(key),"spin: "+str(val)) + var_dict |= {str(key): val} + if key%3