clearlydefined · RomanIakovlev · Oct 4, 2024 · Sep 18, 2024 · Sep 25, 2024 · Sep 26, 2024
diff --git a/.github/workflows/integration-test.yml b/.github/workflows/integration-test.yml
@@ -10,6 +10,10 @@ permissions:
 jobs:
   test:
     runs-on: ubuntu-latest
+    strategy:
+      max-parallel: 1
+      matrix:
+        dynamicCoordinates: [true, false]
     defaults:
       run:
         working-directory: ./tools/integration
@@ -29,7 +33,7 @@ jobs:
         run: npm test
 
       - name: Trigger harvest and verify completion
-        run: npm run e2e-test-harvest
+        run: DYNAMIC_COORDINATES=${{ matrix.dynamicCoordinates }} npm run e2e-test-harvest
 
       - name: Verify service functions
-        run: npm run e2e-test-service
+        run: DYNAMIC_COORDINATES=${{ matrix.dynamicCoordinates }} npm run e2e-test-service
diff --git a/...rding/src/functions/compareDefinitions.js → tools/integration/lib/compareDefinitions.js b/...rding/src/functions/compareDefinitions.js → tools/integration/lib/compareDefinitions.js
@@ -1,37 +1,5 @@
-const { app } = require("@azure/functions");
-
-app.http("compareDefinitions", {
-  methods: ["POST"],
-  authLevel: "anonymous",
-  handler: async (request, context) => {
-    try {
-      const {
-        productionDoc,
-        stagingDoc,
-        ignoredKeys = [],
-      } = await request.json();
-
-      if (!productionDoc || !stagingDoc) {
-        return {
-          status: 400,
-          body: "Please provide both productionDoc and stagingDoc in the request body",
-        };
-      }
-
-      const result = compareDocuments(stagingDoc, productionDoc, ignoredKeys);
-
-      return {
-        status: 200,
-        jsonBody: result,
-      };
-    } catch (error) {
-      return {
-        status: 400,
-        body: "Error processing request: " + error.message,
-      };
-    }
-  }
-});
+// (c) Copyright 2024, GitHub and ClearlyDefined contributors. Licensed under the MIT license.
+// SPDX-License-Identifier: MIT
 
 function compareDocuments(staging, production, ignoredKeys, path = '') {
     let differences = {};
@@ -49,7 +17,7 @@ function compareDocuments(staging, production, ignoredKeys, path = '') {
         const currentPath = path ? `${path}.${key}` : key;
 
         if (shouldIgnore(currentPath, ignoredKeys)) {
-            continue; // Skip comparison for keys that should be ignored
+            continue;
         }
 
         const stagingValue = staging[key];
@@ -247,4 +215,6 @@ function getType(value) {
     if (value === null) return 'null';
     if (Array.isArray(value)) return 'array';
     return typeof value;
-}
+}
+
+module.exports = { compareDocuments }
diff --git a/tools/integration/test/integration/e2e-test-service/attachmentTest.js b/tools/integration/test/integration/e2e-test-service/attachmentTest.js
@@ -2,15 +2,16 @@
 // SPDX-License-Identifier: MIT
 
 const { callFetch } = require('../../../lib/fetch')
-const { devApiBaseUrl, prodApiBaseUrl, components, definition } = require('../testConfig')
+const { devApiBaseUrl, prodApiBaseUrl, getComponents, definition } = require('../testConfig')
 const { strictEqual } = require('assert')
 
-describe('Validation attachments between dev and prod', function () {
+describe('Validation attachments between dev and prod', async function () {
   this.timeout(definition.timeout * 2)
 
   //Rest a bit to avoid overloading the servers
   afterEach(() => new Promise(resolve => setTimeout(resolve, definition.timeout / 2)))
 
+  const components = await getComponents()
   components.forEach(coordinates => {
     it(`should have the same attachement as prod for ${coordinates}`, () => fetchAndCompareAttachments(coordinates))
   })

diff --git a/tools/integration/test/integration/e2e-test-service/definitionTest.js b/tools/integration/test/integration/e2e-test-service/definitionTest.js
@@ -4,7 +4,7 @@
 const { omit, isEqual, pick } = require('lodash')
 const { deepStrictEqual, strictEqual } = require('assert')
 const { callFetch, buildPostOpts } = require('../../../lib/fetch')
-const { devApiBaseUrl, prodApiBaseUrl, components, definition } = require('../testConfig')
+const { devApiBaseUrl, prodApiBaseUrl, getComponents, definition } = require('../testConfig')
 const nock = require('nock')
 const fs = require('fs')
 
@@ -14,19 +14,16 @@ describe('Validation definitions between dev and prod', function () {
   //Rest a bit to avoid overloading the servers
   afterEach(() => new Promise(resolve => setTimeout(resolve, definition.timeout / 2)))
 
-  describe('Validation between dev and prod', function () {
-    before(() => {
-      loadFixtures().forEach(([url, definition]) =>
-        nock(prodApiBaseUrl, { allowUnmocked: true }).get(url).reply(200, definition)
-      )
-    })
-
+  describe('Validation between dev and prod', function () {
+    // Mocha invokes `describe` callbacks synchronously and does not wait for a returned
+    // promise, so tests must not be registered after an `await`. The component list is
+    // therefore resolved in a `before` hook and checked inside a single test.
+    let components
+
+    before(async function () {
+      components = await getComponents()
+      console.info(`Testing definitions for ${JSON.stringify(components)}`)
+    })
+
+    it('should return the same definition as prod for every component', async function () {
+      // One test now covers the whole list, so the time budget scales with its length.
+      // NOTE(review): the factor 3 (comparison plus the rest period) is an estimate - confirm.
+      this.timeout(definition.timeout * 3 * Math.max(components.length, 1))
+
+      const failures = []
+      for (const [index, coordinates] of components.entries()) {
+        //Rest a bit between components to avoid overloading the servers
+        if (index > 0) await new Promise(resolve => setTimeout(resolve, definition.timeout / 2))
+        try {
+          await fetchAndCompareDefinition(coordinates)
+        } catch (err) {
+          // Keep going so that one mismatch does not hide the others.
+          failures.push(`${coordinates}: ${err.message}`)
+        }
+      }
+      strictEqual(failures.length, 0, `Definitions differ from prod:\n${failures.join('\n')}`)
+    })
-    components.forEach(coordinates => {
-      it(`should return the same definition as prod for ${coordinates}`, () => fetchAndCompareDefinition(coordinates))
-    })
   })
 
-  describe('Validate on dev', function () {
+  describe('Validate on dev', async function () {
+    const components = await getComponents()
     const coordinates = components[0]
 
     describe('Search definitions', function () {

diff --git a/tools/integration/test/integration/e2e-test-service/noticeTest.js b/tools/integration/test/integration/e2e-test-service/noticeTest.js
@@ -3,11 +3,11 @@
 
 const { deepStrictEqual } = require('assert')
 const { callFetch, buildPostOpts } = require('../../../lib/fetch')
-const { devApiBaseUrl, prodApiBaseUrl, components, definition } = require('../testConfig')
+const { devApiBaseUrl, prodApiBaseUrl, getComponents, definition } = require('../testConfig')
 const nock = require('nock')
 const fs = require('fs')
 
-describe('Validate notice files between dev and prod', function () {
+describe('Validate notice files between dev and prod', async function () {
   this.timeout(definition.timeout)
 
   //Rest a bit to avoid overloading the servers
@@ -20,7 +20,7 @@ describe('Validate notice files between dev and prod', function () {
         .reply(200, notice)
     })
   })
-
+  const components = await getComponents()
   components.forEach(coordinates => {
     it(`should return the same notice as prod for ${coordinates}`, () => fetchAndCompareNotices(coordinates))
   })

diff --git a/tools/integration/test/integration/harvestTest.js b/tools/integration/test/integration/harvestTest.js
@@ -1,7 +1,7 @@
 // (c) Copyright 2024, SAP SE and ClearlyDefined contributors. Licensed under the MIT license.
 // SPDX-License-Identifier: MIT
 
-const { components, devApiBaseUrl, harvest } = require('./testConfig')
+const { getComponents, devApiBaseUrl, harvest } = require('./testConfig')
 const Poller = require('../../lib/poller')
 const Harvester = require('../../lib/harvester')
 const { strictEqual } = require('assert')
@@ -10,7 +10,9 @@ describe('Tests for harvesting different components', function () {
   it('should verify all harvests are complete', async function () {
     this.timeout(harvest.timeout)
     console.time('Harvest Test')
-    const status = await harvestTillCompletion(components)
+    const targetDefinitions = await getComponents()
+    console.info(`Recent definitions: ${targetDefinitions}`)
+    const status = await harvestTillCompletion(targetDefinitions)
     for (const [coordinates, isHarvested] of status) {
       strictEqual(isHarvested, true, `Harvest for ${coordinates} is not complete`)
     }

diff --git a/tools/integration/test/integration/testConfig.js b/tools/integration/test/integration/testConfig.js
@@ -1,5 +1,7 @@
 // (c) Copyright 2024, SAP SE and ClearlyDefined contributors. Licensed under the MIT license.
 // SPDX-License-Identifier: MIT
+const fs = require('fs').promises;
+const path = require('path');
 
 const devApiBaseUrl = 'https://dev-api.clearlydefined.io'
 const prodApiBaseUrl = 'https://api.clearlydefined.io'
@@ -11,7 +13,7 @@ const pollingMaxTime = 1000 * 60 * 60 // 60 minutes
 const harvestTools = ['licensee', 'reuse', 'scancode']
 
 //Components to test
-const components = [
+const componentsStatic = [
   'pypi/pypi/-/platformdirs/4.2.0', //Keep this as the first element to test, it is relatively small
   'maven/mavencentral/org.apache.httpcomponents/httpcore/4.4.16',
   'maven/mavengoogle/android.arch.lifecycle/common/1.0.1',
@@ -32,10 +34,47 @@ const components = [
   // 'sourcearchive/mavencentral/org.apache.httpcomponents/httpcore/4.1' // Dev and prod have different license and scores. See https://github.com/clearlydefined/crawler/issues/533
 ]
 
+/**
+ * Reports whether the tests should run against dynamically obtained components.
+ * Only the exact string 'true' in the DYNAMIC_COORDINATES environment variable
+ * enables this; any other value, or an unset variable, yields false.
+ *
+ * @returns {boolean} true when DYNAMIC_COORDINATES is exactly 'true'
+ */
+function shouldUseDynamicComponents() {
+  const { DYNAMIC_COORDINATES: flag } = process.env;
+  return flag === 'true';
+}
+
+/**
+ * Resolves the components the integration tests should run against.
+ *
+ * When dynamic components are not requested, the hard-coded `componentsStatic`
+ * list is returned; otherwise the result of `componentsDynamic()` is returned.
+ * The chosen source is logged either way.
+ *
+ * @returns {Promise<*>} the static coordinate list, or whatever `componentsDynamic()`
+ *   resolves to (presumably an array of coordinate strings - confirm against the endpoint)
+ */
+async function getComponents() {
+  if (!shouldUseDynamicComponents()) {
+    console.info("Using static components");
+    return Promise.resolve(componentsStatic);
+  }
+
+  console.info("Using dynamic components");
+  return componentsDynamic();
+}
+
+/**
+ * Loads the dynamically selected components, using `recentDefinitions.json` next to
+ * this file as an on-disk cache.
+ *
+ * If the cache file can be read and parsed, its content is returned. Otherwise the
+ * list is fetched from the remote endpoint, written to the cache file and returned.
+ * Presumably the cache lets separate test runs share the same list - confirm.
+ *
+ * @returns {Promise<*>} the parsed JSON list (shape is defined by the remote endpoint)
+ * @throws {Error} when the remote endpoint answers with a non-success status, or when
+ *   fetching, parsing or writing the cache file fails
+ */
+const componentsDynamic = async () => {
+  const filePath = path.join(__dirname, 'recentDefinitions.json');
+
+  try {
+    // readFile itself rejects with ENOENT when the file is missing, so no separate
+    // access() probe is needed.
+    const cached = await fs.readFile(filePath, 'utf8');
+    const components = JSON.parse(cached);
+    console.info("Read dynamic components from disk")
+    return components;
+  } catch (err) {
+    // A missing cache file is the expected first-run case. Any other problem
+    // (unreadable or corrupt cache) is reported before falling back to the remote.
+    if (err.code !== 'ENOENT') {
+      console.warn(`Ignoring unusable cache file ${filePath}: ${err.message}`);
+    }
+  }
+
+  const response = await fetch('https://cosmos-query-function-app.azurewebsites.net/api/getrecentdefinitions?days=1&limit=1');
+  // Never cache an error payload as if it were the component list.
+  if (!response.ok) {
+    throw new Error(`Failed to fetch recent definitions: ${response.status} ${response.statusText}`);
+  }
+  const data = await response.json();
+  await fs.writeFile(filePath, JSON.stringify(data, null, 2), 'utf8');
+  console.info("Read dynamic components from remote")
+  return data;
+};
+
 module.exports = {
   devApiBaseUrl,
   prodApiBaseUrl,
-  components,
+  getComponents,
   harvest: {
     poll: { interval: pollingInterval, maxTime: pollingMaxTime }, // for each component
     tools: harvestTools,