actions: More JSON Tests
#19

All JSON files were reformatted with the following Python script:

import json
from collections import OrderedDict

files = [
    'schema/network-schema.json',
    'examples/json/network-package-additional-checks.json',
    'examples/json/network-package.json',
    'examples/json/spans-endpoint.json',
    'examples/json/nodes-endpoint.json',
    'examples/json/network-separate-files.json',
    'examples/json/multiple-networks.json',
    'examples/json/api-response.json',
    'examples/json/network-embedded.json',
    'examples/json/network-package-invalid.json',
    'examples/json/network-separate-endpoints.json',
]

for f in files:
    print(f)
    with open(f) as fp:
        data = json.load(fp, object_pairs_hook=OrderedDict)
    with open(f, "w") as fp:
        json.dump(data, fp, ensure_ascii=False, indent=2)
        fp.write('\n')
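For illustration only (not part of the commit), a minimal sketch of what that round trip does: parsing and re-dumping with indent=2, ensure_ascii=False and an explicit trailing newline is what produces the two-space indentation, the minimal float representations (for example 1537459500.00 becoming 1537459500.0) and the newline-at-end-of-file changes visible in the diffs below. The input string here is a hypothetical fragment, not a file from the repository.

import json
from collections import OrderedDict

# Hypothetical single-line input with a trailing-zero float.
raw = '{"value": {"amount": 1537459500.00, "currency": "GHS"}}'

data = json.loads(raw, object_pairs_hook=OrderedDict)
print(json.dumps(data, ensure_ascii=False, indent=2))
# Prints:
# {
#   "value": {
#     "amount": 1537459500.0,
#     "currency": "GHS"
#   }
# }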
odscjames committed Dec 14, 2022
1 parent b74fec7 commit cc35556
Showing 14 changed files with 181 additions and 19 deletions.
2 changes: 1 addition & 1 deletion examples/csv/contracts.csv
@@ -1,2 +1,2 @@
id,contracts/0/id,contracts/0/title,contracts/0/description,contracts/0/type,contracts/0/value/amount,contracts/0/value/currency,contracts/0/dateSigned
a096d627-72e1-4f9b-b129-951b1737bff4,1,NextGen Phase 1 Construction Contract,Contract for the construction of phase 1 of the NextGen network.,private,1537459500.00,GHS,2016-06-30
a096d627-72e1-4f9b-b129-951b1737bff4,1,NextGen Phase 1 Construction Contract,Contract for the construction of phase 1 of the NextGen network.,private,1537459500.0,GHS,2016-06-30
2 changes: 1 addition & 1 deletion examples/csv/spans.csv
@@ -1,2 +1,2 @@
id,spans/0/id,spans/0/name,spans/0/phase/id,spans/0/phase/name,spans/0/status,spans/0/readyForServiceDate,spans/0/start,spans/0/end,spans/0/directed,spans/0/route/type,spans/0/route/coordinates,spans/0/physicalInfrastructureProvider/id,spans/0/physicalInfrastructureProvider/name,spans/0/networkProvider/id,spans/0/networkProvider/name,spans/0/supplier/id,spans/0/supplier/name,spans/0/transmissionMedium,spans/0/deployment,spans/0/deploymentDetails/description,spans/0/darkFibre,spans/0/fibreType,spans/0/fibreTypeDetails/fibreSubtype,spans/0/fibreTypeDetails/description,spans/0/fibreCount,spans/0/fibreLength,spans/0/technologies,spans/0/capacity,spans/0/capacityDetails/description,spans/0/countries
a096d627-72e1-4f9b-b129-951b1737bff4,1,Accra to Kumasi,1,NextGen Phase 1,operational,2018-01-01,1,2,False,LineString,"-0.173,5.626;-0.178,5.807;-0.112,5.971;-0.211,5.963;-0.321,6.170;-0.488,6.290;-0.560,6.421;-0.752,6.533;-0.867,6.607;-1.101,6.585;-1.304,6.623;-1.461,6.727;-1.628,6.713",GH-RGD-CS111111111,FibreCo,GH-RGD-CS222222222,FastWeb,GH-RGD-CS333333333,ProjectCo,fibre,belowGround,Buried in ducts,True,G.652,G.652.D,"CABLED STANDARD ENHANCED SINGLEMODE FIBRE ESMF, LOW WATER PEAK SINGLE MODE FIBRE G.652.D, OS2",24,276000,sdh,4.976,2xSTM-16,GH
a096d627-72e1-4f9b-b129-951b1737bff4,1,Accra to Kumasi,1,NextGen Phase 1,operational,2018-01-01,1,2,False,LineString,"-0.173,5.626;-0.178,5.807;-0.112,5.971;-0.211,5.963;-0.321,6.17;-0.488,6.29;-0.56,6.421;-0.752,6.533;-0.867,6.607;-1.101,6.585;-1.304,6.623;-1.461,6.727;-1.628,6.713",GH-RGD-CS111111111,FibreCo,GH-RGD-CS222222222,FastWeb,GH-RGD-CS333333333,ProjectCo,fibre,belowGround,Buried in ducts,True,G.652,G.652.D,"CABLED STANDARD ENHANCED SINGLEMODE FIBRE ESMF, LOW WATER PEAK SINGLE MODE FIBRE G.652.D, OS2",24,276000,sdh,4.976,2xSTM-16,GH
2 changes: 1 addition & 1 deletion examples/json/api-response.json
@@ -25,4 +25,4 @@
"next": "http://example.com/networks?cursor=100",
"prev": "http://example.com/networks?cursor=96"
}
}
}
2 changes: 1 addition & 1 deletion examples/json/multiple-networks.json
@@ -21,4 +21,4 @@
]
}
]
}
}
2 changes: 1 addition & 1 deletion examples/json/network-embedded.json
@@ -14,4 +14,4 @@
"href": "https://raw.githubusercontent.com/Open-Telecoms-Data/open-fibre-data-standard/0__1__0__beta/schema/network-schema.json"
}
]
}
}
4 changes: 2 additions & 2 deletions examples/json/network-package-additional-checks.json
@@ -44,7 +44,7 @@
[
0,
0
]
]
]
},
"phase": {
@@ -126,4 +126,4 @@
]
}
]
}
}
6 changes: 4 additions & 2 deletions examples/json/network-package-invalid.json
@@ -11,7 +11,9 @@
"type": "LineString",
"properties": ""
},
"transmissionMedium": ["cable"],
"transmissionMedium": [
"cable"
],
"directed": "yes",
"fibreCount": "52"
}
@@ -49,4 +51,4 @@
]
}
]
}
}
10 changes: 5 additions & 5 deletions examples/json/network-package.json
@@ -123,14 +123,14 @@
],
[
-0.321,
6.170
6.17
],
[
-0.488,
6.290
6.29
],
[
-0.560,
-0.56,
6.421
],
[
@@ -284,7 +284,7 @@
"description": "Contract for the construction of phase 1 of the NextGen network.",
"type": "private",
"value": {
"amount": 1537459500.00,
"amount": 1537459500.0,
"currency": "GHS"
},
"dateSigned": "2016-06-30",
@@ -335,4 +335,4 @@
]
}
]
}
}
2 changes: 1 addition & 1 deletion examples/json/network-separate-endpoints.json
@@ -19,4 +19,4 @@
]
}
]
}
}
2 changes: 1 addition & 1 deletion examples/json/network-separate-files.json
@@ -19,4 +19,4 @@
]
}
]
}
}
2 changes: 1 addition & 1 deletion examples/json/nodes-endpoint.json
@@ -7,4 +7,4 @@
"next": "http://example.com/network/1/nodes?cursor=100",
"prev": "http://example.com/network/1/nodes?cursor=96"
}
}
}
2 changes: 1 addition & 1 deletion examples/json/spans-endpoint.json
@@ -7,4 +7,4 @@
"next": "http://example.com/network/1/spans?cursor=100",
"prev": "http://example.com/network/1/spans?cursor=96"
}
}
}
2 changes: 1 addition & 1 deletion schema/network-schema.json
@@ -2062,7 +2062,7 @@
},
"rel": {
"title": "Link relation type",
"description": "The relationship with this related resource, from the open [linkRelationType codelist](https://open-fibre-data-standard.readthedocs.io/en/latest/reference/codelists.html#linkrelationtype). The 'describedby' code must only be used in the first item in the `links` array to link to the schema that describes the structure of the data." ,
"description": "The relationship with this related resource, from the open [linkRelationType codelist](https://open-fibre-data-standard.readthedocs.io/en/latest/reference/codelists.html#linkrelationtype). The 'describedby' code must only be used in the first item in the `links` array to link to the schema that describes the structure of the data.",
"type": "string",
"$comment": "",
"codelist": "linkRelationType.csv",
160 changes: 160 additions & 0 deletions tests/test_json.py
@@ -1,14 +1,174 @@
from warnings import warn
from collections import Counter
from jscc.testing.checks import get_empty_files, get_misindented_files, get_invalid_json_files
from jscc.testing.util import warn_and_assert
from jscc.testing.filesystem import walk_json_data, walk_csv_data
from jscc.schema import is_json_schema
from jscc.testing.checks import validate_items_type, validate_letter_case, validate_schema

import pytest
import os
import json


this_dir = os.path.dirname(os.path.realpath(__file__))
absolute_source_schema_dir = this_dir + '/../schema/'
absolute_source_codelist_dir = this_dir + '/../codelists/'


def test_empty():
    empty_files_paths = [path for path in get_empty_files() if "src/" not in path[0]]
    warn_and_assert(empty_files_paths, "{0} is empty, run: rm {0}", "Files are empty. See warnings below.")


def test_indent():
"""Note this test can often fail on problems that are not to do with indents."""
misindented_files_paths = [path for path in get_misindented_files() if "src/" not in path[0]]
warn_and_assert(
misindented_files_paths,
"{0} is not indented as expected",
"Files are not indented as expected. See warnings below",
)


def test_invalid_json():
    warn_and_assert(
        get_invalid_json_files(excluded=('.git', '.ve', '_static', 'build', 'fixtures', "_build")), "{0} is not valid JSON: {1}", "JSON files are invalid. See warnings below."
    )


schemas = [(path, name, data) for path, name, _, data in walk_json_data(top=absolute_source_schema_dir) if is_json_schema(data) and not path.endswith('tests/schema/meta-schema.json')]
# with open(os.path.join(this_dir, 'schema', 'meta-schema.json')) as fp:
# metaschema = json.load(fp)


# @pytest.mark.parametrize("path,name,data", schemas)
# def test_schema_valid(path, name, data):

# # skip schemas generated by tests for now
# if "schema/testing" in path or "src/" in path:
# return
# validate_json_schema(path, name, data, metaschema)


@pytest.mark.parametrize("path,name,data", schemas)
def test_codelist_enums(path, name, data):
"""
Make sure the codes in the codelist CSVs match the equivalent enums in the schema.
"""
if "src/" in path:
return

errors = 0

codelist_codes = collect_codelist_codes()
codelist_info = collect_codelist_enums(path, data)

for codelist_file, codes in codelist_codes.items():
if codelist_file in codelist_info:
codelist_enum = codelist_info[codelist_file][0]
open_codelist = codelist_info[codelist_file][1]
if not open_codelist and Counter(codelist_enum) != Counter(codes):
errors += 1
warn("""Codelist mismatch:\n
{}: \n
{}\n
{} enum:\n
{}\n
""".format(codelist_file, codes, name, codelist_enum))

assert not errors, "Codelist files and schema enums out of sync, see warnings below."


def test_codelists_used():
    codelist_files = collect_codelist_files(absolute_source_codelist_dir)

    codelists = set()
    for path, name, data in schemas:
        codelists.update(collect_codelist_values(path, data))

    unused_codelists = [codelist for codelist in codelist_files if codelist not in codelists]
    missing_codelists = [codelist for codelist in codelists if codelist not in codelist_files]

    assert len(unused_codelists) == 0, "Codelist files found not in schema: {}".format(unused_codelists)
    assert len(missing_codelists) == 0, "Codelists in schema missing CSVs: {}".format(missing_codelists)


def validate_json_schema(path, name, data, schema):
if name == "codelist-schema.json":
return
errors = 0
errors += validate_schema(path, data, schema)
errors += validate_items_type(path, data)
errors += validate_letter_case(path, data)
assert not errors, "One or more JSON Schema files are invalid. See warnings below."


def collect_codelist_values(path, data, pointer=''):
"""
Collects ``codelist`` values from JSON Schema.
From https://github.com/open-contracting/jscc/blob/main/jscc/testing/checks.py#L674
"""
    codelists = set()

    if isinstance(data, list):
        for index, item in enumerate(data):
            codelists.update(collect_codelist_values(path, item, pointer='{}/{}'.format(pointer, index)))
    elif isinstance(data, dict):
        if 'codelist' in data:
            codelists.add(data['codelist'])

        for key, value in data.items():
            codelists.update(collect_codelist_values(path, value, pointer='{}/{}'.format(pointer, key)))

    return codelists


def collect_codelist_enums(path, data, pointer=''):
"""
Collects values of ``codelist``, ``enum`` and ``openCodelist`` from JSON Schema.
Adapted from collect_codelist_values
"""
codelists = {}

if isinstance(data, list):
for index, item in enumerate(data):
codelists.update(collect_codelist_enums(path, item, pointer='{}/{}'.format(pointer, index)))
elif isinstance(data, dict):
if 'codelist' in data:
if data.get('type') == 'array' and 'items' in data:
codelists[data.get('codelist')] = ((data['items'].get('enum'), data.get('openCodelist')))
else:
codelists[data.get('codelist')] = ((data.get('enum'), data.get('openCodelist')))

for key, value in data.items():
codelists.update(collect_codelist_enums(path, value, pointer='{}/{}'.format(pointer, key)))

return codelists


def collect_codelist_files(schema_dir):
    codelist_files = set()
    for csvpath, csvname, _, fieldnames, _ in walk_csv_data(top=schema_dir):
        if 'Code' in fieldnames:
            codelist_files.add(csvname)

    return codelist_files


def collect_codelist_codes():
"""
Walk through all the codelist CSV files and get just the codes
"""
    codelist_codes = {}
    codelist_csvs = walk_csv_data(top=absolute_source_codelist_dir)
    # (file path, file name, text content, fieldnames, rows)
    for _, codelist_file, _, _, rows in codelist_csvs:
        codes = []
        for row in rows:
            codes.append(row.get('Code'))
        codelist_codes[codelist_file] = codes

    return codelist_codes
