etsap-TIMES · olejandro · Dec 1, 2023 · Nov 24, 2023 · Nov 24, 2023 · Dec 1, 2023
diff --git a/times_reader/datatypes.py b/times_reader/datatypes.py
@@ -61,7 +61,7 @@ class Tag(str, Enum):
     uc_sets = "~UC_SETS"
     uc_t = "~UC_T"
     # This is used by Veda for unit conversion when displaying results
-    # unitconversion = "~UNITCONVERSION"
+    unitconversion = "~UNITCONVERSION"
 
     @classmethod
     def has_tag(cls, tag):
@@ -270,15 +270,28 @@ def _read_mappings(filename: str) -> List[TimesXlMap]:
     def _read_veda_tags_info(
         veda_tags_file: str,
     ) -> Tuple[Dict[Tag, Dict[str, str]], Dict[Tag, Dict[str, list]]]:
+        def to_tag(s: str) -> Tag:
+            # The file stores the tag name in lowercase, and without the ~
+            return Tag("~" + s.upper())
+
+        # Read veda_tags_file
         with resources.open_text("times_reader.config", veda_tags_file) as f:
             veda_tags_info = json.load(f)
+
+        # Check that all the tags we use are present in veda_tags_file
+        tags = {to_tag(tag_info["tag_name"]) for tag_info in veda_tags_info}
+        for tag in Tag:
+            if tag not in tags:
+                print(
+                    f"WARNING: datatypes.Tag has an unknown Tag {tag} not in {veda_tags_file}"
+                )
+
         column_aliases = {}
         row_comment_chars = {}
 
         for tag_info in veda_tags_info:
             if "tag_fields" in tag_info:
-                # The file stores the tag name in lowercase, and without the ~
-                tag_name = "~" + tag_info["tag_name"].upper()
+                tag_name = to_tag(tag_info["tag_name"])
                 # Process column aliases:
                 column_aliases[tag_name] = {}
                 names = tag_info["tag_fields"]["fields_names"]

diff --git a/times_reader/transforms.py b/times_reader/transforms.py
@@ -229,6 +229,10 @@ def normalize_column_aliases(
             )
         else:
             print(f"WARNING: could not find {table.tag} in config.column_aliases")
+        if len(set(table.dataframe.columns)) > len(table.dataframe.columns):
+            raise ValueError(
+                f"Table has duplicate column names (after normalization): {table}"
+            )
     return tables