elixir-cloud-aai · Karanjot786 · Aug 16, 2024 · Aug 19, 2024 · Aug 22, 2024 · Aug 24, 2024
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
@@ -2,43 +2,44 @@ name: CI
 
 on:
   push:
-    branches: [ main ]
+    # '**' matches every branch, including names that contain '/'
+    # (e.g. feature/foo); a single '*' stops at the first '/'.
+    branches: '**'
   pull_request:
-    branches: [ main ]
+    branches: '**'
 
 jobs:
   build:
     runs-on: ubuntu-latest
 
     steps:
-    - uses: actions/checkout@v2
-
-    - name: Set up Python
-      uses: actions/setup-python@v2
-      with:
-        python-version: '3.11'
-
-    - name: Install Poetry
-      run: |
-        curl -sSL https://install.python-poetry.org | python3 -
-        poetry install
-
-    - name: Lint with Ruff
-      run: |
-        poetry run ruff check crategen/
-
-    - name: Type check with Mypy
-      run: |
-        poetry run mypy crategen/
-
-    - name: Run security checks with Bandit
-      run: |
-        poetry run bandit -r crategen/
-
-    - name: Install test dependencies
-      run: |
-        poetry add pytest pytest-cov pytest-mock
-
-    # - name: Run tests
-    #   run: |
-    #     poetry run pytest --cov=crategen
+      - uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.11'
+
+      # Install Poetry with the official installer script, then install the
+      # project's dependencies with it.
+      - name: Install Poetry
+        run: |
+          curl -sSL https://install.python-poetry.org | python3 -
+          poetry install
+
+      - name: Lint with Ruff
+        run: |
+          poetry run ruff check crategen/
+        # NOTE(review): success() is already the implicit condition for a
+        # step, so this `if` looks redundant - confirm and drop if so.
+        if: ${{ success() }}
+
+      - name: Type check with Mypy
+        run: |
+          poetry run mypy crategen/
+
+      - name: Run security checks with Bandit
+        run: |
+          poetry run bandit -r crategen/
+
+      # NOTE(review): `poetry add` edits pyproject.toml / poetry.lock on the
+      # runner at CI time; declaring these as dev dependencies in
+      # pyproject.toml would presumably make runs reproducible - confirm.
+      - name: Install test dependencies
+        run: |
+          poetry add pytest pytest-cov pytest-mock
+
+      # Run the test suite with coverage measured for the crategen package.
+      - name: Run tests
+        run: |
+          poetry run pytest --cov=crategen
diff --git a/crategen/cli.py b/crategen/cli.py
@@ -1,30 +1,37 @@
-import click
 import json
+
+import click
+
 from crategen.converter_manager import ConverterManager
 
+
 @click.command()
-@click.option('--input', prompt='Input file', help='Path to the input JSON file.')
-@click.option('--output', prompt='Output file', help='Path to the output JSON file.')
-@click.option('--conversion-type', prompt='Conversion type', type=click.Choice(['tes-to-wrroc', 'wes-to-wrroc']), help='Type of conversion to perform.')
+@click.option("--input", prompt="Input file", help="Path to the input JSON file.")
+@click.option("--output", prompt="Output file", help="Path to the output JSON file.")
+@click.option(
+    "--conversion-type",
+    prompt="Conversion type",
+    type=click.Choice(["tes-to-wrroc", "wes-to-wrroc"]),
+    help="Type of conversion to perform.",
+)
 def cli(input, output, conversion_type):
-    """
-    Command Line Interface for converting TES/WES to WRROC.
-    """
+    """Command Line Interface for converting TES/WES to WRROC."""
+    # The docstring above doubles as the command's --help text, so the
+    # parameter notes live here instead:
+    #   input           -- path of the JSON file to read.
+    #   output          -- path of the JSON file to write.
+    #   conversion_type -- "tes-to-wrroc" or "wes-to-wrroc"; click.Choice
+    #                      rejects anything else before this body runs.
     manager = ConverterManager()
 
     # Load input data from JSON file
-    with open(input, 'r') as input_file:
+    # Read as UTF-8 explicitly rather than relying on the platform's
+    # locale-dependent default encoding.
+    with open(input, encoding="utf-8") as input_file:
         data = json.load(input_file)
 
     # Perform the conversion based on the specified type
-    if conversion_type == 'tes-to-wrroc':
+    if conversion_type == "tes-to-wrroc":
         result = manager.convert_tes_to_wrroc(data)
-    elif conversion_type == 'wes-to-wrroc':
+    elif conversion_type == "wes-to-wrroc":
         result = manager.convert_wes_to_wrroc(data)
-    
+
     # Save the result to the output JSON file
-    with open(output, 'w') as output_file:
+    # Written as UTF-8 for the same reason the input is read as UTF-8.
+    with open(output, "w", encoding="utf-8") as output_file:
         json.dump(result, output_file, indent=4)
 
-if __name__ == '__main__':
+
+# Invoke the click command when this module is executed as a script.
+if __name__ == "__main__":
     cli()
diff --git a/crategen/converter_manager.py b/crategen/converter_manager.py
@@ -1,6 +1,7 @@
 from .converters.tes_converter import TESConverter
 from .converters.wes_converter import WESConverter
 
+
 class ConverterManager:
     def __init__(self):
         self.tes_converter = TESConverter()

diff --git a/crategen/converters/abstract_converter.py b/crategen/converters/abstract_converter.py
@@ -1,10 +1,11 @@
 from abc import ABC, abstractmethod
 
+
 class AbstractConverter(ABC):
+    """Abstract interface declaring conversion to and from WRROC.
+
+    Subclasses must implement both ``convert_to_wrroc`` and
+    ``convert_from_wrroc``.
+    """
+
     @abstractmethod
     def convert_to_wrroc(self, data):
         """Convert data to WRROC format"""
-    
+
     @abstractmethod
-    def convert_from_wrroc(self, wrroc_data):
+    def convert_from_wrroc(self, data):
         """Convert WRROC data to the original format"""
diff --git a/crategen/converters/tes_converter.py b/crategen/converters/tes_converter.py
@@ -1,52 +1,113 @@
+from datetime import datetime
+
+from pydantic import AnyUrl, ValidationError
+
+from ..models.tes_models import (
+    TESData,
+    TESExecutor,
+    TESInput,
+    TESOutput,
+    TESState,
+    TESTaskLog,
+)
+from ..models.wrroc_models import WRROCDataTES
+from ..validators import validate_wrroc_tes
 from .abstract_converter import AbstractConverter
-from .utils import convert_to_iso8601
+
 
 class TESConverter(AbstractConverter):
+    def convert_to_wrroc(self, data: dict) -> dict:
+        """
+        Convert TES data to WRROC format.
+
+        Args:
+            data: The input TES data; it is validated by constructing a
+                ``TESData`` model from it.
+
+        Returns:
+            The converted WRROC data, after it has been passed to
+            ``validate_wrroc_tes``.
+
+        Raises:
+            ValueError: If the TES data fails ``TESData`` validation.
+        """
+        # Validate TES data
+        try:
+            data_tes = TESData(**data)
+        except ValidationError as e:
+            raise ValueError(f"Invalid TES data: {e.errors()}") from e
+
+        executors = data_tes.executors
+        # Only the first log entry's end time is used; None when there are no logs.
+        end_time = data_tes.logs[0].end_time if data_tes.logs else None
 
-    def convert_to_wrroc(self, tes_data):
-        # Validate and extract data with defaults
-        id = tes_data.get("id", "")
-        name = tes_data.get("name", "")
-        description = tes_data.get("description", "")
-        executors = tes_data.get("executors", [{}])
-        inputs = tes_data.get("inputs", [])
-        outputs = tes_data.get("outputs", [])
-        creation_time = tes_data.get("creation_time", "")
-        end_time = tes_data.get("logs", [{}])[0].get("end_time", "")  # Corrected to fetch from logs
-
-        # Convert to WRROC
         wrroc_data = {
-            "@id": id,
-            "name": name,
-            "description": description,
-            "instrument": executors[0].get("image", None) if executors else None,
-            "object": [{"@id": input.get("url", ""), "name": input.get("path", "")} for input in inputs],
-            "result": [{"@id": output.get("url", ""), "name": output.get("path", "")} for output in outputs],
-            "startTime": convert_to_iso8601(creation_time),
-            "endTime": convert_to_iso8601(end_time),
+            "@id": data_tes.id,
+            "name": data_tes.name,
+            "description": data_tes.description,
+            # Only the first executor's image is carried over as the instrument.
+            "instrument": executors[0].image if executors else None,
+            "object": [
+                {"@id": input.url, "name": input.path} for input in data_tes.inputs
+            ],
+            "result": [
+                {"@id": output.url, "name": output.path} for output in data_tes.outputs
+            ],
+            # NOTE(review): the model values are passed through as-is; if
+            # these fields are datetime objects the dict may not be
+            # JSON-serializable without conversion - confirm against TESData.
+            "startTime": data_tes.creation_time,
+            "endTime": end_time,
         }
+
+        # Presumably raises if the assembled dict is not valid WRROC - confirm
+        # against the validators module.
+        validate_wrroc_tes(wrroc_data)
         return wrroc_data
 
-    def convert_from_wrroc(self, wrroc_data):
-        # Validate and extract data with defaults
-        id = wrroc_data.get("@id", "")
-        name = wrroc_data.get("name", "")
-        description = wrroc_data.get("description", "")
-        instrument = wrroc_data.get("instrument", "")
-        object_data = wrroc_data.get("object", [])
-        result_data = wrroc_data.get("result", [])
-        start_time = wrroc_data.get("startTime", "")
-        end_time = wrroc_data.get("endTime", "")
-
-        # Convert from WRROC to TES
-        tes_data = {
-            "id": id,
-            "name": name,
-            "description": description,
-            "executors": [{"image": instrument}],
-            "inputs": [{"url": obj.get("@id", ""), "path": obj.get("name", "")} for obj in object_data],
-            "outputs": [{"url": res.get("@id", ""), "path": res.get("name", "")} for res in result_data],
-            "creation_time": start_time,
-            "logs": [{"end_time": end_time}],  # Added to logs
-        }
-        return tes_data
+    def convert_from_wrroc(self, data: dict) -> dict:
+        """
+        Convert WRROC data to TES format.
+
+        Args:
+            data: The input WRROC data; it is validated by constructing a
+                ``WRROCDataTES`` model from it.
+
+        Returns:
+            The converted TES data, as the dict form of a ``TESData`` model.
+
+        Raises:
+            ValueError: If the WRROC data fails ``WRROCDataTES`` validation.
+        """
+        # Validate WRROC data
+        try:
+            data_wrroc = WRROCDataTES(**data)
+        except ValidationError as e:
+            raise ValueError(f"Invalid WRROC data: {e.errors()}") from e
+
+        # Convert URL strings to AnyUrl
+        tes_inputs = [
+            TESInput(url=AnyUrl(url=obj.id), path=obj.name)
+            for obj in data_wrroc.object
+        ]
+        tes_outputs = [
+            TESOutput(url=AnyUrl(url=res.id), path=res.name)
+            for res in data_wrroc.result
+        ]
+
+        # Ensure 'image' and 'command' fields are provided; WRROC only
+        # supplies the instrument, so the command defaults to an empty list.
+        tes_executors = [
+            TESExecutor(image=data_wrroc.instrument or "", command=[])
+        ]
+
+        # Carry the WRROC start time back into TES so a TES -> WRROC -> TES
+        # round trip does not lose it. It is parsed the same way as endTime.
+        # NOTE(review): WRROCDataTES is not visible here; getattr keeps this
+        # safe if the model has no `startTime` field - confirm and simplify.
+        start_time_raw = getattr(data_wrroc, "startTime", None)
+        creation_time = (
+            datetime.fromisoformat(start_time_raw) if start_time_raw else None
+        )
+
+        # Ensure correct type for end_time (datetime)
+        end_time = (
+            datetime.fromisoformat(data_wrroc.endTime)
+            if data_wrroc.endTime
+            else None
+        )
+
+        tes_logs = [
+            TESTaskLog(
+                logs=[],
+                metadata=None,
+                start_time=None,
+                end_time=end_time,
+                outputs=[],
+                system_logs=None,
+            )
+        ]
+
+        tes_data = TESData(
+            id=data_wrroc.id,
+            name=data_wrroc.name,
+            description=data_wrroc.description,
+            executors=tes_executors,
+            inputs=tes_inputs,
+            outputs=tes_outputs,
+            creation_time=creation_time,
+            logs=tes_logs,
+            state=TESState.UNKNOWN,
+        )
+
+        # Validate TES data before returning
+        tes_data = TESData(**tes_data.dict())
+        return tes_data.dict()