bessagroup · GuillaumeBroggi · Apr 28, 2025 · Apr 29, 2025 · Apr 29, 2025 · Apr 28, 2025
diff --git a/.gitignore b/.gitignore
@@ -129,6 +129,7 @@ venv/
 ENV/
 env.bak/
 venv.bak/
+.python-version
 
 # Spyder project settings
 .spyderproject
@@ -161,5 +162,19 @@ cython_debug/
 #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
 #.idea/
 
-# VSCode
-.vscode/
+# Visual Studio Code
+.vscode/
+
+# Local projects
+projects/
+
+# Benchmark
+benchmarks/cfd/*
+!benchmarks/cfd/cylinder_flow.ipynb
+!benchmarks/cfd/utils.py
+
+# Visual Studio Code
+.vscode/
+
+# Local projects
+projects/
diff --git a/benchmarks/cfd/cylinder_flow.ipynb b/benchmarks/cfd/cylinder_flow.ipynb
diff --git a/benchmarks/cfd/utils.py b/benchmarks/cfd/utils.py
@@ -0,0 +1,236 @@
+from pathlib import Path
+import json
+import numpy as np
+
+from urllib.request import urlretrieve
+from tqdm.notebook import tqdm
+import logging
+import pickle
+
+from itertools import count
+import pyvista as pv
+
+
+class DownloadProgressBar(tqdm):
+    """
+    Provides a progress bar compatible with the urlretrieve hook.
+
+    Credit: https://github.com/tqdm/tqdm?tab=readme-ov-file#hooks-and-callbacks
+
+    """
+
+    def update_to(self, n_block, block_size, total_size=None):
+        """
+        Updates the progress bar with the number of blocks transferred.
+
+        Parameters
+        ----------
+        n_block : int, optional
+            Number of blocks transferred so far.
+        block_size : int, optional
+            Size of each block in bytes.
+        total_size : int, optional
+            Total size.
+
+        """
+
+        if total_size is not None:
+            self.total = total_size
+
+        # update() also sets self.n = n_block * block_size
+        self.update(n_block * block_size - self.n)
+
+
+def download_file(file, base_url, dest_path, overwrite=False):
+    """
+    Downloads a file from a given URL to a specified destination path.
+
+    If the file already exists, download is skipped.
+
+    Parameters
+    ----------
+    file : str
+        The name of the file to download.
+
+    base_url : str
+        The base URL from which to download the file.
+
+    dest_path : str
+        The destination path where the file will be saved.
+
+    """
+
+    # Build the full URL
+    url = f"{base_url}/{file}"
+
+    # Validate the destination path
+    dest_path = Path(dest_path).resolve()
+
+    # Check if the file already exists and use it if overwrite is False
+    if (dest_path / file).exists() and not overwrite:
+        # Logging
+        logging.info(msg=f"Using '{file}' cached in in {dest_path}")
+        return
+
+    # Create the destination directory if it doesn't exist
+    dest_path.mkdir(parents=True, exist_ok=True)
+
+    # Logging
+    logging.info(msg=f"Downloading '{file}' to {dest_path}")
+
+    # Download the file with progress bar
+    with DownloadProgressBar(
+        unit="B",
+        unit_scale=True,
+        unit_divisor=1024,
+        miniters=1,
+        desc=file,
+    ) as pbar:
+        urlretrieve(
+            url,
+            filename=dest_path / file,
+            reporthook=pbar.update_to,
+            data=None,
+        )
+
+        # Update the progress bar to reflect the total size in bytes since
+        # total_size's units does not seem to be in bytes
+        pbar.total = pbar.n
+
+
+def parse_tensorflow_dataset(dataset_name, dataset_directory):
+    """
+    Parses a TensorFlow dataset and returns the features.
+
+    Parameters
+    ----------
+    dataset : tf.data.Dataset
+        The TensorFlow dataset to parse.
+
+    """
+    try:
+        import tensorflow as tf
+    except ImportError:
+        err_msg = (
+            "TensorFlow is required to parse the dataset."
+            " See https://www.tensorflow.org/install"
+            " for installation instructions."
+        )
+        raise ImportError(err_msg)
+
+    # Validate the dataset path
+    dataset_directory = Path(dataset_directory).resolve()
+
+    # Load the metadata
+    with open(dataset_directory / "meta.json", "r") as file:
+        metadata = json.load(file)
+
+    # Prepare the dataset path
+    dataset_path = dataset_directory / f"{dataset_name}.tfrecord"
+
+    if not dataset_path.exists():
+        raise FileNotFoundError(
+            f"Dataset '{dataset_name}' not found in {dataset_directory}."
+        )
+
+    # Load the dataset
+    dataset = tf.data.TFRecordDataset(dataset_path)
+
+    # Parse the dataset output path
+    output_path = dataset_directory / dataset_name
+    output_path.mkdir(parents=True, exist_ok=True)
+
+    # Initialize a sample counter
+    sample_cnt = count()
+    # Iterate over the dataset
+    for sample in tqdm(dataset):
+        # Parse the sample
+        sample_data = _parse_tensorflow_sample(sample, metadata)
+        # Prepare a sample path
+        sample_path = output_path / f"{dataset_name}_{next(sample_cnt)}.pkl"
+        # Export the sample to a pickle file
+        with open(sample_path, "wb") as file:
+
+            pickle.dump(sample_data, file)
+
+
+def _parse_tensorflow_sample(sample, metadata):
+    """
+    Parses a single sample from the TensorFlow dataset.
+
+    Credit: https://github.com/google-deepmind/deepmind-research/blob/master/meshgraphnets/dataset.py
+
+    Parameters
+    ----------
+    sample : tf.train.Example
+        The sample to parse.
+
+    metadata : dict
+        The metadata of the dataset.
+
+    """
+
+    try:
+        import tensorflow as tf
+    except ImportError:
+        err_msg = (
+            "TensorFlow is required to parse the dataset."
+            " See https://www.tensorflow.org/install"
+            " for installation instructions."
+        )
+        raise ImportError(err_msg)
+
+    feature_dict = {
+        k: tf.io.VarLenFeature(tf.string) for k in metadata["field_names"]
+    }
+    features = tf.io.parse_single_example(sample, feature_dict)
+    sample_data = {}
+    for key, field in metadata["features"].items():
+        data = tf.io.decode_raw(
+            features[key].values, getattr(tf, field["dtype"])
+        )
+        data = tf.reshape(data, field["shape"])
+        if field["type"] == "static":
+            data = data[0]
+
+        elif field["type"] != "dynamic":
+            raise ValueError("invalid data format")
+        sample_data[key] = data.numpy()
+
+    return sample_data
+
+
+def graph_to_pyvista_mesh(graph):
+    import pyvista as pv
+
+    # Get the mesh vertices, add a third dimension with zeros to make it 3D
+    mesh_vertices = np.insert(arr=graph.pos.numpy(), obj=2, values=0, axis=1)
+
+    # Get the raw sample data which define the mesh cells
+    raw_data_file = (
+        Path("data")
+        / graph.metadata["dataset_name"]
+        / f"{graph.metadata['dataset_name']}"
+        f"_sample_{graph.metadata['sample_id']}.pkl"
+    )
+    with open(raw_data_file, "rb") as file:
+        sample = pickle.load(file)
+
+    # Extract the cells
+    cells = sample["cells"]
+
+    # The cell are already defined as a list of 3 vertices
+    # Add the number of vertices to the beginning of each cell to comply with the
+    # vtk format
+    vtk_faces = np.insert(arr=cells, obj=0, values=3, axis=1)
+
+    # Create the mesh
+    mesh = pv.PolyData(mesh_vertices, faces=vtk_faces)
+
+    # Add the velocity as point data
+    mesh.point_data["velocity"] = graph.x[:, :2].numpy()
+
+    # Add the pressure as point data
+    mesh.point_data["pressure"] = graph.x[:, 2:3].numpy()
+
+    return mesh
diff --git a/requirements.txt b/requirements.txt
@@ -7,8 +7,8 @@ pytest==7.1.2
 scikit_learn==1.3.2
 scipy==1.10.0
 sphinx_rtd_theme==1.2.0
-torch==2.1.0+cu118
-torch_geometric==2.4.0
+torch==2.4.1
+torch_geometric==2.5.0
 tqdm==4.65.0
 shapely==2.0.2
 torchinfo==1.8.0

diff --git a/src/graphorge/gnn_base_model/data/graph_data.py b/src/graphorge/gnn_base_model/data/graph_data.py
@@ -929,7 +929,7 @@ def _check_edges_indexes_matrix(edges_indexes):
         """
         if not isinstance(edges_indexes, np.ndarray):
             raise RuntimeError('Edges indexes matrix is not a numpy.array.')
-        elif edges_indexes.dtype != int:
+        elif not np.issubdtype(edges_indexes.dtype, np.integer):
             raise RuntimeError('Edges indexes matrix is not a numpy.array '
                                'of dtype int.')
         elif len(edges_indexes.shape) != 2: