Add prettify_exec_info util and use it in the Ollama SmartScraper example

VinciGit00 · VinciGit00 · commit 3640434f5c61 · 2024-04-12T12:59:15.000+02:00
diff --git a/examples/local_models/Ollama/smart_scraper_ollama.py b/examples/local_models/Ollama/smart_scraper_ollama.py
@@ -2,7 +2,7 @@
 Basic example of scraping pipeline using SmartScraper
 """
 from scrapegraphai.graphs import SmartScraperGraph
-
+from scrapegraphai.utils import prettify_exec_info
 # ************************************************
 # Define the configuration for the graph
 # ************************************************
@@ -35,3 +35,10 @@
 
 result = smart_scraper_graph.run()
 print(result)
+
+# ************************************************
+# Get graph execution info
+# ************************************************
+
+graph_exec_info = smart_scraper_graph.get_execution_info()
+print(prettify_exec_info(graph_exec_info))
diff --git a/scrapegraphai/utils/__init__.py b/scrapegraphai/utils/__init__.py
@@ -4,3 +4,4 @@
 from .save_audio_from_bytes import save_audio_from_bytes
 from .convert_to_csv import convert_to_csv
 from .convert_to_json import convert_to_json
+from .prettify_exec_info import prettify_exec_info
diff --git a/scrapegraphai/utils/prettify_exec_info.py b/scrapegraphai/utils/prettify_exec_info.py
@@ -0,0 +1,48 @@
+"""
+Prettify the execution information of the graph.
+"""
+
+import pandas as pd
+
+
+def prettify_exec_info(complete_result: dict) -> pd.DataFrame:
+    """
+    Flatten the execution information of the graph into a DataFrame: one row per node plus a final 'Total' row.
+
+    Args:
+    - complete_result (dict): Execution information; keys read are 'nodes_info', 'total_exec_time', 'total_model_info'.
+
+    Returns:
+    - pd.DataFrame: 'Node' and 'Execution Time' columns plus one column per unpacked model-info key.
+    """
+
+    nodes_info = complete_result['nodes_info']
+    total_info = {
+        'total_exec_time': complete_result['total_exec_time'],
+        'total_model_info': complete_result['total_model_info']
+    }
+
+    # Build one flat row per node; each node entry must provide 'exec_time' and 'model_info'
+    flat_data = []
+    for node_name, node_info in nodes_info.items():
+        flat_data.append({
+            'Node': node_name,
+            'Execution Time': node_info['exec_time'],
+            # Spread the node's model_info dict into the row, one column per key
+            **node_info['model_info']
+        })
+
+    df_nodes = pd.DataFrame(flat_data)
+
+    # Build the summary row labelled 'Total' from the graph-wide time and model info
+    total_row = {
+        'Node': 'Total',
+        'Execution Time': total_info['total_exec_time'],
+        # Spread the total_model_info dict into the row, one column per key
+        **total_info['total_model_info']
+    }
+    df_total = pd.DataFrame([total_row])
+
+    # Append the summary row after the node rows and renumber the index from 0
+    df_combined_with_total = pd.concat([df_nodes, df_total], ignore_index=True)
+    return df_combined_with_total