amolk · October 25, 2025 18:53
diff --git a/langfuse_export_trace.py b/langfuse_export_trace.py
 import argparse
 import json
 import tempfile
 from datetime import datetime

 import dotenv
 from langfuse import Langfuse
 from langfuse.client import os

 dotenv.load_dotenv()


 class DateTimeEncoder(json.JSONEncoder):
    """Custom JSON encoder that handles datetime objects and other non-serializable types."""

    def default(self, obj):
        if isinstance(obj, datetime):
            return "[redacted]"
        # Handle Pydantic models
        if hasattr(obj, "model_dump"):
            return obj.model_dump(mode="python")
        # Handle objects with __dict__
        if hasattr(obj, "__dict__"):
            return vars(obj)
        # Fallback to string representation
        return str(obj)


 # Initialize Langfuse client
 langfuse = Langfuse(
    secret_key=os.getenv("LANGFUSE_SECRET_KEY"),
    public_key=os.getenv("LANGFUSE_PUBLIC_KEY"),
    host=os.getenv("LANGFUSE_HOST"),  # Adjust for your region
 )
 if not langfuse:
    raise ValueError(
        "Failed to initialize Langfuse client. Check your environment variables in .env file."
        "LANGFUSE_SECRET_KEY, LANGFUSE_PUBLIC_KEY, and LANGFUSE_HOST must be set."
    )


 def get_nested_observations(observations):
    """Organize observations hierarchically."""
    # Convert observations to dictionaries if they're objects
    obs_list = []
    for obs in observations:
        if hasattr(obs, "__dict__"):
            # If it's an object, convert to dict
            obs_dict = (
                obs.model_dump(mode="python")
                if hasattr(obs, "model_dump")
                else vars(obs)
            )
        else:
            # If it's already a dict, use as-is
            obs_dict = obs
        obs_list.append(obs_dict)

    observation_map = {obs["id"]: obs for obs in obs_list}
    for obs in obs_list:
        parent_id = obs.get("parentObservationId")
        if parent_id and parent_id in observation_map:
            parent = observation_map[parent_id]
            if "children" not in parent:
                parent["children"] = []
            parent["children"].append(obs)
    return [obs for obs in obs_list if not obs.get("parentObservationId")]


 def export_observations(trace_id, save_to_file=False):
    try:
        # Fetch the trace and its observations
        trace_response = langfuse.fetch_trace(trace_id)
        observations_response = langfuse.fetch_observations(trace_id=trace_id)

        # Convert trace response to dictionary
        if hasattr(trace_response, "model_dump"):
            trace_dict = trace_response.model_dump(mode="python")
        elif hasattr(trace_response, "__dict__"):
            trace_dict = vars(trace_response)
        else:
            trace_dict = trace_response

        # Extract observations from the response object
        observations = (
            observations_response.observations
            if hasattr(observations_response, "observations")
            else observations_response.data
        )

        # Convert ObservationsView to list if needed
        if not isinstance(observations, list):
            observations = list(observations)

        # Structure the observations hierarchically
        structured_observations = get_nested_observations(observations)

        # Create the JSON export object
        export_data = {
            "trace": trace_dict.get("name", trace_id),
            "observations": structured_observations,
        }

        # Convert to JSON
        json_export = json.dumps(
            export_data, indent=2, sort_keys=True, cls=DateTimeEncoder
        )

        # Output the JSON (or save to a file)
        if save_to_file:
            # Use temp file
            fd, path = tempfile.mkstemp(
                prefix="langfuse_trace_", suffix=".json", dir=tempfile.gettempdir()
            )
            with open(fd, "w") as f:
                f.write(json_export)
                f.flush()
                # Print full file path
            print(path)
        else:
            print(json_export)

    except Exception as e:
        print("Error exporting observations:", e)


 # Example usage
 if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument("--trace-id", type=str, required=True)
    parser.add_argument("--save-to-file", action="store_true")
    args = parser.parse_args()
    export_observations(args.trace_id, args.save_to_file)

 # Setup
 # pip install argparse langfuse dotenv

 # Example usage (stdout)
 # python langfuse_export_trace.py --trace-id <trace_id_1>

 # Example usage (save to file)
 # python langfuse_export_trace.py --save_to_file --trace-id <trace_id_1>

 # Compare two traces (CLI)
 # diff $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_1>) $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_2>)

 # Compare two traces (VSCode)
 # code --diff $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_1>) $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_2>)
	import argparse
	import json
	import tempfile
	from datetime import datetime

	import dotenv
	from langfuse import Langfuse
	from langfuse.client import os

	dotenv.load_dotenv()


	class DateTimeEncoder(json.JSONEncoder):
	"""Custom JSON encoder that handles datetime objects and other non-serializable types."""

	def default(self, obj):
	if isinstance(obj, datetime):
	return "[redacted]"
	# Handle Pydantic models
	if hasattr(obj, "model_dump"):
	return obj.model_dump(mode="python")
	# Handle objects with __dict__
	if hasattr(obj, "__dict__"):
	return vars(obj)
	# Fallback to string representation
	return str(obj)


	# Initialize Langfuse client
	langfuse = Langfuse(
	secret_key=os.getenv("LANGFUSE_SECRET_KEY"),
	public_key=os.getenv("LANGFUSE_PUBLIC_KEY"),
	host=os.getenv("LANGFUSE_HOST"), # Adjust for your region
	)
	if not langfuse:
	raise ValueError(
	"Failed to initialize Langfuse client. Check your environment variables in .env file."
	"LANGFUSE_SECRET_KEY, LANGFUSE_PUBLIC_KEY, and LANGFUSE_HOST must be set."
	)


	def get_nested_observations(observations):
	"""Organize observations hierarchically."""
	# Convert observations to dictionaries if they're objects
	obs_list = []
	for obs in observations:
	if hasattr(obs, "__dict__"):
	# If it's an object, convert to dict
	obs_dict = (
	obs.model_dump(mode="python")
	if hasattr(obs, "model_dump")
	else vars(obs)
	)
	else:
	# If it's already a dict, use as-is
	obs_dict = obs
	obs_list.append(obs_dict)

	observation_map = {obs["id"]: obs for obs in obs_list}
	for obs in obs_list:
	parent_id = obs.get("parentObservationId")
	if parent_id and parent_id in observation_map:
	parent = observation_map[parent_id]
	if "children" not in parent:
	parent["children"] = []
	parent["children"].append(obs)
	return [obs for obs in obs_list if not obs.get("parentObservationId")]


	def export_observations(trace_id, save_to_file=False):
	try:
	# Fetch the trace and its observations
	trace_response = langfuse.fetch_trace(trace_id)
	observations_response = langfuse.fetch_observations(trace_id=trace_id)

	# Convert trace response to dictionary
	if hasattr(trace_response, "model_dump"):
	trace_dict = trace_response.model_dump(mode="python")
	elif hasattr(trace_response, "__dict__"):
	trace_dict = vars(trace_response)
	else:
	trace_dict = trace_response

	# Extract observations from the response object
	observations = (
	observations_response.observations
	if hasattr(observations_response, "observations")
	else observations_response.data
	)

	# Convert ObservationsView to list if needed
	if not isinstance(observations, list):
	observations = list(observations)

	# Structure the observations hierarchically
	structured_observations = get_nested_observations(observations)

	# Create the JSON export object
	export_data = {
	"trace": trace_dict.get("name", trace_id),
	"observations": structured_observations,
	}

	# Convert to JSON
	json_export = json.dumps(
	export_data, indent=2, sort_keys=True, cls=DateTimeEncoder
	)

	# Output the JSON (or save to a file)
	if save_to_file:
	# Use temp file
	fd, path = tempfile.mkstemp(
	prefix="langfuse_trace_", suffix=".json", dir=tempfile.gettempdir()
	)
	with open(fd, "w") as f:
	f.write(json_export)
	f.flush()
	# Print full file path
	print(path)
	else:
	print(json_export)

	except Exception as e:
	print("Error exporting observations:", e)


	# Example usage
	if __name__ == "__main__":
	parser = argparse.ArgumentParser()
	parser.add_argument("--trace-id", type=str, required=True)
	parser.add_argument("--save-to-file", action="store_true")
	args = parser.parse_args()
	export_observations(args.trace_id, args.save_to_file)

	# Setup
	# pip install argparse langfuse dotenv

	# Example usage (stdout)
	# python langfuse_export_trace.py --trace-id <trace_id_1>

	# Example usage (save to file)
	# python langfuse_export_trace.py --save_to_file --trace-id <trace_id_1>

	# Compare two traces (CLI)
	# diff $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_1>) $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_2>)

	# Compare two traces (VSCode)
	# code --diff $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_1>) $(python langfuse_export_trace.py --save_to_file --trace-id <trace_id_2>)
No results found