llm_moderation_testing

Running

App Files Files Community

Yacine Jernite commited on 26 days ago

Commit

10d9a6a

1 Parent(s): 06103c4

missing file

Browse files

Files changed (1) hide show

utils/dataset.py +193 -0

utils/dataset.py ADDED Viewed

	@@ -0,0 +1,193 @@

+"""Dataset utilities for saving and loading test results."""
+from datetime import datetime
+from datasets import Dataset, load_dataset
+from huggingface_hub import HfApi
+from utils.model_interface import extract_model_id, get_model_info
+def get_username_from_token(token: str | None) -> str:
+    """
+    Get username from Hugging Face token using whoami.
+    Args:
+        token: HF token string or None
+    Returns:
+        Username string, or "yjernite" as fallback if token is None or whoami fails
+    """
+    if token is None:
+        return "yjernite"
+    try:
+        api = HfApi()
+        user_info = api.whoami(token=token)
+        return user_info.get("name", "yjernite")
+    except Exception:
+        return "yjernite"
+def get_dataset_repo_id(token: str | None) -> str:
+    """
+    Get dataset repository ID for the current user.
+    Args:
+        token: HF token string or None
+    Returns:
+        Dataset repo ID in format "{username}/moderation-test-results"
+    """
+    username = get_username_from_token(token)
+    return f"{username}/moderation-test-results"
+def load_dataset_from_hub(token: str | None) -> tuple[list[dict], Exception | None]:
+    """
+    Load dataset from Hub and return list of examples.
+    Args:
+        token: HF token string or None
+    Returns:
+        Tuple of (list of example dicts, error Exception or None if successful)
+    """
+    repo_id = get_dataset_repo_id(token)
+    try:
+        # Use load_dataset - more standard way to load from Hub
+        dataset_dict = load_dataset(repo_id, token=token)
+        # Get the default split (usually 'train' or first split)
+        dataset = dataset_dict[list(dataset_dict.keys())[0]]
+        # Convert to list of dicts
+        examples = dataset.to_list()
+        return examples, None
+    except FileNotFoundError:
+        # Dataset doesn't exist yet
+        return [], None
+    except Exception as e:
+        # Other errors (network, auth, etc.) - return error
+        return [], e
+def format_categories_and_reasoning(parsed: dict) -> str:
+    """
+    Format categories and reasoning from parsed JSON response.
+    Args:
+        parsed: Parsed JSON dict with 'categories' key
+    Returns:
+        Formatted markdown string
+    """
+    categories = parsed.get("categories", [])
+    if categories and len(categories) > 0:
+        cat_text = "### Categories:\n\n"
+        for cat in categories:
+            category_name = cat.get('category', 'Unknown')
+            reasoning_text = cat.get('reasoning', 'No reasoning provided')
+            policy_source = cat.get('policy_source', '')
+            cat_text += f"- **Category:** {category_name}\n"
+            cat_text += f"  - **Explanation:** {reasoning_text}\n"
+            if policy_source:
+                cat_text += f"  - **Policy Source:** {policy_source}\n"
+            cat_text += "\n\n"
+        return cat_text
+    else:
+        return "*No categories found in response*\n\nThis output expects a valid JSON response, as specified for example in the default prompt.\n\nThe raw response can be seen in the Model Response section below."
+def save_to_dataset(token: str | None, data: dict) -> tuple[bool, str]:
+    """
+    Save test result to Hugging Face dataset.
+    Args:
+        token: HF token string or None
+        data: Dict with all test result fields
+    Returns:
+        Tuple of (success: bool, message: str)
+    """
+    try:
+        repo_id = get_dataset_repo_id(token)
+        # Load existing dataset and examples using shared function
+        examples, load_error = load_dataset_from_hub(token)
+        # If there was an error loading (other than FileNotFoundError), raise it
+        if load_error is not None:
+            raise load_error
+        # Append new example
+        examples.append(data)
+        # Create new dataset with all examples
+        dataset = Dataset.from_list(examples)
+        # Push to hub
+        dataset.push_to_hub(repo_id, token=token)
+        return True, f"Saved to {repo_id}"
+    except FileNotFoundError:
+        # Dataset doesn't exist yet, create new one
+        try:
+            repo_id = get_dataset_repo_id(token)
+            dataset = Dataset.from_list([data])
+            dataset.push_to_hub(repo_id, token=token)
+            return True, f"Saved to {repo_id}"
+        except Exception as e:
+            return False, f"Failed to create new dataset: {str(e)}"
+    except Exception as e:
+        return False, f"Failed to save: {str(e)}"
+def load_dataset_examples(token: str | None) -> tuple[list[dict], list[str]]:
+    """
+    Load examples from Hugging Face dataset.
+    Args:
+        token: HF token string or None
+    Returns:
+        Tuple of (list of example dicts, list of formatted dropdown labels)
+    """
+    # Use shared loading function
+    examples, load_error = load_dataset_from_hub(token)
+    # If there was an error loading, return empty lists
+    if load_error is not None:
+        return [], []
+    if not examples:
+        return [], []
+    # Format dropdown labels
+    labels = []
+    for idx, example in enumerate(examples):
+        input_text = example.get("input", "")
+        model_selection = example.get("model_selection", "")
+        policy_violation = example.get("policy_violation", -1)
+        # Get label emoji
+        if policy_violation == 1:
+            label_emoji = "❌"
+        elif policy_violation == 0:
+            label_emoji = "✅"
+        else:
+            label_emoji = "⚠️"
+        # Extract model name
+        model_id = extract_model_id(model_selection)
+        model_info = get_model_info(model_id) if model_id else None
+        model_name = model_info.get("name", model_id) if model_info else model_id or "Unknown"
+        # Truncate input for label
+        input_preview = input_text[:40] + "..." if len(input_text) > 40 else input_text
+        label = f"{input_preview} - {label_emoji} - {model_name} - #{idx}"
+        labels.append(label)
+    return examples, labels