DataDesigner/tests/config/utils/test_visualization.py
Johnny Greco f8c201e085
chore: update header script to check for diffs (#195)
* update script

* update headers

* refactor a bit and add test script

* update headers

* update for edge case

* update headers

* add step to get file creation date

* use git history to get copyright year

* generation type is printed with inference parameters

* fix unit test
2026-01-09 17:10:58 -05:00

87 lines
3.3 KiB
Python

# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
import pandas as pd
import pytest
from data_designer.config.config_builder import DataDesignerConfigBuilder
from data_designer.config.utils.code_lang import CodeLang
from data_designer.config.utils.visualization import (
display_sample_record,
get_truncated_list_as_string,
mask_api_key,
)
from data_designer.config.validator_params import CodeValidatorParams
@pytest.fixture
def validation_output():
"""Fixture providing a sample validation output structure."""
return {
"is_valid": True,
"python_linter_messages": [],
"python_linter_score": 10.0,
"python_linter_severity": "none",
}
@pytest.fixture
def config_builder_with_validation(stub_model_configs):
"""Fixture providing a DataDesignerConfigBuilder with a validation column."""
builder = DataDesignerConfigBuilder(model_configs=stub_model_configs)
# Add a validation column configuration
builder.add_column(
name="code_validation_result",
column_type="validation",
target_columns=["code"],
validator_type="code",
validator_params=CodeValidatorParams(code_lang=CodeLang.PYTHON),
)
return builder
def test_display_sample_record_twice_no_errors(validation_output, config_builder_with_validation):
"""Test that calling display_sample_record twice on validation output produces no errors."""
# Create a sample record with the validation output
sample_record = {"code": "print('hello world')", "code_validation_result": validation_output}
# Convert to pandas Series to match expected input format
record_series = pd.Series(sample_record)
# Call display_sample_record twice - should not produce any errors
display_sample_record(record_series, config_builder_with_validation)
display_sample_record(record_series, config_builder_with_validation)
# If we reach this point without exceptions, the test passes
assert True
def test_mask_api_key():
# Actual API keys are masked to show last 4 characters
assert mask_api_key("sk-1234567890") == "***7890"
assert mask_api_key("nv-some-api-key") == "***-key"
# Short API keys (4 or fewer chars) show only asterisks
assert mask_api_key("sk-1") == "***"
assert mask_api_key("key") == "***"
# Environment variable names (all uppercase) are kept visible
assert mask_api_key("OPENAI_API_KEY") == "OPENAI_API_KEY"
assert mask_api_key("NVIDIA_API_KEY") == "NVIDIA_API_KEY"
# None or empty returns "(not set)"
assert mask_api_key(None) == "(not set)"
assert mask_api_key("") == "(not set)"
def test_get_truncated_list_as_string():
assert get_truncated_list_as_string([1, 2, 3, 4, 5]) == "[1, 2, ...]"
assert get_truncated_list_as_string([1, 2, 3, 4, 5], max_items=1) == "[1, ...]"
assert get_truncated_list_as_string([1, 2, 3, 4, 5], max_items=3) == "[1, 2, 3, ...]"
assert get_truncated_list_as_string([1, 2, 3, 4, 5], max_items=10) == "[1, 2, 3, 4, 5]"
with pytest.raises(ValueError):
get_truncated_list_as_string([1, 2, 3, 4, 5], max_items=-1)
with pytest.raises(ValueError):
get_truncated_list_as_string([1, 2, 3, 4, 5], max_items=0)