Inspeq AI
  • Introduction
  • Registration Process
  • Quickstart
  • Metrics
  • Benchmarking Results
  • Response Structure Details
  • Default Config
  • Root Cause Analysis (RCA)
  • On-Premise Deployment Overview
  • On-Premise AWS Deployment Guide
  • API Overview
  • Authentication
  • Endpoints
Powered by GitBook
On this page

Default Config

We use this default configuration to tag the results of metric evaluations. You can override it when calling the Inspeq eval methods.

{
  "global_communication_mode": "async",
  "auto_instrument_mode": 1,
  "evaluations": {
    "LLM": {
      "communication_mode": "sync",
      "auto_instrument_mode": 1,
      "configurations": {
        "answer_relevance_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Irrelevant Answer",
            "Marginally Relevant Answer",
            "Relevant Answer"
          ],
          "label_thresholds": [
            0,
            0.5,
            0.7,
            1
          ]
        },
        "answer_fluency_config": {
          "threshold": 0.5,
          "custom_labels": [
            "PASS",
            "FAIL"
          ],
          "label_thresholds": [
            0,
            0.5,
            1
          ]
        },
        "response_tone_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Negative",
            "Neutral",
            "Positive"
          ],
          "label_thresholds": [
            0,
            0.5,
            0.7,
            1
          ]
        },
        "factual_consistency_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Hallucinated",
            "Inconsistent",
            "Consistent"
          ],
          "label_thresholds": [
            0,
            0.5,
            0.7,
            1
          ]
        },
        "word_count_limit_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Failed",
            "Passed"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "do_not_use_keywords_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Failed",
            "Passed"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "coherence_config": {
          "threshold": 0.75,
          "custom_labels": [
            "Coherent",
            "Incoherent"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "bias_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Unbiased",
            "Biased"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "grammatical_correctness_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Incorrect",
            "Partially Correct",
            "Correct"
          ],
          "label_thresholds": [
            0,
            0.5,
            0.7,
            1
          ]
        },
        "conceptual_similarity_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Dissimilar",
            "Somewhat similar",
            "Similar"
          ],
          "label_thresholds": [
            0,
            0.5,
            0.7,
            1
          ]
        },
        "readability_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Sophisticated",
            "Moderate",
            "Easy"
          ],
          "label_thresholds": [
            0,
            0.3,
            0.6,
            1
          ]
        },
        "clarity_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Not Clear",
            "Partially Clear",
            "Clear"
          ],
          "label_thresholds": [
            0,
            0.5,
            0.74,
            1
          ]
        },
        "narrative_continuity_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Non Continuous",
            "Continuous"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "model_refusal_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Detected",
            "Not Detected"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "data_leakage_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Not Detected",
            "Detected"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "creativity_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Not Creative",
            "Creative"
          ],
          "label_thresholds": [
            0,
            0.5,
            1
          ]
        },
        "diversity_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Redundant",
            "Non Redundant"
          ],
          "label_thresholds": [
            0,
            0.41,
            1
          ]
        },
        "insecure_output_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Not Detected",
            "Detected"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "prompt_injection_config": {
          "threshold": 0.61,
          "custom_labels": [
            "Detected",
            "Not Detected"
          ],
          "label_thresholds": [
            0,
            0.61,
            1
          ]
        },
        "compression_score_config": {
          "threshold": 0.8,
          "custom_labels": [
            "Compact Summary",
            "Loose Summary"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "density_score_config": {
          "threshold": 0.2,
          "custom_labels": [
            "Verbose Summarization",
            "Concise Summarization"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "fuzzy_score_config": {
          "threshold": 0.8,
          "custom_labels": [
            "Well Aligned Summarization",
            "Misaligned Summarization"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "rouge_score_config": {
          "threshold": 0.8,
          "custom_labels": [
            "High Overlap",
            "Low Overlap"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "bleu_score_config": {
          "threshold": 0.8,
          "custom_labels": [
            "Highly Conforming",
            "Poorly Conforming"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "meteor_score_config": {
          "threshold": 0.8,
          "custom_labels": [
            "Semantically Accurate",
            "Semantically Drifting"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "bert_score_config": {
          "threshold": 0.8,
          "custom_labels": [
            "Linguistically Congruent",
            "Linguistically Incongruent"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "cosine_similarity_score_config": {
          "threshold": 0.2,
          "custom_labels": [
            "Contextual Synchrony",
            "Contextual Divergence"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "euclidean_distance_score_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Detected",
            "Not Detected"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "toxicity_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Not Detected",
            "Detected"
          ]
        },
        "invisible_text_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Not Detected",
            "Detected"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "get_sentence_embedding_score_config": {
          "threshold": 0.5,
          "custom_labels": [
            "Detected",
            "Not Detected"
          ],
          "label_thresholds": [
            0,
            1
          ]
        }
      }
    },
    "RAGS": {
      "communication_mode": "sync",
      "auto_instrument_mode": 1,
      "configurations": {
        "retrieval_relevance_config": {
          "threshold": 0.5,
          "custom_labels": [
            "relevant",
            "irrelevant"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "response_coherence_config": {
          "threshold": 0.5,
          "custom_labels": [
            "coherent",
            "incoherent"
          ],
          "label_thresholds": [
            0
          ]
        }
      }
    },
    "SQL": {
      "communication_mode": "async",
      "auto_instrument_mode": 1,
      "configurations": {
        "query_performance_config": {
          "threshold": 0.5,
          "custom_labels": [
            "efficient",
            "inefficient"
          ],
          "label_thresholds": [
            0,
            1
          ]
        },
        "data_security_config": {
          "threshold": 0.5,
          "custom_labels": [
            "secure",
            "insecure"
          ],
          "label_thresholds": [
            0,
            1
          ]
        }
      }
    }
  }
}
Previous: Response Structure Details | Next: Root Cause Analysis (RCA)

Last updated 3 months ago