test-ragp / src /rag_pipelines /prompts /retrieval_critic.py

Upload 107 files

336f4a9 verified 9 months ago

5.53 kB

	from typing import Literal

	from pydantic import BaseModel, Field, field_validator

	RETRIEVAL_CRITIC_PROMPT = """You are a senior researcher evaluating document support quality. Follow these steps:

	1. Answer Requirements: Identify exact claims needed for complete answer
	2. Claim Verification: Check document's direct evidence for each requirement
	3. Evidence Strength: Assess quality/reliability of supporting facts
	4. Completeness Check: Identify missing elements or partial coverage
	5. Support Synthesis: Combine analysis into final support classification

	Question: {question}

	Document Excerpt: {context}

	Provide detailed reasoning through all steps, then state final decision as either:
	- "fully-supported" (covers all requirements with strong evidence)
	- "partially-supported" (covers some requirements or weak evidence)
	- "no-support" (contains no usable evidence)"""


	class RetrievalCriticResult(BaseModel):
	"""Structured evaluation of a document's ability to support answering a query.

	Validates that the reasoning chain contains all required analytical steps and that
	the final decision matches one of the predefined support classifications.

	Attributes:
	reasoning_chain (str): Step-by-step analysis through verification stages.
	Must contain all required section headers.
	decision (Literal["fully-supported", "partially-supported", "no-support"]):
	Final classification of document support quality.

	Raises:
	ValueError: If reasoning chain is missing required sections or is too short
	ValidationError: If decision value doesn't match allowed literals

	Example:
	>>> valid_result = RetrievalCriticResult(
	... reasoning_chain=(
	... "1. Answer Requirements: Needs 3 climate change impacts"
	... "2. Claim Verification: Documents sea level rise data"
	... "3. Evidence Strength: IPCC report citations provided"
	... "4. Completeness Check: Missing economic impact analysis"
	... "5. Support Synthesis: Covers 2/3 required impact areas"
	... ),
	... decision="partially-supported"
	... )
	>>> valid_result.decision
	'partially-supported'
	"""

	reasoning_chain: str = Field(
	...,
	description=(
	"Systematic analysis through verification stages. Must contain:\n"
	"- 1. Answer Requirements: Identification of needed claims\n"
	"- 2. Claim Verification: Document evidence checking\n"
	"- 3. Evidence Strength: Quality assessment of sources\n"
	"- 4. Completeness Check: Missing elements analysis\n"
	"- 5. Support Synthesis: Final classification rationale"
	),
	)
	decision: Literal["fully-supported", "partially-supported", "no-support"] = Field(
	...,
	description=(
	"Final classification of document's support quality:\n"
	"- 'fully-supported': Comprehensive evidence for all requirements\n"
	"- 'partially-supported': Partial or weak evidence coverage\n"
	"- 'no-support': No usable evidence found"
	),
	)

	@field_validator("reasoning_chain")
	@classmethod
	def validate_reasoning_steps(cls, chain_to_validate: str) -> str:
	"""Validate the structure and completeness of the analytical reasoning chain.

	Ensures the reasoning chain contains all required section headers and meets
	minimum length requirements for meaningful analysis.

	Args:
	chain_to_validate (str): The raw reasoning chain text to validate

	Returns:
	str: The validated reasoning chain if all requirements are met

	Raises:
	ValueError: If any required section headers are missing from the chain

	Example:
	>>> valid_chain = (
	... "1. Answer Requirements: Needs 5 economic indicators"
	... "2. Claim Verification: GDP data verified"
	... "3. Evidence Strength: Government reports cited"
	... "4. Completeness Check: Missing unemployment figures"
	... "5. Support Synthesis: Covers 4/5 required indicators"
	... )
	>>> RetrievalCriticResult.validate_reasoning_steps(valid_chain)
	'1. Answer Requirements: Needs 5 economic indicators...'
	"""
	required_steps = [
	"1. Answer Requirements",
	"2. Claim Verification",
	"3. Evidence Strength",
	"4. Completeness Check",
	"5. Support Synthesis",
	]

	missing: list[str] = [step for step in required_steps if step not in chain_to_validate]
	if missing:
	msg = f"Missing required analysis steps: {missing}"
	raise ValueError(msg)
	return chain_to_validate

	model_config = {
	"json_schema_extra": {
	"example": {
	"reasoning_chain": (
	"1. Answer Requirements: Needs 3 main battery innovations\n"
	"2. Claim Verification: Documents solid-state and lithium-air tech\n"
	"3. Evidence Strength: Peer-reviewed study citations\n"
	"4. Completeness Check: Missing third innovation details\n"
	"5. Support Synthesis: Strong evidence for 2/3 requirements"
	),
	"decision": "partially-supported",
	}
	}
	}