p59 + p60

This commit is contained in:
team 1
2026-05-07 07:52:52 +02:00
parent 56646a0c3b
commit 87c2134e6c
20 changed files with 808 additions and 1256 deletions

View File

@@ -4,79 +4,22 @@
parameters:
retriex.governance.config:
regression_baseline:
protected_short_model_tokens:
- th
- tc
- tp
- tm
- ph
- rx
protected_measurement_values:
- '0,02'
- '0,05'
- '0,1'
- '0,25'
- '0,5'
- '1,0'
- '2,0'
- '2,5'
- '5,0'
protected_technical_prompt_keywords:
- testomat
- indikator
- grenzwert
- messbereich
- gemessen
technical_priority_required_markers:
- runner-up
- second-lowest
- comparison
protected_accessory_prompt_keywords:
- indikator
- reagenz
protected_search_repair_specificity_terms:
- indikator
- testomat
- reagenz
protected_retrieval_reagent_words:
- indikator
- reagenz
protected_retrieval_device_word_groups:
geraet:
- geraet
- gerät
shop_prompt_regression_original_query: 'testomat 808 0,02'
shop_prompt_required_output_instruction_markers:
- 'Output only the final search query.'
- 'Output format:'
shop_query_meta_guard_terms:
- shop
- suche
shop_query_context_fallback_filter_terms:
- welchem
- kann
- messen
shop_query_current_input_preservation_terms:
- ph
- redox
# Protected vocabulary tokens fall back to
# regression_baseline.protected_short_model_tokens.
# Add vocabulary.protected_short_model_tokens only for an explicit override.
protected_short_model_tokens: []
protected_measurement_values: []
protected_technical_prompt_keywords: []
technical_priority_required_markers: []
protected_accessory_prompt_keywords: []
protected_search_repair_specificity_terms: []
protected_retrieval_reagent_words: []
protected_retrieval_device_word_groups: {}
shop_prompt_regression_original_query: ''
shop_prompt_required_output_instruction_markers: []
shop_query_meta_guard_terms: []
shop_query_context_fallback_filter_terms: []
shop_query_current_input_preservation_terms: []
vocabulary: {}
language:
protected_stopword_terms:
- nicht
- kein
- keine
- welche
- testomat
- indikator
- indikatortyp
- ph
- rx
- th
- tc
- '0,02'
protected_stopword_terms: []
required_cleanup_profiles:
- commerce_query
- rag_evidence
@@ -131,30 +74,7 @@ parameters:
- in_array
- array_intersect
- array_intersect_key
domain_marker_terms:
- testomat
- indikator
- indikatortyp
- grenzwert
- messbereich
- reagenz
- reagens
- shop
- produkt
- artikel
- kaufen
- bestellen
- geraet
- gerät
- messgerät
- messgeraet
- analysegerät
- analysegeraet
- analysator
- wasserhärte
- wasserhaerte
- chlor
- redox
domain_marker_terms: []
allowed_literal_patterns:
- path: src/Knowledge/Retrieval/NdjsonChunkLookup.php
pattern: '/Produkt\\s\+Titel/iu'