p28
This commit is contained in:
@@ -208,6 +208,8 @@ parameters:
|
||||
|
||||
rag_evidence_guard:
|
||||
cleanup_profile: rag_evidence
|
||||
# Legacy/domain override list. Generic German stopwords are provided by
|
||||
# language cleanup profile `rag_evidence`. Keep RAG/product-role terms here.
|
||||
stop_terms:
|
||||
- suche
|
||||
- suchen
|
||||
@@ -215,24 +217,8 @@ parameters:
|
||||
- finden
|
||||
- zeige
|
||||
- einen
|
||||
- eine
|
||||
- einem
|
||||
- einer
|
||||
- der
|
||||
- die
|
||||
- das
|
||||
- den
|
||||
- dem
|
||||
- des
|
||||
- für
|
||||
- fuer
|
||||
- mit
|
||||
- ohne
|
||||
- und
|
||||
- oder
|
||||
- kann
|
||||
- können
|
||||
- koennen
|
||||
- messen
|
||||
- messung
|
||||
- tester
|
||||
@@ -466,19 +452,16 @@ parameters:
|
||||
- '/\b(?:indikator(?:typ)?|indicator(?:\s+type)?|reagenz(?:satz|typ)?|reagent(?:\s+set|\s+type)?|typ|type)\s+[A-Za-zÄÖÜäöüß]{0,8}\s*\d{1,5}(?:\s*[A-ZÄÖÜ]{1,4})?(?:\s*%)?\b/iu'
|
||||
meta_query_guard:
|
||||
enabled: true
|
||||
cleanup_profile: shop_context_fallback
|
||||
context_fallback_enabled: true
|
||||
context_fallback_question_limit: 12
|
||||
context_fallback_history_budget_chars: 20000
|
||||
context_fallback_use_full_history: true
|
||||
context_fallback_max_terms: 6
|
||||
# Legacy/domain override list. Generic stopwords, user-instruction
|
||||
# phrases and presentation terms are provided by profile
|
||||
# `shop_context_fallback`. Keep shop/price/domain terms here.
|
||||
context_fallback_filter_terms:
|
||||
- mit
|
||||
- tabelle
|
||||
- tabellarisch
|
||||
- übersicht
|
||||
- uebersicht
|
||||
- liste
|
||||
- auflistung
|
||||
- preis
|
||||
- preise
|
||||
- preisen
|
||||
@@ -492,8 +475,6 @@ parameters:
|
||||
- welches
|
||||
- welchem
|
||||
- welchen
|
||||
- ist
|
||||
- sind
|
||||
- gut
|
||||
- geeignet
|
||||
- was
|
||||
@@ -515,24 +496,15 @@ parameters:
|
||||
- nehmen
|
||||
- zur
|
||||
- zum
|
||||
- für
|
||||
- fuer
|
||||
- messen
|
||||
- gemessen
|
||||
meta_only_terms:
|
||||
- shop
|
||||
- tabelle
|
||||
- tabellarisch
|
||||
- übersicht
|
||||
- uebersicht
|
||||
- liste
|
||||
- auflistung
|
||||
- preis
|
||||
- preise
|
||||
- preisen
|
||||
- kosten
|
||||
- kostet
|
||||
- mit
|
||||
- shopsuche
|
||||
- shop-suche
|
||||
- suche
|
||||
@@ -542,22 +514,14 @@ parameters:
|
||||
- find
|
||||
- zeige
|
||||
- zeig
|
||||
- bitte
|
||||
- mal
|
||||
- im
|
||||
- in
|
||||
- nach
|
||||
- danach
|
||||
- dazu
|
||||
- damit
|
||||
- dafür
|
||||
- dafuer
|
||||
- hierzu
|
||||
- den
|
||||
- die
|
||||
- das
|
||||
- der
|
||||
- dem
|
||||
language_preservation:
|
||||
enabled: true
|
||||
language_markers:
|
||||
|
||||
@@ -21,14 +21,11 @@ parameters:
|
||||
- horiba
|
||||
- neomeris
|
||||
|
||||
# Legacy/domain override list. General user-instruction phrases are provided by
|
||||
# language cleanup profile `commerce_query`. Keep only commerce-specific or
|
||||
# historically sensitive phrases here.
|
||||
phrases_to_remove:
|
||||
- ich suche
|
||||
- suche
|
||||
- habt ihr
|
||||
- gibt es
|
||||
- gebe mir
|
||||
- gib mir
|
||||
- zeige mir
|
||||
- welches gerät
|
||||
- welche gerät
|
||||
- welches modell
|
||||
@@ -42,8 +39,6 @@ parameters:
|
||||
- welcher
|
||||
- welches
|
||||
- welchen
|
||||
- sind
|
||||
- ist
|
||||
- geeignet
|
||||
- geeigent
|
||||
- verfügbarkeit
|
||||
@@ -53,27 +48,17 @@ parameters:
|
||||
- kurze
|
||||
- ich
|
||||
|
||||
# Legacy/domain override list. Generic German stopwords and conversation
|
||||
# filler terms are provided by language cleanup profile `commerce_query`.
|
||||
filter_search_tokens:
|
||||
- auch
|
||||
- noch
|
||||
- nochmal
|
||||
- zusätzlich
|
||||
- dazu
|
||||
- davon
|
||||
- stattdessen
|
||||
- bitte
|
||||
- preiswerte
|
||||
- gern
|
||||
- lösung
|
||||
- eine
|
||||
- größer
|
||||
- würde
|
||||
- gerne
|
||||
- welchem
|
||||
- kann
|
||||
- mit
|
||||
- mein
|
||||
- größer
|
||||
- zeige
|
||||
- zeig
|
||||
- such
|
||||
@@ -81,33 +66,20 @@ parameters:
|
||||
- finde
|
||||
- find
|
||||
- mir
|
||||
- mal
|
||||
- von
|
||||
- im
|
||||
- in
|
||||
- für
|
||||
- fuer
|
||||
- welche
|
||||
- welcher
|
||||
- welches
|
||||
- welchen
|
||||
- sind
|
||||
- zur
|
||||
- ist
|
||||
- geeignet
|
||||
- geeigent
|
||||
- verfügbarkeit
|
||||
- verfuegbarkeit
|
||||
- prüfe
|
||||
- pruefe
|
||||
- den
|
||||
- die
|
||||
- das
|
||||
- der
|
||||
- dem
|
||||
- des
|
||||
- und
|
||||
- oder
|
||||
- sowie
|
||||
- seine
|
||||
- seinen
|
||||
@@ -129,8 +101,6 @@ parameters:
|
||||
- kostet
|
||||
- kosten
|
||||
- ua
|
||||
- ein
|
||||
- also
|
||||
- gut
|
||||
- gute
|
||||
- guten
|
||||
|
||||
@@ -68,10 +68,45 @@ parameters:
|
||||
protected_stopword_terms:
|
||||
- nicht
|
||||
- kein
|
||||
- keine
|
||||
- welche
|
||||
- testomat
|
||||
- indikator
|
||||
- indikatortyp
|
||||
- ph
|
||||
- rx
|
||||
- th
|
||||
- tc
|
||||
- '0,02'
|
||||
required_cleanup_profiles:
|
||||
- commerce_query
|
||||
- rag_evidence
|
||||
- shop_context_fallback
|
||||
required_profile_terms:
|
||||
commerce_query:
|
||||
stopwords:
|
||||
- der
|
||||
- mit
|
||||
- bitte
|
||||
phrases:
|
||||
- ich suche
|
||||
- suche im shop
|
||||
rag_evidence:
|
||||
stopwords:
|
||||
- der
|
||||
- mit
|
||||
- bitte
|
||||
shop_context_fallback:
|
||||
stopwords:
|
||||
- der
|
||||
- mit
|
||||
- bitte
|
||||
phrases:
|
||||
- zeige mir
|
||||
- suche im shop
|
||||
meta_terms:
|
||||
- tabelle
|
||||
- übersicht
|
||||
core_pattern_audit:
|
||||
source_roots:
|
||||
- src
|
||||
|
||||
@@ -53,12 +53,13 @@ parameters:
|
||||
|
||||
# Central language cleanup structure for RetrieX 1.5.3+.
|
||||
# Legacy key `words` above remains the runtime-compatible default list.
|
||||
# New cleanup profiles are introduced additively and are not yet wired into
|
||||
# Commerce/Agent runtime logic in this patch.
|
||||
# Cleanup profiles are the preferred home for generic language noise.
|
||||
# Domain configs should only keep domain-specific overrides.
|
||||
protected_terms:
|
||||
- nicht
|
||||
- kein
|
||||
- keine
|
||||
- welche
|
||||
- testomat
|
||||
- indikator
|
||||
- indikatortyp
|
||||
|
||||
Reference in New Issue
Block a user