Spaces:

MyNameIsTatiBond
/

fraud-detector

Running

App Files Files Community

MyNameIsTatiBond committed 22 days ago

Commit

6697d65

1 Parent(s): ff34011

Refine SHAP explanations with value descriptors

Browse files

Files changed (2) hide show

app.py +45 -21
index.html +1 -1

app.py CHANGED Viewed

@@ -253,51 +253,75 @@ def get_readable_explanation(feature_name, shap_val, metadata=None):
 def get_nuanced_explanation(feature_name, shap_val, feature_val, metadata=None):
     """
-    Generate explanation with relative-to-typical context.
     """
     baseline_direction = "UP" if shap_val > 0 else "DOWN"
-    # Default Text
-    direction, text = get_readable_explanation(feature_name, shap_val, metadata)
-    # Trend Analysis
     if TREND_REGISTRY and feature_name in TREND_REGISTRY:
         try:
             entry = TREND_REGISTRY[feature_name]
             bins = entry["bins"]
             shaps = entry["shap_values"]
             ref_idx = entry.get("ref_idx", len(bins)//2)
             # Find current bin
-            # simple nearest neighbor in bins
-            # bins are sorted. np.searchsorted or just min dist
             curr_idx = (np.abs(np.array(bins) - feature_val)).argmin()
             curr_shap_med = shaps[curr_idx]
             ref_shap_med = shaps[ref_idx]
             typical_delta = curr_shap_med - ref_shap_med
-            # Threshold for "significant" relative difference?
-            # Let's say if abs delta > 0.0005 (small but real for SHAP probability)
             if typical_delta > 0.0005:
                 # Riskier than typical
-                if baseline_direction == "DOWN":
-                    text += ", but riskier than typical values"
-                else:
-                    text += " (high risk factor)"
             elif typical_delta < -0.0005:
                 # Safer than typical
-                if baseline_direction == "UP":
-                    text += ", but safer than typical values"
-                else:
-                    text += " (low risk factor)"
-        except Exception as e:
-            # Fallback to standard
             pass
-    return baseline_direction, text
 @app.get("/")
 async def root():

 def get_nuanced_explanation(feature_name, shap_val, feature_val, metadata=None):
     """
     Generate explanation with relative-to-typical context and value descriptors.

     When ``feature_name`` has an entry in ``TREND_REGISTRY`` and the median
     SHAP of the bin nearest to ``feature_val`` differs from the reference
     bin's median by more than the significance threshold, the text describes
     that trend and is prefixed with "Low " / "High " when the value sits in
     the bottom / top third of the entry's value range. Otherwise the text
     falls back to a plain statement based on the sign of ``shap_val``.

     Args:
         feature_name: Feature name; key into ``TREND_REGISTRY`` and ``metadata``.
         shap_val: SHAP value for the feature; only its sign is used.
         feature_val: Observed feature value. Missing, non-numeric, NaN or
             infinite values skip the trend analysis and use the fallback text.
         metadata: Optional mapping from feature name to a dict that may
             carry a ``"raw_feature"`` name used to look up the display label.

     Returns:
         Tuple ``(baseline_direction, full_text)`` where ``baseline_direction``
         is "UP" when ``shap_val > 0`` and "DOWN" otherwise.
     """
     # Minimum |delta| between bin medians that counts as a real difference.
     significance = 0.0005
     baseline_direction = "UP" if shap_val > 0 else "DOWN"
     # 1. Resolve the display label: FEATURE_MAP entry for the raw feature,
     #    else a title-cased version of the raw feature name.
     raw_feat = feature_name
     if metadata and feature_name in metadata:
         raw_feat = metadata[feature_name].get("raw_feature", feature_name)
     user_label = FEATURE_MAP.get(raw_feat, raw_feat.replace("_", " ").title())
     # 2. Trend analysis (best effort; any failure falls back to baseline text)
     trend_text = ""
     value_desc = ""
     if TREND_REGISTRY and feature_name in TREND_REGISTRY:
         try:
             entry = TREND_REGISTRY[feature_name]
             bins = entry["bins"]
             shaps = entry["shap_values"]
             ref_idx = entry.get("ref_idx", len(bins) // 2)
             min_val = entry.get("min_val", bins[0])
             max_val = entry.get("max_val", bins[-1])
             # A NaN/inf value would make every distance NaN/inf, and argmin
             # would then return bin 0, describing the wrong bin. Skip the
             # trend analysis for such values instead.
             if np.isfinite(feature_val):
                 # Nearest bin to the observed value
                 curr_idx = np.abs(np.array(bins) - feature_val).argmin()
                 typical_delta = shaps[curr_idx] - shaps[ref_idx]
                 # Value descriptor: relative position inside [min_val, max_val]
                 # (a range fraction, not a percentile). Values in the middle
                 # third get no prefix.
                 rng = max_val - min_val
                 if rng > 0:
                     rel_pos = (feature_val - min_val) / rng
                     if rel_pos < 0.33:
                         value_desc = "Low "
                     elif rel_pos > 0.66:
                         value_desc = "High "
                 if typical_delta > significance:
                     # Riskier than typical
                     trend_text = "associated with higher risk than average"
                 elif typical_delta < -significance:
                     # Safer than typical
                     trend_text = "associated with lower risk than average"
         except (KeyError, IndexError, TypeError, ValueError, AttributeError):
             # Malformed registry entry or unusable feature value: drop any
             # partial result so the baseline sentence below is used.
             trend_text = ""
             value_desc = ""
     # 3. Construct the final sentence
     if trend_text:
         # e.g. "Low Injury Cost Portion is associated with higher risk than average"
         full_text = f"{value_desc}{user_label} is {trend_text}"
     elif shap_val > 0:
         full_text = f"{user_label} contributes to risk"
     else:
         full_text = f"{user_label} reduces risk estimate"
     return baseline_direction, full_text
 @app.get("/")
 async def root():

index.html CHANGED Viewed

@@ -1283,7 +1283,7 @@
                              ${icon} ${directionText}
                         </div>
                         <div style="font-size: 12px; opacity: 0.6; font-style: italic;">
-                             Associated with ${isUp ? 'higher' : 'lower'} risk patterns
                         </div>
                      `;
                     list.appendChild(row);

                              ${icon} ${directionText}
                         </div>
                         <div style="font-size: 12px; opacity: 0.6; font-style: italic;">
+                             ${item.text}
                         </div>
                      `;
                     list.appendChild(row);