mirror of
https://github.com/YspCoder/clawgo.git
synced 2026-05-06 03:37:31 +08:00
inbound dedupe + ekg stratification: channel-level message_id dedupe and source/channel-separated ekg stats
This commit is contained in:
@@ -5,7 +5,9 @@ import (
|
||||
"fmt"
|
||||
"path/filepath"
|
||||
"strings"
|
||||
"sync"
|
||||
"sync/atomic"
|
||||
"time"
|
||||
|
||||
"clawgo/pkg/bus"
|
||||
"clawgo/pkg/logger"
|
||||
@@ -32,6 +34,8 @@ type BaseChannel struct {
|
||||
running atomic.Bool
|
||||
name string
|
||||
allowList []string
|
||||
recentMsgMu sync.Mutex
|
||||
recentMsg map[string]time.Time
|
||||
}
|
||||
|
||||
func NewBaseChannel(name string, config interface{}, bus *bus.MessageBus, allowList []string) *BaseChannel {
|
||||
@@ -40,6 +44,7 @@ func NewBaseChannel(name string, config interface{}, bus *bus.MessageBus, allowL
|
||||
bus: bus,
|
||||
name: name,
|
||||
allowList: allowList,
|
||||
recentMsg: map[string]time.Time{},
|
||||
}
|
||||
}
|
||||
|
||||
@@ -78,6 +83,29 @@ func (c *BaseChannel) IsAllowed(senderID string) bool {
|
||||
return false
|
||||
}
|
||||
|
||||
func (c *BaseChannel) isDuplicateInboundMessage(messageID string) bool {
|
||||
messageID = strings.TrimSpace(messageID)
|
||||
if messageID == "" {
|
||||
return false
|
||||
}
|
||||
now := time.Now()
|
||||
const ttl = 10 * time.Minute
|
||||
c.recentMsgMu.Lock()
|
||||
defer c.recentMsgMu.Unlock()
|
||||
for id, ts := range c.recentMsg {
|
||||
if now.Sub(ts) > ttl {
|
||||
delete(c.recentMsg, id)
|
||||
}
|
||||
}
|
||||
if ts, ok := c.recentMsg[messageID]; ok {
|
||||
if now.Sub(ts) <= ttl {
|
||||
return true
|
||||
}
|
||||
}
|
||||
c.recentMsg[messageID] = now
|
||||
return false
|
||||
}
|
||||
|
||||
func (c *BaseChannel) HandleMessage(senderID, chatID, content string, media []string, metadata map[string]string) {
|
||||
if !c.IsAllowed(senderID) {
|
||||
logger.WarnCF("channels", "Message rejected by allowlist", map[string]interface{}{
|
||||
@@ -88,6 +116,19 @@ func (c *BaseChannel) HandleMessage(senderID, chatID, content string, media []st
|
||||
return
|
||||
}
|
||||
|
||||
if metadata != nil {
|
||||
if messageID := strings.TrimSpace(metadata["message_id"]); messageID != "" {
|
||||
if c.isDuplicateInboundMessage(c.name + ":" + messageID) {
|
||||
logger.WarnCF("channels", "Duplicate inbound message skipped", map[string]interface{}{
|
||||
logger.FieldChannel: c.name,
|
||||
"message_id": messageID,
|
||||
logger.FieldChatID: chatID,
|
||||
})
|
||||
return
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Build session key: channel:chatID
|
||||
sessionKey := fmt.Sprintf("%s:%s", c.name, chatID)
|
||||
|
||||
|
||||
@@ -41,9 +41,6 @@ type FeishuChannel struct {
|
||||
tenantAccessToken string
|
||||
tenantTokenExpire time.Time
|
||||
tenantTokenErr error
|
||||
|
||||
recentMsgMu sync.Mutex
|
||||
recentMsg map[string]time.Time
|
||||
}
|
||||
|
||||
func (c *FeishuChannel) SupportsAction(action string) bool {
|
||||
@@ -62,7 +59,6 @@ func NewFeishuChannel(cfg config.FeishuConfig, bus *bus.MessageBus) (*FeishuChan
|
||||
BaseChannel: base,
|
||||
config: cfg,
|
||||
client: lark.NewClient(cfg.AppID, cfg.AppSecret),
|
||||
recentMsg: map[string]time.Time{},
|
||||
}, nil
|
||||
}
|
||||
|
||||
@@ -226,12 +222,6 @@ func (c *FeishuChannel) handleMessageReceive(ctx context.Context, event *larkim.
|
||||
if sender != nil && sender.TenantKey != nil {
|
||||
metadata["tenant_key"] = *sender.TenantKey
|
||||
}
|
||||
if messageID := metadata["message_id"]; messageID != "" {
|
||||
if c.isDuplicateInboundMessage(messageID) {
|
||||
logger.WarnCF("feishu", "Duplicate Feishu inbound message skipped", map[string]interface{}{"message_id": messageID, logger.FieldChatID: chatID})
|
||||
return nil
|
||||
}
|
||||
}
|
||||
|
||||
logger.InfoCF("feishu", "Feishu message received", map[string]interface{}{
|
||||
logger.FieldSenderID: senderID,
|
||||
@@ -332,29 +322,6 @@ func (c *FeishuChannel) isAllowedChat(chatID, chatType string) bool {
|
||||
return false
|
||||
}
|
||||
|
||||
func (c *FeishuChannel) isDuplicateInboundMessage(messageID string) bool {
|
||||
messageID = strings.TrimSpace(messageID)
|
||||
if messageID == "" {
|
||||
return false
|
||||
}
|
||||
now := time.Now()
|
||||
const ttl = 10 * time.Minute
|
||||
c.recentMsgMu.Lock()
|
||||
defer c.recentMsgMu.Unlock()
|
||||
for id, ts := range c.recentMsg {
|
||||
if now.Sub(ts) > ttl {
|
||||
delete(c.recentMsg, id)
|
||||
}
|
||||
}
|
||||
if ts, ok := c.recentMsg[messageID]; ok {
|
||||
if now.Sub(ts) <= ttl {
|
||||
return true
|
||||
}
|
||||
}
|
||||
c.recentMsg[messageID] = now
|
||||
return false
|
||||
}
|
||||
|
||||
func (c *FeishuChannel) shouldHandleGroupMessage(chatType, content string) bool {
|
||||
chatType = strings.ToLower(strings.TrimSpace(chatType))
|
||||
isGroup := chatType != "" && chatType != "p2p"
|
||||
|
||||
@@ -1637,8 +1637,18 @@ func (s *RegistryServer) handleWebUIEKGStats(w http.ResponseWriter, r *http.Requ
|
||||
if len(lines) > 3000 {
|
||||
lines = lines[len(lines)-3000:]
|
||||
}
|
||||
type kv struct {
|
||||
Key string `json:"key"`
|
||||
Score float64 `json:"score,omitempty"`
|
||||
Count int `json:"count,omitempty"`
|
||||
}
|
||||
providerScore := map[string]float64{}
|
||||
providerScoreWorkload := map[string]float64{}
|
||||
errSigCount := map[string]int{}
|
||||
errSigHeartbeat := map[string]int{}
|
||||
errSigWorkload := map[string]int{}
|
||||
sourceStats := map[string]int{}
|
||||
channelStats := map[string]int{}
|
||||
for _, ln := range lines {
|
||||
if strings.TrimSpace(ln) == "" {
|
||||
continue
|
||||
@@ -1650,40 +1660,52 @@ func (s *RegistryServer) handleWebUIEKGStats(w http.ResponseWriter, r *http.Requ
|
||||
provider := strings.TrimSpace(fmt.Sprintf("%v", row["provider"]))
|
||||
status := strings.ToLower(strings.TrimSpace(fmt.Sprintf("%v", row["status"])))
|
||||
errSig := strings.TrimSpace(fmt.Sprintf("%v", row["errsig"]))
|
||||
source := strings.ToLower(strings.TrimSpace(fmt.Sprintf("%v", row["source"])))
|
||||
channel := strings.ToLower(strings.TrimSpace(fmt.Sprintf("%v", row["channel"])))
|
||||
if source == "" {
|
||||
source = "unknown"
|
||||
}
|
||||
if channel == "" {
|
||||
channel = "unknown"
|
||||
}
|
||||
sourceStats[source]++
|
||||
channelStats[channel]++
|
||||
isHeartbeat := source == "heartbeat"
|
||||
if provider != "" {
|
||||
switch status {
|
||||
case "success":
|
||||
providerScore[provider] += 1
|
||||
if !isHeartbeat { providerScoreWorkload[provider] += 1 }
|
||||
case "suppressed":
|
||||
providerScore[provider] += 0.2
|
||||
if !isHeartbeat { providerScoreWorkload[provider] += 0.2 }
|
||||
case "error":
|
||||
providerScore[provider] -= 1
|
||||
if !isHeartbeat { providerScoreWorkload[provider] -= 1 }
|
||||
}
|
||||
}
|
||||
if errSig != "" {
|
||||
errSigCount[errSig]++
|
||||
if isHeartbeat {
|
||||
errSigHeartbeat[errSig]++
|
||||
} else {
|
||||
errSigWorkload[errSig]++
|
||||
}
|
||||
}
|
||||
}
|
||||
type kv struct {
|
||||
Key string `json:"key"`
|
||||
Score float64 `json:"score,omitempty"`
|
||||
Count int `json:"count,omitempty"`
|
||||
toTopScore := func(m map[string]float64, n int) []kv {
|
||||
out := make([]kv, 0, len(m))
|
||||
for k, v := range m { out = append(out, kv{Key:k, Score:v}) }
|
||||
sort.Slice(out, func(i,j int) bool { return out[i].Score > out[j].Score })
|
||||
if len(out) > n { out = out[:n] }
|
||||
return out
|
||||
}
|
||||
providerTop := make([]kv, 0, len(providerScore))
|
||||
for k, v := range providerScore {
|
||||
providerTop = append(providerTop, kv{Key: k, Score: v})
|
||||
}
|
||||
sort.Slice(providerTop, func(i, j int) bool { return providerTop[i].Score > providerTop[j].Score })
|
||||
if len(providerTop) > 5 {
|
||||
providerTop = providerTop[:5]
|
||||
}
|
||||
errTop := make([]kv, 0, len(errSigCount))
|
||||
for k, v := range errSigCount {
|
||||
errTop = append(errTop, kv{Key: k, Count: v})
|
||||
}
|
||||
sort.Slice(errTop, func(i, j int) bool { return errTop[i].Count > errTop[j].Count })
|
||||
if len(errTop) > 5 {
|
||||
errTop = errTop[:5]
|
||||
toTopCount := func(m map[string]int, n int) []kv {
|
||||
out := make([]kv, 0, len(m))
|
||||
for k, v := range m { out = append(out, kv{Key:k, Count:v}) }
|
||||
sort.Slice(out, func(i,j int) bool { return out[i].Count > out[j].Count })
|
||||
if len(out) > n { out = out[:n] }
|
||||
return out
|
||||
}
|
||||
escalations := 0
|
||||
tasksPath := filepath.Join(workspace, "memory", "tasks.json")
|
||||
@@ -1698,10 +1720,15 @@ func (s *RegistryServer) handleWebUIEKGStats(w http.ResponseWriter, r *http.Requ
|
||||
}
|
||||
}
|
||||
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
||||
"ok": true,
|
||||
"provider_top": providerTop,
|
||||
"errsig_top": errTop,
|
||||
"escalation_count": escalations,
|
||||
"ok": true,
|
||||
"provider_top": toTopScore(providerScore, 5),
|
||||
"provider_top_workload": toTopScore(providerScoreWorkload, 5),
|
||||
"errsig_top": toTopCount(errSigCount, 5),
|
||||
"errsig_top_heartbeat": toTopCount(errSigHeartbeat, 5),
|
||||
"errsig_top_workload": toTopCount(errSigWorkload, 5),
|
||||
"source_stats": sourceStats,
|
||||
"channel_stats": channelStats,
|
||||
"escalation_count": escalations,
|
||||
})
|
||||
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user