- 新增 ops 主服务(ops_service.go)和端口定义(ops_port.go) - 实现账号可用性检查服务(ops_account_availability.go) - 实现数据聚合服务(ops_aggregation_service.go) - 实现告警评估服务(ops_alert_evaluator_service.go) - 实现告警管理服务(ops_alerts.go) - 实现数据清理服务(ops_cleanup_service.go) - 实现并发控制服务(ops_concurrency.go) - 实现仪表板服务(ops_dashboard.go) - 实现错误处理服务(ops_errors.go) - 实现直方图服务(ops_histograms.go) - 实现指标采集服务(ops_metrics_collector.go) - 实现查询模式服务(ops_query_mode.go) - 实现实时监控服务(ops_realtime.go) - 实现请求详情服务(ops_request_details.go) - 实现重试机制服务(ops_retry.go) - 实现配置管理服务(ops_settings.go) - 实现趋势分析服务(ops_trends.go) - 实现窗口统计服务(ops_window_stats.go) - 添加 ops 相关领域常量 - 注册 service 依赖注入
258 lines
6.7 KiB
Go
258 lines
6.7 KiB
Go
package service
|
|
|
|
import (
|
|
"context"
|
|
"log"
|
|
"time"
|
|
|
|
"github.com/Wei-Shaw/sub2api/internal/pkg/pagination"
|
|
)
|
|
|
|
const (
	// opsAccountsPageSize is the page size requested from the account
	// repository when listing accounts for ops views.
	opsAccountsPageSize = 100

	// opsConcurrencyBatchChunkSize is the maximum number of accounts sent to
	// the concurrency service in a single batched load lookup.
	opsConcurrencyBatchChunkSize = 200
)
|
|
|
|
func (s *OpsService) listAllAccountsForOps(ctx context.Context, platformFilter string) ([]Account, error) {
|
|
if s == nil || s.accountRepo == nil {
|
|
return []Account{}, nil
|
|
}
|
|
|
|
out := make([]Account, 0, 128)
|
|
page := 1
|
|
for {
|
|
accounts, pageInfo, err := s.accountRepo.ListWithFilters(ctx, pagination.PaginationParams{
|
|
Page: page,
|
|
PageSize: opsAccountsPageSize,
|
|
}, platformFilter, "", "", "")
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
if len(accounts) == 0 {
|
|
break
|
|
}
|
|
|
|
out = append(out, accounts...)
|
|
if pageInfo != nil && int64(len(out)) >= pageInfo.Total {
|
|
break
|
|
}
|
|
if len(accounts) < opsAccountsPageSize {
|
|
break
|
|
}
|
|
|
|
page++
|
|
if page > 10_000 {
|
|
log.Printf("[Ops] listAllAccountsForOps: aborting after too many pages (platform=%q)", platformFilter)
|
|
break
|
|
}
|
|
}
|
|
|
|
return out, nil
|
|
}
|
|
|
|
func (s *OpsService) getAccountsLoadMapBestEffort(ctx context.Context, accounts []Account) map[int64]*AccountLoadInfo {
|
|
if s == nil || s.concurrencyService == nil {
|
|
return map[int64]*AccountLoadInfo{}
|
|
}
|
|
if len(accounts) == 0 {
|
|
return map[int64]*AccountLoadInfo{}
|
|
}
|
|
|
|
// De-duplicate IDs (and keep the max concurrency to avoid under-reporting).
|
|
unique := make(map[int64]int, len(accounts))
|
|
for _, acc := range accounts {
|
|
if acc.ID <= 0 {
|
|
continue
|
|
}
|
|
if prev, ok := unique[acc.ID]; !ok || acc.Concurrency > prev {
|
|
unique[acc.ID] = acc.Concurrency
|
|
}
|
|
}
|
|
|
|
batch := make([]AccountWithConcurrency, 0, len(unique))
|
|
for id, maxConc := range unique {
|
|
batch = append(batch, AccountWithConcurrency{
|
|
ID: id,
|
|
MaxConcurrency: maxConc,
|
|
})
|
|
}
|
|
|
|
out := make(map[int64]*AccountLoadInfo, len(batch))
|
|
for i := 0; i < len(batch); i += opsConcurrencyBatchChunkSize {
|
|
end := i + opsConcurrencyBatchChunkSize
|
|
if end > len(batch) {
|
|
end = len(batch)
|
|
}
|
|
part, err := s.concurrencyService.GetAccountsLoadBatch(ctx, batch[i:end])
|
|
if err != nil {
|
|
// Best-effort: return zeros rather than failing the ops UI.
|
|
log.Printf("[Ops] GetAccountsLoadBatch failed: %v", err)
|
|
continue
|
|
}
|
|
for k, v := range part {
|
|
out[k] = v
|
|
}
|
|
}
|
|
|
|
return out
|
|
}
|
|
|
|
// GetConcurrencyStats returns real-time concurrency usage aggregated by platform/group/account.
|
|
//
|
|
// Optional filters:
|
|
// - platformFilter: only include accounts in that platform (best-effort reduces DB load)
|
|
// - groupIDFilter: only include accounts that belong to that group
|
|
func (s *OpsService) GetConcurrencyStats(
|
|
ctx context.Context,
|
|
platformFilter string,
|
|
groupIDFilter *int64,
|
|
) (map[string]*PlatformConcurrencyInfo, map[int64]*GroupConcurrencyInfo, map[int64]*AccountConcurrencyInfo, *time.Time, error) {
|
|
if err := s.RequireMonitoringEnabled(ctx); err != nil {
|
|
return nil, nil, nil, nil, err
|
|
}
|
|
|
|
accounts, err := s.listAllAccountsForOps(ctx, platformFilter)
|
|
if err != nil {
|
|
return nil, nil, nil, nil, err
|
|
}
|
|
|
|
collectedAt := time.Now()
|
|
loadMap := s.getAccountsLoadMapBestEffort(ctx, accounts)
|
|
|
|
platform := make(map[string]*PlatformConcurrencyInfo)
|
|
group := make(map[int64]*GroupConcurrencyInfo)
|
|
account := make(map[int64]*AccountConcurrencyInfo)
|
|
|
|
for _, acc := range accounts {
|
|
if acc.ID <= 0 {
|
|
continue
|
|
}
|
|
|
|
var matchedGroup *Group
|
|
if groupIDFilter != nil && *groupIDFilter > 0 {
|
|
for _, grp := range acc.Groups {
|
|
if grp == nil || grp.ID <= 0 {
|
|
continue
|
|
}
|
|
if grp.ID == *groupIDFilter {
|
|
matchedGroup = grp
|
|
break
|
|
}
|
|
}
|
|
// Group filter provided: skip accounts not in that group.
|
|
if matchedGroup == nil {
|
|
continue
|
|
}
|
|
}
|
|
|
|
load := loadMap[acc.ID]
|
|
currentInUse := int64(0)
|
|
waiting := int64(0)
|
|
if load != nil {
|
|
currentInUse = int64(load.CurrentConcurrency)
|
|
waiting = int64(load.WaitingCount)
|
|
}
|
|
|
|
// Account-level view picks one display group (the first group).
|
|
displayGroupID := int64(0)
|
|
displayGroupName := ""
|
|
if matchedGroup != nil {
|
|
displayGroupID = matchedGroup.ID
|
|
displayGroupName = matchedGroup.Name
|
|
} else if len(acc.Groups) > 0 && acc.Groups[0] != nil {
|
|
displayGroupID = acc.Groups[0].ID
|
|
displayGroupName = acc.Groups[0].Name
|
|
}
|
|
|
|
if _, ok := account[acc.ID]; !ok {
|
|
info := &AccountConcurrencyInfo{
|
|
AccountID: acc.ID,
|
|
AccountName: acc.Name,
|
|
Platform: acc.Platform,
|
|
GroupID: displayGroupID,
|
|
GroupName: displayGroupName,
|
|
CurrentInUse: currentInUse,
|
|
MaxCapacity: int64(acc.Concurrency),
|
|
WaitingInQueue: waiting,
|
|
}
|
|
if info.MaxCapacity > 0 {
|
|
info.LoadPercentage = float64(info.CurrentInUse) / float64(info.MaxCapacity) * 100
|
|
}
|
|
account[acc.ID] = info
|
|
}
|
|
|
|
// Platform aggregation.
|
|
if acc.Platform != "" {
|
|
if _, ok := platform[acc.Platform]; !ok {
|
|
platform[acc.Platform] = &PlatformConcurrencyInfo{
|
|
Platform: acc.Platform,
|
|
}
|
|
}
|
|
p := platform[acc.Platform]
|
|
p.MaxCapacity += int64(acc.Concurrency)
|
|
p.CurrentInUse += currentInUse
|
|
p.WaitingInQueue += waiting
|
|
}
|
|
|
|
// Group aggregation (one account may contribute to multiple groups).
|
|
if matchedGroup != nil {
|
|
grp := matchedGroup
|
|
if _, ok := group[grp.ID]; !ok {
|
|
group[grp.ID] = &GroupConcurrencyInfo{
|
|
GroupID: grp.ID,
|
|
GroupName: grp.Name,
|
|
Platform: grp.Platform,
|
|
}
|
|
}
|
|
g := group[grp.ID]
|
|
if g.GroupName == "" && grp.Name != "" {
|
|
g.GroupName = grp.Name
|
|
}
|
|
if g.Platform != "" && grp.Platform != "" && g.Platform != grp.Platform {
|
|
// Groups are expected to be platform-scoped. If mismatch is observed, avoid misleading labels.
|
|
g.Platform = ""
|
|
}
|
|
g.MaxCapacity += int64(acc.Concurrency)
|
|
g.CurrentInUse += currentInUse
|
|
g.WaitingInQueue += waiting
|
|
} else {
|
|
for _, grp := range acc.Groups {
|
|
if grp == nil || grp.ID <= 0 {
|
|
continue
|
|
}
|
|
if _, ok := group[grp.ID]; !ok {
|
|
group[grp.ID] = &GroupConcurrencyInfo{
|
|
GroupID: grp.ID,
|
|
GroupName: grp.Name,
|
|
Platform: grp.Platform,
|
|
}
|
|
}
|
|
g := group[grp.ID]
|
|
if g.GroupName == "" && grp.Name != "" {
|
|
g.GroupName = grp.Name
|
|
}
|
|
if g.Platform != "" && grp.Platform != "" && g.Platform != grp.Platform {
|
|
// Groups are expected to be platform-scoped. If mismatch is observed, avoid misleading labels.
|
|
g.Platform = ""
|
|
}
|
|
g.MaxCapacity += int64(acc.Concurrency)
|
|
g.CurrentInUse += currentInUse
|
|
g.WaitingInQueue += waiting
|
|
}
|
|
}
|
|
}
|
|
|
|
for _, info := range platform {
|
|
if info.MaxCapacity > 0 {
|
|
info.LoadPercentage = float64(info.CurrentInUse) / float64(info.MaxCapacity) * 100
|
|
}
|
|
}
|
|
for _, info := range group {
|
|
if info.MaxCapacity > 0 {
|
|
info.LoadPercentage = float64(info.CurrentInUse) / float64(info.MaxCapacity) * 100
|
|
}
|
|
}
|
|
|
|
return platform, group, account, &collectedAt, nil
|
|
}
|