relay-claude_test.go 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305
  1. package claude
  2. import (
  3. "strings"
  4. "testing"
  5. "github.com/QuantumNous/new-api/dto"
  6. )
  7. func TestFormatClaudeResponseInfo_MessageStart(t *testing.T) {
  8. claudeInfo := &ClaudeResponseInfo{
  9. Usage: &dto.Usage{},
  10. }
  11. claudeResponse := &dto.ClaudeResponse{
  12. Type: "message_start",
  13. Message: &dto.ClaudeMediaMessage{
  14. Id: "msg_123",
  15. Model: "claude-3-5-sonnet",
  16. Usage: &dto.ClaudeUsage{
  17. InputTokens: 100,
  18. OutputTokens: 1,
  19. CacheCreationInputTokens: 50,
  20. CacheReadInputTokens: 30,
  21. },
  22. },
  23. }
  24. ok := FormatClaudeResponseInfo(claudeResponse, nil, claudeInfo)
  25. if !ok {
  26. t.Fatal("expected true")
  27. }
  28. if claudeInfo.Usage.PromptTokens != 100 {
  29. t.Errorf("PromptTokens = %d, want 100", claudeInfo.Usage.PromptTokens)
  30. }
  31. if claudeInfo.Usage.PromptTokensDetails.CachedTokens != 30 {
  32. t.Errorf("CachedTokens = %d, want 30", claudeInfo.Usage.PromptTokensDetails.CachedTokens)
  33. }
  34. if claudeInfo.Usage.PromptTokensDetails.CachedCreationTokens != 50 {
  35. t.Errorf("CachedCreationTokens = %d, want 50", claudeInfo.Usage.PromptTokensDetails.CachedCreationTokens)
  36. }
  37. if claudeInfo.ResponseId != "msg_123" {
  38. t.Errorf("ResponseId = %s, want msg_123", claudeInfo.ResponseId)
  39. }
  40. if claudeInfo.Model != "claude-3-5-sonnet" {
  41. t.Errorf("Model = %s, want claude-3-5-sonnet", claudeInfo.Model)
  42. }
  43. }
  44. func TestFormatClaudeResponseInfo_MessageDelta_FullUsage(t *testing.T) {
  45. // message_start 先积累 usage
  46. claudeInfo := &ClaudeResponseInfo{
  47. Usage: &dto.Usage{
  48. PromptTokens: 100,
  49. PromptTokensDetails: dto.InputTokenDetails{
  50. CachedTokens: 30,
  51. CachedCreationTokens: 50,
  52. },
  53. CompletionTokens: 1,
  54. },
  55. }
  56. // message_delta 带完整 usage(原生 Anthropic 场景)
  57. claudeResponse := &dto.ClaudeResponse{
  58. Type: "message_delta",
  59. Usage: &dto.ClaudeUsage{
  60. InputTokens: 100,
  61. OutputTokens: 200,
  62. CacheCreationInputTokens: 50,
  63. CacheReadInputTokens: 30,
  64. },
  65. }
  66. ok := FormatClaudeResponseInfo(claudeResponse, nil, claudeInfo)
  67. if !ok {
  68. t.Fatal("expected true")
  69. }
  70. if claudeInfo.Usage.PromptTokens != 100 {
  71. t.Errorf("PromptTokens = %d, want 100", claudeInfo.Usage.PromptTokens)
  72. }
  73. if claudeInfo.Usage.CompletionTokens != 200 {
  74. t.Errorf("CompletionTokens = %d, want 200", claudeInfo.Usage.CompletionTokens)
  75. }
  76. if claudeInfo.Usage.TotalTokens != 300 {
  77. t.Errorf("TotalTokens = %d, want 300", claudeInfo.Usage.TotalTokens)
  78. }
  79. if !claudeInfo.Done {
  80. t.Error("expected Done = true")
  81. }
  82. }
  83. func TestFormatClaudeResponseInfo_MessageDelta_OnlyOutputTokens(t *testing.T) {
  84. // 模拟 Bedrock: message_start 已积累 usage
  85. claudeInfo := &ClaudeResponseInfo{
  86. Usage: &dto.Usage{
  87. PromptTokens: 100,
  88. PromptTokensDetails: dto.InputTokenDetails{
  89. CachedTokens: 30,
  90. CachedCreationTokens: 50,
  91. },
  92. CompletionTokens: 1,
  93. ClaudeCacheCreation5mTokens: 10,
  94. ClaudeCacheCreation1hTokens: 20,
  95. },
  96. }
  97. // Bedrock 的 message_delta 只有 output_tokens,缺少 input_tokens 和 cache 字段
  98. claudeResponse := &dto.ClaudeResponse{
  99. Type: "message_delta",
  100. Usage: &dto.ClaudeUsage{
  101. OutputTokens: 200,
  102. // InputTokens, CacheCreationInputTokens, CacheReadInputTokens 都是 0
  103. },
  104. }
  105. ok := FormatClaudeResponseInfo(claudeResponse, nil, claudeInfo)
  106. if !ok {
  107. t.Fatal("expected true")
  108. }
  109. // PromptTokens 应保持 message_start 的值(因为 message_delta 的 InputTokens=0,不更新)
  110. if claudeInfo.Usage.PromptTokens != 100 {
  111. t.Errorf("PromptTokens = %d, want 100", claudeInfo.Usage.PromptTokens)
  112. }
  113. if claudeInfo.Usage.CompletionTokens != 200 {
  114. t.Errorf("CompletionTokens = %d, want 200", claudeInfo.Usage.CompletionTokens)
  115. }
  116. if claudeInfo.Usage.TotalTokens != 300 {
  117. t.Errorf("TotalTokens = %d, want 300", claudeInfo.Usage.TotalTokens)
  118. }
  119. // cache 字段应保持 message_start 的值
  120. if claudeInfo.Usage.PromptTokensDetails.CachedTokens != 30 {
  121. t.Errorf("CachedTokens = %d, want 30", claudeInfo.Usage.PromptTokensDetails.CachedTokens)
  122. }
  123. if claudeInfo.Usage.PromptTokensDetails.CachedCreationTokens != 50 {
  124. t.Errorf("CachedCreationTokens = %d, want 50", claudeInfo.Usage.PromptTokensDetails.CachedCreationTokens)
  125. }
  126. if claudeInfo.Usage.ClaudeCacheCreation5mTokens != 10 {
  127. t.Errorf("ClaudeCacheCreation5mTokens = %d, want 10", claudeInfo.Usage.ClaudeCacheCreation5mTokens)
  128. }
  129. if claudeInfo.Usage.ClaudeCacheCreation1hTokens != 20 {
  130. t.Errorf("ClaudeCacheCreation1hTokens = %d, want 20", claudeInfo.Usage.ClaudeCacheCreation1hTokens)
  131. }
  132. if !claudeInfo.Done {
  133. t.Error("expected Done = true")
  134. }
  135. }
  136. func TestFormatClaudeResponseInfo_NilClaudeInfo(t *testing.T) {
  137. claudeResponse := &dto.ClaudeResponse{Type: "message_start"}
  138. ok := FormatClaudeResponseInfo(claudeResponse, nil, nil)
  139. if ok {
  140. t.Error("expected false for nil claudeInfo")
  141. }
  142. }
  143. func TestFormatClaudeResponseInfo_ContentBlockDelta(t *testing.T) {
  144. text := "hello"
  145. claudeInfo := &ClaudeResponseInfo{
  146. Usage: &dto.Usage{},
  147. ResponseText: strings.Builder{},
  148. }
  149. claudeResponse := &dto.ClaudeResponse{
  150. Type: "content_block_delta",
  151. Delta: &dto.ClaudeMediaMessage{
  152. Text: &text,
  153. },
  154. }
  155. ok := FormatClaudeResponseInfo(claudeResponse, nil, claudeInfo)
  156. if !ok {
  157. t.Fatal("expected true")
  158. }
  159. if claudeInfo.ResponseText.String() != "hello" {
  160. t.Errorf("ResponseText = %q, want %q", claudeInfo.ResponseText.String(), "hello")
  161. }
  162. }
  163. // TestEnrichMessageDeltaUsage 测试 message_delta 事件的 usage 补全逻辑
  164. // 这是修复 issue #2881 的核心逻辑:当上游(如 Bedrock)的 message_delta 缺少
  165. // input_tokens 和 cache 相关字段时,用 claudeInfo 中积累的数据补全
  166. func TestEnrichMessageDeltaUsage(t *testing.T) {
  167. tests := []struct {
  168. name string
  169. claudeInfo *ClaudeResponseInfo
  170. deltaUsage *dto.ClaudeUsage
  171. wantInput int
  172. wantCacheRead int
  173. wantCacheCreate int
  174. wantOutput int
  175. want5m int
  176. want1h int
  177. }{
  178. {
  179. name: "Bedrock: delta 只有 output_tokens,从 claudeInfo 补全其他字段",
  180. claudeInfo: &ClaudeResponseInfo{
  181. Usage: &dto.Usage{
  182. PromptTokens: 100,
  183. PromptTokensDetails: dto.InputTokenDetails{
  184. CachedTokens: 30,
  185. CachedCreationTokens: 50,
  186. },
  187. ClaudeCacheCreation5mTokens: 10,
  188. ClaudeCacheCreation1hTokens: 20,
  189. },
  190. },
  191. deltaUsage: &dto.ClaudeUsage{OutputTokens: 200},
  192. wantInput: 100,
  193. wantCacheRead: 30,
  194. wantCacheCreate: 50,
  195. wantOutput: 200,
  196. want5m: 10,
  197. want1h: 20,
  198. },
  199. {
  200. name: "原生 Anthropic: delta 已包含所有字段,不覆盖",
  201. claudeInfo: &ClaudeResponseInfo{
  202. Usage: &dto.Usage{
  203. PromptTokens: 100,
  204. PromptTokensDetails: dto.InputTokenDetails{
  205. CachedTokens: 30,
  206. CachedCreationTokens: 50,
  207. },
  208. },
  209. },
  210. deltaUsage: &dto.ClaudeUsage{
  211. InputTokens: 100,
  212. OutputTokens: 200,
  213. CacheReadInputTokens: 30,
  214. CacheCreationInputTokens: 50,
  215. },
  216. wantInput: 100,
  217. wantCacheRead: 30,
  218. wantCacheCreate: 50,
  219. wantOutput: 200,
  220. },
  221. {
  222. name: "delta usage 为 nil,创建并补全",
  223. claudeInfo: &ClaudeResponseInfo{
  224. Usage: &dto.Usage{
  225. PromptTokens: 80,
  226. PromptTokensDetails: dto.InputTokenDetails{
  227. CachedTokens: 20,
  228. CachedCreationTokens: 40,
  229. },
  230. },
  231. },
  232. deltaUsage: nil,
  233. wantInput: 80,
  234. wantCacheRead: 20,
  235. wantCacheCreate: 40,
  236. wantOutput: 0,
  237. },
  238. {
  239. name: "没有 cache 数据,不补全",
  240. claudeInfo: &ClaudeResponseInfo{
  241. Usage: &dto.Usage{
  242. PromptTokens: 100,
  243. },
  244. },
  245. deltaUsage: &dto.ClaudeUsage{OutputTokens: 50},
  246. wantInput: 100,
  247. wantCacheRead: 0,
  248. wantCacheCreate: 0,
  249. wantOutput: 50,
  250. },
  251. }
  252. for _, tt := range tests {
  253. t.Run(tt.name, func(t *testing.T) {
  254. claudeResponse := &dto.ClaudeResponse{
  255. Type: "message_delta",
  256. Usage: tt.deltaUsage,
  257. }
  258. // 模拟 HandleStreamResponseData 中 Claude 格式的补全逻辑
  259. enrichMessageDeltaUsage(claudeResponse, tt.claudeInfo)
  260. if claudeResponse.Usage == nil {
  261. t.Fatal("Usage should not be nil after enrichment")
  262. }
  263. if claudeResponse.Usage.InputTokens != tt.wantInput {
  264. t.Errorf("InputTokens = %d, want %d", claudeResponse.Usage.InputTokens, tt.wantInput)
  265. }
  266. if claudeResponse.Usage.CacheReadInputTokens != tt.wantCacheRead {
  267. t.Errorf("CacheReadInputTokens = %d, want %d", claudeResponse.Usage.CacheReadInputTokens, tt.wantCacheRead)
  268. }
  269. if claudeResponse.Usage.CacheCreationInputTokens != tt.wantCacheCreate {
  270. t.Errorf("CacheCreationInputTokens = %d, want %d", claudeResponse.Usage.CacheCreationInputTokens, tt.wantCacheCreate)
  271. }
  272. if claudeResponse.Usage.OutputTokens != tt.wantOutput {
  273. t.Errorf("OutputTokens = %d, want %d", claudeResponse.Usage.OutputTokens, tt.wantOutput)
  274. }
  275. if tt.want5m > 0 || tt.want1h > 0 {
  276. if claudeResponse.Usage.CacheCreation == nil {
  277. t.Fatal("CacheCreation should not be nil")
  278. }
  279. if claudeResponse.Usage.CacheCreation.Ephemeral5mInputTokens != tt.want5m {
  280. t.Errorf("Ephemeral5mInputTokens = %d, want %d", claudeResponse.Usage.CacheCreation.Ephemeral5mInputTokens, tt.want5m)
  281. }
  282. if claudeResponse.Usage.CacheCreation.Ephemeral1hInputTokens != tt.want1h {
  283. t.Errorf("Ephemeral1hInputTokens = %d, want %d", claudeResponse.Usage.CacheCreation.Ephemeral1hInputTokens, tt.want1h)
  284. }
  285. }
  286. })
  287. }
  288. }