# pricing.yaml
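# LLM pricing configuration
#
# Price unit: USD per 1M tokens
# Wildcards are supported: * matches any sequence of characters
#
# Fields:
#   model: model name (required)
#   input_price: price of input tokens (required)
#   output_price: price of output tokens (required)
#   reasoning_price: price of reasoning tokens (optional, defaults to output_price)
#   cache_creation_price: cache-write price (optional, defaults to input_price * 1.25)
#   cache_read_price: cache-read price (optional, defaults to input_price * 0.1)
#   provider: provider name (optional, used for grouping)
#   description: free-form description (optional)
#
# Usage:
#   1. Copy this file into the project root or the config/ directory
#   2. Or set the AGENT_PRICING_CONFIG environment variable to point at the config file
#   3. Adjust the prices to match the models you actually use
models: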
  # ===== OpenAI =====
  # OpenAI lists cached input tokens at 50% of the input price for the
  # caching-capable models below, so cache_read_price is set explicitly
  # rather than falling back to the default of input_price * 0.1, which
  # would under-price cache reads five-fold.
  - model: gpt-4o
    input_price: 2.50
    output_price: 10.00
    cache_read_price: 1.25  # 2.50 * 0.5
    provider: openai
  - model: gpt-4o-mini
    input_price: 0.15
    output_price: 0.60
    cache_read_price: 0.075  # 0.15 * 0.5
    provider: openai
  # NOTE(review): no cached-input rate is set for gpt-4-turbo; confirm
  # whether the consumer ever reports cached tokens for this model.
  - model: gpt-4-turbo
    input_price: 10.00
    output_price: 30.00
    provider: openai
  # o1 / o3 family (these models report reasoning tokens)
  - model: o1
    input_price: 15.00
    output_price: 60.00
    reasoning_price: 60.00  # reasoning tokens cost the same as output tokens
    cache_read_price: 7.50  # 15.00 * 0.5
    provider: openai
  - model: o1-mini
    input_price: 3.00
    output_price: 12.00
    reasoning_price: 12.00
    cache_read_price: 1.50  # 3.00 * 0.5
    provider: openai
  - model: o3-mini
    input_price: 1.10
    output_price: 4.40
    reasoning_price: 4.40
    cache_read_price: 0.55  # 1.10 * 0.5
    provider: openai
  # ===== Anthropic Claude =====
  # Claude supports prompt caching. Cache prices follow:
  #   - cache_creation: 1.25x input_price
  #   - cache_read: 0.1x input_price
  - model: claude-3-5-sonnet-20241022
    input_price: 3.00
    output_price: 15.00
    cache_creation_price: 3.75  # 3.00 * 1.25
    cache_read_price: 0.30  # 3.00 * 0.1
    provider: anthropic
  - model: claude-3-5-haiku-20241022
    input_price: 0.80
    output_price: 4.00
    cache_creation_price: 1.00  # 0.80 * 1.25
    cache_read_price: 0.08  # 0.80 * 0.1
    provider: anthropic
  - model: claude-3-opus-20240229
    input_price: 15.00
    output_price: 75.00
    cache_creation_price: 18.75  # 15.00 * 1.25
    cache_read_price: 1.50  # 15.00 * 0.1
    provider: anthropic
  # Opus 4 and Opus 4.1 are listed at 15.00 / 75.00, not the 5.00 / 25.00
  # carried by the claude-opus-4* wildcard further down, so they are pinned
  # by exact name here.
  # NOTE(review): assumes an exact model name takes precedence over a
  # wildcard entry, as the dated claude-3-5-sonnet entry above already
  # relies on -- confirm against the loader.
  - model: claude-opus-4-20250514
    input_price: 15.00
    output_price: 75.00
    cache_creation_price: 18.75  # 15.00 * 1.25
    cache_read_price: 1.50  # 15.00 * 0.1
    provider: anthropic
  - model: claude-opus-4-0
    input_price: 15.00
    output_price: 75.00
    cache_creation_price: 18.75  # 15.00 * 1.25
    cache_read_price: 1.50  # 15.00 * 0.1
    provider: anthropic
  - model: claude-opus-4-1-20250805
    input_price: 15.00
    output_price: 75.00
    cache_creation_price: 18.75  # 15.00 * 1.25
    cache_read_price: 1.50  # 15.00 * 0.1
    provider: anthropic
  - model: claude-opus-4-1
    input_price: 15.00
    output_price: 75.00
    cache_creation_price: 18.75  # 15.00 * 1.25
    cache_read_price: 1.50  # 15.00 * 0.1
    provider: anthropic
  # Claude wildcards (catch newer versions)
  - model: claude-3-5-sonnet*
    input_price: 3.00
    output_price: 15.00
    cache_creation_price: 3.75  # 3.00 * 1.25
    cache_read_price: 0.30  # 3.00 * 0.1
    provider: anthropic
  - model: claude-sonnet-4*
    input_price: 3.00
    output_price: 15.00
    cache_creation_price: 3.75  # 3.00 * 1.25
    cache_read_price: 0.30  # 3.00 * 0.1
    provider: anthropic
  - model: claude-opus-4*
    input_price: 5.00
    output_price: 25.00
    cache_creation_price: 6.25  # 5.00 * 1.25
    cache_read_price: 0.50  # 5.00 * 0.1
    provider: anthropic
  # ===== Google Gemini =====
  - model: gemini-2.5-pro
    input_price: 1.25
    output_price: 10.00
    reasoning_price: 10.00  # thinking mode
    provider: google
  # Without these exact entries the gemini-2.5* wildcard below would bill
  # the Flash tiers at Pro rates.
  # NOTE(review): assumes an exact model name takes precedence over a
  # wildcard entry -- confirm against the loader.
  - model: gemini-2.5-flash
    input_price: 0.30
    output_price: 2.50
    reasoning_price: 2.50  # thinking mode
    provider: google
  - model: gemini-2.5-flash-lite
    input_price: 0.10
    output_price: 0.40
    reasoning_price: 0.40  # thinking mode
    provider: google
  - model: gemini-2.0-flash
    input_price: 0.10
    output_price: 0.40
    provider: google
  - model: gemini-2.0-flash-thinking
    input_price: 0.10
    output_price: 0.40
    reasoning_price: 0.40
    provider: google
  - model: gemini-1.5-pro
    input_price: 1.25
    output_price: 5.00
    provider: google
  - model: gemini-1.5-flash
    input_price: 0.075
    output_price: 0.30
    provider: google
  # Gemini wildcards (fallback for names not listed above)
  - model: gemini-2.5*
    input_price: 1.25
    output_price: 10.00
    provider: google
  - model: gemini-2.0*
    input_price: 0.10
    output_price: 0.40
    provider: google
  # ===== DeepSeek =====
  # Chat model: no separate reasoning price, so reasoning_price falls back
  # to its documented default (output_price).
  - model: 'deepseek-chat'
    provider: deepseek
    input_price: 0.14
    output_price: 0.28
  # Reasoning models: reasoning tokens are priced the same as output tokens.
  - model: 'deepseek-reasoner'
    provider: deepseek
    input_price: 0.55
    output_price: 2.19
    reasoning_price: 2.19
  - model: 'deepseek-r1*'
    provider: deepseek
    input_price: 0.55
    output_price: 2.19
    reasoning_price: 2.19
  # ===== OpenRouter passthrough =====
  # OpenRouter names models as provider/model.
  - model: anthropic/claude-sonnet-4.5
    input_price: 3.00
    output_price: 15.00
    cache_creation_price: 3.75
    cache_read_price: 0.30
    provider: openrouter
  - model: anthropic/claude-opus-4.5
    input_price: 5.00
    output_price: 25.00
    cache_creation_price: 6.25
    cache_read_price: 0.50
    provider: openrouter
  - model: anthropic/claude-opus-4.6
    input_price: 5.00
    output_price: 25.00
    cache_creation_price: 6.25
    cache_read_price: 0.50
    provider: openrouter
  - model: anthropic/claude-haiku-4.5
    input_price: 1.00
    output_price: 5.00
    cache_creation_price: 1.25
    cache_read_price: 0.10
    provider: openrouter
  - model: anthropic/claude-sonnet-4
    input_price: 3.00
    output_price: 15.00
    cache_creation_price: 3.75
    cache_read_price: 0.30
    provider: openrouter
  # Fallback for any other Claude model routed through OpenRouter
  # (Sonnet-tier pricing).
  - model: anthropic/claude*
    input_price: 3.00
    output_price: 15.00
    cache_creation_price: 3.75
    cache_read_price: 0.30
    provider: openrouter
  # The openai/gpt-4o* and openai/o1* wildcards also match the -mini
  # variants, which would then be billed at the full-size model's rate.
  # The exact entries below mirror the native gpt-4o-mini and o1-mini prices.
  # NOTE(review): assumes an exact model name takes precedence over a
  # wildcard entry -- confirm against the loader.
  - model: openai/gpt-4o-mini
    input_price: 0.15
    output_price: 0.60
    provider: openrouter
  - model: openai/gpt-4o*
    input_price: 2.50
    output_price: 10.00
    provider: openrouter
  - model: openai/o1-mini
    input_price: 3.00
    output_price: 12.00
    reasoning_price: 12.00
    provider: openrouter
  - model: openai/o1*
    input_price: 15.00
    output_price: 60.00
    reasoning_price: 60.00
    provider: openrouter
  # Prices are written with two decimals throughout so every price field
  # loads as a float rather than a mix of ints and floats.
  - model: google/gemini-3-pro-preview
    input_price: 2.00
    output_price: 12.00
    reasoning_price: 12.00
    provider: openrouter
  - model: google/gemini-3-flash-preview
    input_price: 0.50
    output_price: 3.00
    reasoning_price: 3.00
    provider: openrouter
  # Fallback for any other Gemini model routed through OpenRouter.
  - model: google/gemini*
    input_price: 0.30
    output_price: 2.50
    reasoning_price: 2.50
    provider: openrouter
  - model: deepseek/deepseek-r1*
    input_price: 0.55
    output_price: 2.19
    reasoning_price: 2.19
    provider: openrouter
  # ===== Yescode proxy =====
  # Cache prices are spelled out: 1.25x input for writes, 0.1x for reads.
  - model: 'claude-sonnet-4.5'
    provider: yescode
    input_price: 3.00
    output_price: 15.00
    cache_creation_price: 3.75  # 3.00 * 1.25
    cache_read_price: 0.30  # 3.00 * 0.1