groq.go 2.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182
  1. package models
  2. const (
  3. ProviderGROQ ModelProvider = "groq"
  4. // GROQ
  5. QWENQwq ModelID = "qwen-qwq"
  6. // GROQ preview models
  7. Llama4Scout ModelID = "meta-llama/llama-4-scout-17b-16e-instruct"
  8. Llama4Maverick ModelID = "meta-llama/llama-4-maverick-17b-128e-instruct"
  9. Llama3_3_70BVersatile ModelID = "llama-3.3-70b-versatile"
  10. DeepseekR1DistillLlama70b ModelID = "deepseek-r1-distill-llama-70b"
  11. )
  12. var GroqModels = map[ModelID]Model{
  13. //
  14. // GROQ
  15. QWENQwq: {
  16. ID: QWENQwq,
  17. Name: "Qwen Qwq",
  18. Provider: ProviderGROQ,
  19. APIModel: "qwen-qwq-32b",
  20. CostPer1MIn: 0.29,
  21. CostPer1MInCached: 0.275,
  22. CostPer1MOutCached: 0.0,
  23. CostPer1MOut: 0.39,
  24. ContextWindow: 128_000,
  25. DefaultMaxTokens: 50000,
  26. // for some reason, the groq api doesn't like the reasoningEffort parameter
  27. CanReason: false,
  28. },
  29. Llama4Scout: {
  30. ID: Llama4Scout,
  31. Name: "Llama4Scout",
  32. Provider: ProviderGROQ,
  33. APIModel: "meta-llama/llama-4-scout-17b-16e-instruct",
  34. CostPer1MIn: 0.11,
  35. CostPer1MInCached: 0,
  36. CostPer1MOutCached: 0,
  37. CostPer1MOut: 0.34,
  38. ContextWindow: 128_000, // 10M when?
  39. },
  40. Llama4Maverick: {
  41. ID: Llama4Maverick,
  42. Name: "Llama4Maverick",
  43. Provider: ProviderGROQ,
  44. APIModel: "meta-llama/llama-4-maverick-17b-128e-instruct",
  45. CostPer1MIn: 0.20,
  46. CostPer1MInCached: 0,
  47. CostPer1MOutCached: 0,
  48. CostPer1MOut: 0.20,
  49. ContextWindow: 128_000,
  50. },
  51. Llama3_3_70BVersatile: {
  52. ID: Llama3_3_70BVersatile,
  53. Name: "Llama3_3_70BVersatile",
  54. Provider: ProviderGROQ,
  55. APIModel: "llama-3.3-70b-versatile",
  56. CostPer1MIn: 0.59,
  57. CostPer1MInCached: 0,
  58. CostPer1MOutCached: 0,
  59. CostPer1MOut: 0.79,
  60. ContextWindow: 128_000,
  61. },
  62. DeepseekR1DistillLlama70b: {
  63. ID: DeepseekR1DistillLlama70b,
  64. Name: "DeepseekR1DistillLlama70b",
  65. Provider: ProviderGROQ,
  66. APIModel: "deepseek-r1-distill-llama-70b",
  67. CostPer1MIn: 0.75,
  68. CostPer1MInCached: 0,
  69. CostPer1MOutCached: 0,
  70. CostPer1MOut: 0.99,
  71. ContextWindow: 128_000,
  72. CanReason: true,
  73. },
  74. }