llm_constant.py 3.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110
  1. from _decimal import Decimal
  2. models = {
  3. 'claude-instant-1': 'anthropic', # 100,000 tokens
  4. 'claude-2': 'anthropic', # 100,000 tokens
  5. 'gpt-4': 'openai', # 8,192 tokens
  6. 'gpt-4-32k': 'openai', # 32,768 tokens
  7. 'gpt-3.5-turbo': 'openai', # 4,096 tokens
  8. 'gpt-3.5-turbo-16k': 'openai', # 16384 tokens
  9. 'text-davinci-003': 'openai', # 4,097 tokens
  10. 'text-davinci-002': 'openai', # 4,097 tokens
  11. 'text-curie-001': 'openai', # 2,049 tokens
  12. 'text-babbage-001': 'openai', # 2,049 tokens
  13. 'text-ada-001': 'openai', # 2,049 tokens
  14. 'text-embedding-ada-002': 'openai', # 8191 tokens, 1536 dimensions
  15. 'whisper-1': 'openai'
  16. }
  17. max_context_token_length = {
  18. 'claude-instant-1': 100000,
  19. 'claude-2': 100000,
  20. 'gpt-4': 8192,
  21. 'gpt-4-32k': 32768,
  22. 'gpt-3.5-turbo': 4096,
  23. 'gpt-3.5-turbo-16k': 16384,
  24. 'text-davinci-003': 4097,
  25. 'text-davinci-002': 4097,
  26. 'text-curie-001': 2049,
  27. 'text-babbage-001': 2049,
  28. 'text-ada-001': 2049,
  29. 'text-embedding-ada-002': 8191,
  30. }
  31. models_by_mode = {
  32. 'chat': [
  33. 'claude-instant-1', # 100,000 tokens
  34. 'claude-2', # 100,000 tokens
  35. 'gpt-4', # 8,192 tokens
  36. 'gpt-4-32k', # 32,768 tokens
  37. 'gpt-3.5-turbo', # 4,096 tokens
  38. 'gpt-3.5-turbo-16k', # 16,384 tokens
  39. ],
  40. 'completion': [
  41. 'claude-instant-1', # 100,000 tokens
  42. 'claude-2', # 100,000 tokens
  43. 'gpt-4', # 8,192 tokens
  44. 'gpt-4-32k', # 32,768 tokens
  45. 'gpt-3.5-turbo', # 4,096 tokens
  46. 'gpt-3.5-turbo-16k', # 16,384 tokens
  47. 'text-davinci-003', # 4,097 tokens
  48. 'text-davinci-002' # 4,097 tokens
  49. 'text-curie-001', # 2,049 tokens
  50. 'text-babbage-001', # 2,049 tokens
  51. 'text-ada-001' # 2,049 tokens
  52. ],
  53. 'embedding': [
  54. 'text-embedding-ada-002' # 8191 tokens, 1536 dimensions
  55. ]
  56. }
  57. model_currency = 'USD'
  58. model_prices = {
  59. 'claude-instant-1': {
  60. 'prompt': Decimal('0.00163'),
  61. 'completion': Decimal('0.00551'),
  62. },
  63. 'claude-2': {
  64. 'prompt': Decimal('0.01102'),
  65. 'completion': Decimal('0.03268'),
  66. },
  67. 'gpt-4': {
  68. 'prompt': Decimal('0.03'),
  69. 'completion': Decimal('0.06'),
  70. },
  71. 'gpt-4-32k': {
  72. 'prompt': Decimal('0.06'),
  73. 'completion': Decimal('0.12')
  74. },
  75. 'gpt-3.5-turbo': {
  76. 'prompt': Decimal('0.0015'),
  77. 'completion': Decimal('0.002')
  78. },
  79. 'gpt-3.5-turbo-16k': {
  80. 'prompt': Decimal('0.003'),
  81. 'completion': Decimal('0.004')
  82. },
  83. 'text-davinci-003': {
  84. 'prompt': Decimal('0.02'),
  85. 'completion': Decimal('0.02')
  86. },
  87. 'text-curie-001': {
  88. 'prompt': Decimal('0.002'),
  89. 'completion': Decimal('0.002')
  90. },
  91. 'text-babbage-001': {
  92. 'prompt': Decimal('0.0005'),
  93. 'completion': Decimal('0.0005')
  94. },
  95. 'text-ada-001': {
  96. 'prompt': Decimal('0.0004'),
  97. 'completion': Decimal('0.0004')
  98. },
  99. 'text-embedding-ada-002': {
  100. 'usage': Decimal('0.0001'),
  101. }
  102. }
  103. agent_model_name = 'text-davinci-003'