chipling committed on
Commit
f7f5f3d
·
verified ·
1 Parent(s): af5e18d

Delete models/together

Browse files
models/together/__pycache__/main.cpython-312.pyc DELETED
Binary file (5.8 kB)
 
models/together/main.py DELETED
@@ -1,79 +0,0 @@
1
- import httpx
2
- import asyncio
3
-
4
- class TogetherAPI:
5
-
6
- cookies = {
7
- 'intercom-id-evnv2y8k': 'fea4d452-f9be-42e0-93e3-1e47a3836362',
8
- 'intercom-device-id-evnv2y8k': '2bb3e469-0159-4b6b-a33e-1aea4b51ccb1',
9
- '__stripe_mid': 'e0f7c1ba-56c6-44d4-ba1d-cf4611453eb43cf922',
10
- 'state-csrf': '6f2o8nqgee2dfqdmhaxipe',
11
- 'together_auth_cookie': '%7B%22expires%22%3A%222026-04-09T15%3A14%3A08.985Z%22%2C%22session%22%3A%220eae08c6fd1b79a22476a317d440a2104d74cd3ba333e40771b5ce50a90784297eb82eff36263debca2ee0658abe3e43cab97f87794421111d4bdec56b43dd2595ee22a165c123ba3d0f807759555b5f6d3f51b7c248e7cefcdf0f0b897f62b25b2a569e2cb89633032f15dca9818f39ed49f3ac2d7e0bc3d24517c62c78b1e4%22%7D',
12
- '__stripe_sid': '979e00a2-06ed-45be-9a95-88d7e7580f625ccce4',
13
- 'intercom-session-evnv2y8k': 'TzZzSzBNRG8xdHJtTVprMm1zUXFob0M2ekhFV3VmeDZFcW5UVldlYmFYc3RsRjFmdWJidjU1ZXVSZzNOSW9QTE82OUx6anlvMWVncmlTd2ZvOERDUXN4OUdoSEM5ZzRnQmh4d2o5S3JKeDA9LS00S3JOclNpNzU0VkVBaTNRNWhSMm93PT0=--2719775e99e920753d35527a45a6731bac5e8f8f',
14
- 'AMP_7112ee0414': 'JTdCJTIyZGV2aWNlSWQlMjIlM0ElMjJmY2ZmNjE3Ny00Yzg0LTRlOTItYTFhMC1kM2Y1ZjllOTFkYTglMjIlMkMlMjJ1c2VySWQlMjIlM0ElMjI2N2I1ZDkwNDNkZTIyN2Q0OGIzMWEwZTMlMjIlMkMlMjJzZXNzaW9uSWQlMjIlM0ExNzQ0MjExNjQyMjEwJTJDJTIyb3B0T3V0JTIyJTNBZmFsc2UlMkMlMjJsYXN0RXZlbnRUaW1lJTIyJTNBMTc0NDIxMTc1ODAwOSUyQyUyMmxhc3RFdmVudElkJTIyJTNBMjMyJTJDJTIycGFnZUNvdW50ZXIlMjIlM0E1JTdE',
15
- }
16
-
17
- headers = {
18
- 'accept': 'application/json',
19
- 'accept-language': 'en-US,en;q=0.9,ja;q=0.8',
20
- 'authorization': 'Bearer 4d900964e385651ea685af6f6cd5573a17b421f50657f73f903525177915a7e2',
21
- 'content-type': 'application/json',
22
- 'priority': 'u=1, i',
23
- 'sec-ch-ua': '"Google Chrome";v="135", "Not-A.Brand";v="8", "Chromium";v="135"',
24
- 'sec-ch-ua-mobile': '?0',
25
- 'sec-ch-ua-platform': '"macOS"',
26
- 'sec-fetch-dest': 'empty',
27
- 'sec-fetch-mode': 'cors',
28
- 'sec-fetch-site': 'same-origin',
29
- 'x-stainless-arch': 'unknown',
30
- 'x-stainless-lang': 'js',
31
- 'x-stainless-os': 'Unknown',
32
- 'x-stainless-package-version': '0.11.1',
33
- 'x-stainless-retry-count': '0',
34
- 'x-stainless-runtime': 'browser:chrome',
35
- 'x-stainless-runtime-version': '135.0.0',
36
- 'referer': 'https://api.together.ai/playground/v2/chat/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8',
37
- }
38
-
39
- def __init__(self):
40
- self.base_url = "https://api.together.ai/inference"
41
-
42
- def get_model_list(self):
43
- models = ['meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8', 'meta-llama/Llama-4-Scout-17B-16E-Instruct', 'deepseek-ai/DeepSeek-R1', 'deepseek-ai/DeepSeek-V3', 'Qwen/Qwen2.5-VL-72B-Instruct', 'google/gemma-2-27b-it']
44
- return models
45
-
46
- async def generate(self, json_data: dict):
47
- max_retries = 5
48
- for attempt in range(max_retries):
49
- async with httpx.AsyncClient(timeout=None) as client:
50
- try:
51
- request_ctx = client.stream(
52
- "POST",
53
- "https://api.together.ai/inference",
54
- cookies=TogetherAPI.cookies,
55
- headers=TogetherAPI.headers,
56
- json=json_data
57
- )
58
-
59
- async with request_ctx as response:
60
- if response.status_code == 200:
61
- async for line in response.aiter_lines():
62
- if line:
63
- yield f"{line}\n"
64
- return
65
- elif response.status_code == 429:
66
- if attempt < max_retries - 1:
67
- await asyncio.sleep(0.5)
68
- continue
69
- yield "data: [Rate limited, max retries]\n\n"
70
- return
71
- else:
72
- yield f"data: [Unexpected status code: {response.status_code}]\n\n"
73
- return
74
- except Exception as e:
75
- yield f"data: [Connection error: {str(e)}]\n\n"
76
- return
77
-
78
- yield "data: [Max retries reached]\n\n"
79
-