-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathbilling.py
More file actions
288 lines (245 loc) · 8.8 KB
/
billing.py
File metadata and controls
288 lines (245 loc) · 8.8 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
# billing.py
from __future__ import annotations
from datetime import datetime, timedelta
from decimal import Decimal
from typing import Any, Dict
from fastapi import HTTPException
from sqlalchemy import select
from sqlalchemy.ext.asyncio import AsyncSession
from models import (
User,
Project,
ProjectShare,
ProjectAllowance,
AllowanceInterval,
ModelPricing,
ModelType,
UsageLog,
CreditLedger, # <-- ADDED: to write ledger rows
)
# ---------------------- Utilities ----------------------
def approx_tokens_from_text(text: str) -> int:
    """
    Estimate the token count of `text` for billing previews.

    Heuristic: one token per 4 characters (fraction truncated) plus one extra
    per space character. Non-empty text always counts as at least 1 token;
    empty or missing text counts as 0.
    """
    if text:
        by_length = int(len(text) / 4)
        space_overhead = text.count(" ")
        return max(1, by_length + space_overhead)
    return 0
async def log_usage(
    session: AsyncSession,
    user: User,
    model: str,
    provider: str,
    model_type: ModelType,
    input_count: int,
    output_count: int,
    billed_credits: Decimal,
    request_meta: Dict[str, Any] | None = None,
    response_meta: Dict[str, Any] | None = None,
):
    """
    Stage a UsageLog row for one billed request.

    The row is only added to `session`; this function neither flushes nor
    commits. Missing values are normalised: counts fall back to 0, the billed
    amount to Decimal("0"), and the meta payloads to empty dicts.
    """
    # Round-trip through str so a float amount keeps its printed value
    # instead of its exact binary expansion.
    billed = Decimal(str(billed_credits or 0))
    tokens_in = input_count or 0
    tokens_out = output_count or 0

    entry = UsageLog(
        user_id=user.id,
        provider=provider,
        model=model,
        model_type=model_type,
        input_count=tokens_in,
        output_count=tokens_out,
        billed_credits=billed,
        request_meta=request_meta or {},
        response_meta=response_meta or {},
    )
    session.add(entry)
# ---------------------- Ledger helper (ADDED) ----------------------
async def _log_ledger(
    session: AsyncSession, *,
    user_id: int,
    delta: Decimal,
    reason: str
) -> None:
    """
    Stage one CreditLedger row on `session` (no flush, no commit).

    Intended to be called only when user.credits actually changes; `delta`
    is the signed change and `reason` a short free-form tag.
    """
    # str() round-trip keeps a float delta at its printed value.
    amount = Decimal(str(delta))
    entry = CreditLedger(user_id=user_id, delta=amount, reason=reason)
    session.add(entry)
# ---------------------- CommonPool debit ----------------------
def _period_bounds(now: datetime, interval: AllowanceInterval) -> tuple[datetime, datetime]:
    """
    Return the half-open [start, end) allowance period that contains `now`.

    DAILY  -> midnight of `now`'s day to the following midnight.
    WEEKLY -> midnight of that week's Monday to the Monday after.
    Any other interval is treated as the calendar month of `now`.

    Both bounds are rebuilt from year/month/day only, so they are naive
    datetimes regardless of any tzinfo on `now`.
    """
    if interval == AllowanceInterval.DAILY:
        day_start = datetime(now.year, now.month, now.day)
        return day_start, day_start + timedelta(days=1)

    if interval == AllowanceInterval.WEEKLY:
        # weekday() is 0 on Monday, so this steps back to the week's Monday.
        week_start = datetime(now.year, now.month, now.day) - timedelta(days=now.weekday())
        return week_start, week_start + timedelta(days=7)

    month_start = datetime(now.year, now.month, 1)
    # December rolls over into January of the following year.
    next_year, next_month = (now.year + 1, 1) if now.month == 12 else (now.year, now.month + 1)
    return month_start, datetime(next_year, next_month, 1)
async def _ensure_allowance(session: AsyncSession, user: User, project: Project) -> ProjectAllowance:
    """
    Fetch, create, or roll over the user's allowance row for `project`.

    - No row yet: one is created with the project's per-user allowance and the
      current period bounds, then flushed.
    - Row whose period is missing or has ended: its unused remainder is added
      to project.common_pool_balance, the allowance is refilled, the period is
      advanced to the current one, and the session is flushed.
    - Otherwise the row is returned untouched.
    """
    now = datetime.utcnow()
    start, end = _period_bounds(now, project.allowance_interval)

    stmt = select(ProjectAllowance).where(
        ProjectAllowance.project_id == project.id,
        ProjectAllowance.user_id == user.id,
    )
    allowance = (await session.execute(stmt)).scalar_one_or_none()

    if not allowance:
        allowance = ProjectAllowance(
            project_id=project.id,
            user_id=user.id,
            remaining=project.allowance_per_user,
            period_start=start,
            period_end=end,
        )
        session.add(allowance)
        await session.flush()
        return allowance

    # A row without bounds is treated the same as one whose period has ended.
    period_over = (
        not allowance.period_start
        or not allowance.period_end
        or now >= allowance.period_end
    )
    if period_over:
        # Whatever the user did not spend moves into the shared pool.
        leftover = Decimal(allowance.remaining or 0)
        project.common_pool_balance = Decimal(project.common_pool_balance or 0) + leftover
        allowance.remaining = Decimal(project.allowance_per_user or 0)
        allowance.period_start = start
        allowance.period_end = end
        await session.flush()
    return allowance
def _affordable(need: Decimal, balance: Any) -> Decimal:
    """Return the part of `need` that `balance` can cover: min(need, balance), floored at 0."""
    return max(Decimal(0), min(need, Decimal(balance or 0)))


async def debit_credits(session: AsyncSession, user: User, cost: Decimal, model: str, provider: str) -> None:
    """
    Deduct `cost` credits according to the project's funding policy.

    CommonPool ON (project has a common pool and an allowance interval):
        1) per-user allowance.remaining
        2) project.common_pool_balance
        3) user.credits
      Amounts taken in steps 1 and 2 are also subtracted from project.credits.
    CommonPool OFF:
        1) user.credits
        2) project.credits

    The debit is all-or-nothing: the split across sources is planned first and
    HTTPException(402) is raised BEFORE any balance is changed, so a rejected
    charge leaves no partial debit and no ledger row in the session. In the
    CommonPool ON path, `_ensure_allowance` still runs before that check.

    A CreditLedger row is staged only for the part taken from user.credits.
    A `cost` that is missing, zero or negative is a no-op.

    Raises:
        HTTPException: status 402 when the combined sources cannot cover `cost`.
    """
    need = Decimal(cost or 0)
    if need <= 0:
        return

    project: Project | None = user.project

    if project and project.has_common_pool and project.allowance_interval:
        pa = await _ensure_allowance(session, user, project)

        # ---- plan: how much each source contributes (nothing mutated yet) ----
        from_allowance = _affordable(need, pa.remaining)
        from_pool = _affordable(need - from_allowance, project.common_pool_balance)
        from_user = _affordable(need - from_allowance - from_pool, user.credits)

        if need - from_allowance - from_pool - from_user > 0:
            raise HTTPException(
                status_code=402,
                detail="Insufficient credits (allowance, common pool and user balance exhausted).",
            )

        # ---- apply, in policy order ----
        # NOTE(review): project.credits is reduced together with allowance/pool
        # and has no floor check here; confirm it is meant to mirror the
        # project's total funds.
        if from_allowance > 0:
            pa.remaining = Decimal(pa.remaining or 0) - from_allowance
            project.credits = Decimal(project.credits or 0) - from_allowance
        if from_pool > 0:
            project.common_pool_balance = Decimal(project.common_pool_balance or 0) - from_pool
            project.credits = Decimal(project.credits or 0) - from_pool
        if from_user > 0:
            user.credits = Decimal(user.credits or 0) - from_user
            # Ledger tracks only changes to the user's own balance.
            await _log_ledger(
                session,
                user_id=user.id,
                delta=-from_user,
                reason=f"spend:{provider}:{model}"
            )
        return

    # ---- CommonPool OFF path ----
    from_user = _affordable(need, user.credits)
    from_project = _affordable(need - from_user, project.credits) if project else Decimal(0)

    if need - from_user - from_project > 0:
        raise HTTPException(
            status_code=402,
            detail="Insufficient credits (user and project balances exhausted).",
        )

    if from_user > 0:
        user.credits = Decimal(user.credits or 0) - from_user
        # Ledger tracks only changes to the user's own balance.
        await _log_ledger(
            session,
            user_id=user.id,
            delta=-from_user,
            reason=f"spend:{provider}:{model}"
        )
    if from_project > 0:
        project.credits = Decimal(project.credits or 0) - from_project
# ---------------------- Price charges ----------------------
async def _pricing(session: AsyncSession, model: str, provider: str) -> ModelPricing | None:
    """Look up the ModelPricing row for (model, provider); None when no row matches."""
    stmt = select(ModelPricing).where(
        ModelPricing.model == model,
        ModelPricing.provider == provider,
    )
    result = await session.execute(stmt)
    return result.scalar_one_or_none()
async def charge_llm(
    session: AsyncSession,
    user: User,
    model: str,
    provider: str,
    input_tokens: int,
    output_tokens: int,
) -> Decimal:
    """
    Bill an LLM call, with prices interpreted as 'per 1,000,000 tokens'.

    Example: a stored input price of 0.15 means 0.15 credits per 1M input
    tokens. A model without a pricing row costs 0. The computed cost is
    debited via `debit_credits` and returned.
    """
    pricing = await _pricing(session, model, provider)

    cost = Decimal(0)
    if pricing:
        per_million = Decimal("1000000")
        # The per-token columns now hold the price per 1M tokens.
        input_rate = Decimal(pricing.price_per_input_token or 0)
        output_rate = Decimal(pricing.price_per_output_token or 0)
        input_cost = (input_rate * Decimal(input_tokens or 0)) / per_million
        output_cost = (output_rate * Decimal(output_tokens or 0)) / per_million
        cost = input_cost + output_cost

    await debit_credits(session, user, cost, model, provider)
    return cost
async def charge_tts(
    session: AsyncSession,
    user: User,
    model: str,
    provider: str,
    characters: int,
) -> Decimal:
    """
    Bill a text-to-speech call by character count.

    Cost is price_per_character * characters, or 0 when the model has no
    pricing row. The cost is debited via `debit_credits` and returned.
    """
    pricing = await _pricing(session, model, provider)
    if pricing:
        per_character = Decimal(pricing.price_per_character or 0)
        cost = per_character * Decimal(characters or 0)
    else:
        cost = Decimal(0)
    await debit_credits(session, user, cost, model, provider)
    return cost
async def charge_asr(
    session: AsyncSession,
    user: User,
    model: str,
    provider: str,
    seconds: int,
) -> Decimal:
    """
    Bill speech recognition by the HOUR (fallback mode).

    The DB field 'price_per_second' is read as an hourly price:
      - The column name and API surface stay unchanged to keep edits minimal.
      - The admin UI shows 'price/hour'; the value entered there is stored in
        price_per_second.
      - Here the duration is converted from seconds to hours and multiplied by
        that stored hourly price.

    A model without a pricing row costs 0. The cost is debited via
    `debit_credits` and returned.
    """
    pricing = await _pricing(session, model, provider)

    cost = Decimal(0)
    if pricing:
        duration_hours = Decimal(seconds or 0) / Decimal(3600)
        # Despite its name, this column holds the price per hour.
        price_per_hour = Decimal(pricing.price_per_second or 0)
        cost = price_per_hour * duration_hours

    await debit_credits(session, user, cost, model, provider)
    return cost