# app.py
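"""Flask front-end for a scraped model catalog.

Serves public listing and detail pages for models collected by scraper.py,
plus admin routes to refresh (re-scrape), stop, delete, and CSV-export them.
"""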
import csv
import io
import logging
import os
import sqlite3
import threading

from flask import Flask, render_template, abort, redirect, request, send_file
from werkzeug.exceptions import HTTPException

from scraper import init_db, scrape_models, get_models, get_model_by_slug

# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

app = Flask(__name__, static_folder='static', static_url_path='/static')

# Global variables to track scraping status
is_scraping = False
should_stop_scraping = False
total_models_to_scrape = 0
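# Note: these flags are shared with the background scrape thread. Plain
# module-level booleans are workable for a single daemon worker, but a
# threading.Event would be a more robust stop signal if this grows.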


def initialize_database():
    """Initialize database only."""
    try:
        logger.info("Initializing database...")
        init_db()  # Creates the table if it doesn't exist
        return True
    except Exception as e:
        logger.error(f"Error initializing database: {str(e)}")
        return False


def start_scraping():
    """Start scraping models in a background thread."""
    global is_scraping, should_stop_scraping, total_models_to_scrape

    def scrape_worker():
        global is_scraping, should_stop_scraping
        try:
            is_scraping = True
            should_stop_scraping = False
            logger.info("Scraping models...")
            models = scrape_models(lambda: should_stop_scraping)  # Pass a stop-check callback
            if should_stop_scraping:
                logger.info("Scraping was stopped by user")
            else:
                logger.info(f"Successfully scraped {len(models)} models")
        except Exception as e:
            logger.error(f"Error scraping models: {str(e)}")
        finally:
            is_scraping = False
            should_stop_scraping = False

    if not is_scraping:
        thread = threading.Thread(target=scrape_worker)
        thread.daemon = True
        thread.start()
        return True
    return False
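
# Note: the is_scraping check and the thread start above are not atomic, so
# two near-simultaneous refresh requests could both pass the check. A
# threading.Lock around that section would close the window if it matters.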


@app.route('/admin/stop', methods=['POST'])
def stop_scraping():
    """Stop the scraping process."""
    global should_stop_scraping
    try:
        logger.info("Stopping scraping process...")
        should_stop_scraping = True
        return redirect('/admin')
    except Exception as e:
        logger.error(f"Error stopping scrape: {str(e)}")
        logger.exception(e)
        abort(500)


@app.route('/admin/delete', methods=['POST'])
def delete_models():
    """Delete all models from the database."""
    try:
        logger.info("Deleting all models from database...")
        conn = sqlite3.connect('models.db')
        c = conn.cursor()
        c.execute('DELETE FROM models')
        conn.commit()
        conn.close()
        logger.info("Successfully deleted all models")
        return redirect('/admin')
    except Exception as e:
        logger.error(f"Error deleting models: {str(e)}")
        logger.exception(e)
        abort(500)


# Initialize database on startup (without scraping)
initialize_database()


@app.route('/')
def home():
    breadcrumbs = []  # Home page has no breadcrumbs
    return render_template('index.html', breadcrumbs=breadcrumbs)


@app.route('/models')
def models():
    try:
        # Get search query and page number from query parameters
        search_query = request.args.get('q', '').lower()
        try:
            page = int(request.args.get('page', 1))
        except ValueError:
            page = 1  # Fall back to the first page on non-numeric input
        per_page = 20
        # Set breadcrumbs
        breadcrumbs = [
            {'url': '/models', 'text': 'Models'}
        ]
        # Get models from database
        logger.info("Fetching models from database...")
        model_list = get_models()
        # Only show models that have been fully downloaded
        available_models = [
            model for model in model_list
            if model.get('providers') and model.get('provider_details') and model.get('description')
        ]
        # Filter models if a search query exists
        if search_query:
            filtered_models = []
            for model in available_models:
                name = model['name'].lower()
                model_id = model['model_id'].lower()
                providers = [p.lower() for p in model['providers']]
                if (search_query in name or
                        search_query in model_id or
                        any(search_query in p for p in providers)):
                    filtered_models.append(model)
            available_models = filtered_models

        # Sort models, prioritizing newer models
        def sort_key(model):
            name = model['name'].lower()
            model_id = model['model_id'].lower()
            if 'claude-3' in model_id:
                return ('0', name)  # Claude-3 models first
            elif 'gpt-4' in model_id:
                return ('1', name)  # GPT-4 models second
            elif 'gemini' in model_id:
                return ('2', name)  # Gemini models third
            return ('3', name)  # All other models

        available_models.sort(key=sort_key)
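        # (The '0'-'3' string prefixes group model families in a fixed order;
        # names break ties alphabetically within each family.)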
        # Calculate pagination
        total_models = len(available_models)
        total_pages = (total_models + per_page - 1) // per_page
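        # Adding per_page - 1 before the floor division makes this a ceiling:
        # e.g. 41 models at 20 per page -> (41 + 19) // 20 = 3 pages.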
        # Ensure page is within the valid range
        page = max(1, min(page, total_pages))
        # Slice the models list for the current page
        start_idx = (page - 1) * per_page
        end_idx = start_idx + per_page
        paginated_models = available_models[start_idx:end_idx]
        # Get total models being scraped
        global total_models_to_scrape
        if total_models_to_scrape == 0:
            try:
                # Check if the database exists
                if os.path.exists('models.db'):
                    conn = sqlite3.connect('models.db')
                    c = conn.cursor()
                    c.execute('SELECT COUNT(*) FROM models')
                    total_models_to_scrape = c.fetchone()[0] or 217  # Default to 217 if no count
                    conn.close()
                else:
                    total_models_to_scrape = 217  # Default number of models
            except Exception:
                total_models_to_scrape = 217  # Default if database error
        logger.info(f"Retrieved {len(available_models)} available models out of {total_models_to_scrape} total models")
        return render_template(
            'models.html',
            models=paginated_models,
            total_models=total_models_to_scrape,
            available_models=len(available_models),
            breadcrumbs=breadcrumbs,
            current_page=page,
            total_pages=total_pages,
            per_page=per_page,
            is_scraping=is_scraping  # Pass scraping status to template
        )
    except Exception as e:
        logger.error(f"Error retrieving models: {str(e)}")
        logger.exception(e)  # Logs the full stack trace
        # Rebuild breadcrumbs here: the exception may have fired before the
        # assignment inside the try block
        breadcrumbs = [{'url': '/models', 'text': 'Models'}]
        return render_template('models.html', models=[], total_models=217, available_models=0, breadcrumbs=breadcrumbs, is_scraping=is_scraping)


@app.route('/model/<slug>')
def model_detail(slug):
    try:
        logger.info(f"Fetching details for model: {slug}")
        model = get_model_by_slug(slug)
        if model is None:
            logger.warning(f"Model not found with slug: {slug}")
            abort(404)
        # Set breadcrumbs
        breadcrumbs = [
            {'url': '/models', 'text': 'Models'},
            {'url': f'/model/{slug}', 'text': model['name']}
        ]
        logger.info(f"Found model: {model['name']}")
        return render_template('model_detail.html', model=model, breadcrumbs=breadcrumbs)
    except HTTPException:
        raise  # Let abort(404) propagate instead of being remapped to a 500
    except Exception as e:
        logger.error(f"Error retrieving model details: {str(e)}")
        logger.exception(e)  # Logs the full stack trace
        abort(500)


@app.route('/admin')
def admin():
    try:
        # Set breadcrumbs
        breadcrumbs = [
            {'url': '/admin', 'text': 'Admin'}
        ]
        # Get models count
        model_list = get_models()
        available_models = [
            model for model in model_list
            if model.get('providers') and model.get('provider_details') and model.get('description')
        ]
        return render_template(
            'admin.html',
            total_models=total_models_to_scrape,
            available_models=len(available_models),
            breadcrumbs=breadcrumbs,
            is_scraping=is_scraping  # Pass scraping status to template
        )
    except Exception as e:
        logger.error(f"Error accessing admin page: {str(e)}")
        logger.exception(e)
        abort(500)


@app.route('/admin/export')
def export_models():
    try:
        # Get all models
        models = get_models()
        # Create a string buffer to write CSV data
        output = io.StringIO()
        writer = csv.writer(output)
        # Write header
        writer.writerow(['Name', 'Model ID', 'Provider', 'Context Length', 'Max Output',
                         'Input Price', 'Output Price', 'Latency', 'Throughput', 'URL'])
        # Write data
        for model in models:
            for provider in model.get('providers', []):
                if provider in model.get('provider_details', {}):
                    details = model['provider_details'][provider]
                    writer.writerow([
                        model['name'],
                        model['model_id'],
                        provider,
                        details.get('context', ''),
                        details.get('max_output', ''),
                        details.get('input_price', ''),
                        details.get('output_price', ''),
                        details.get('latency', ''),
                        details.get('throughput', ''),
                        details.get('url', '')
                    ])
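        # One CSV row per (model, provider) pair: a model served by three
        # providers appears three times, with provider-specific columns.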
        # Move cursor to beginning of the buffer
        output.seek(0)
        # Return the CSV file
        return send_file(
            io.BytesIO(output.getvalue().encode('utf-8')),
            mimetype='text/csv',
            as_attachment=True,
            download_name='models.csv'
        )
    except Exception as e:
        logger.error(f"Error exporting models: {str(e)}")
        logger.exception(e)
        abort(500)


@app.route('/admin/refresh', methods=['POST'])
def refresh_models():
    try:
        # Start scraping in the background
        logger.info("Starting model refresh...")
        if start_scraping():
            logger.info("Model refresh started successfully")
        else:
            logger.warning("Scraping already in progress")
        return redirect('/admin')
    except Exception as e:
        logger.error(f"Error starting model refresh: {str(e)}")
        logger.exception(e)
        abort(500)


@app.errorhandler(404)
def not_found_error(error):
    breadcrumbs = [{'url': '#', 'text': 'Not Found'}]
    return render_template('404.html', breadcrumbs=breadcrumbs), 404


@app.errorhandler(500)
def internal_error(error):
    breadcrumbs = [{'url': '#', 'text': 'Error'}]
    return render_template('500.html', breadcrumbs=breadcrumbs), 500


if __name__ == '__main__':
    # Ensure the static directory exists
    os.makedirs('static/css', exist_ok=True)
    # Start the Flask server immediately
    logger.info("Starting Flask server on port 5000...")
    app.run(host='127.0.0.1', port=5000, debug=True)
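
# Example usage (assumes scraper.py providing init_db/scrape_models/get_models/
# get_model_by_slug and the referenced templates live alongside this file):
#   $ python app.py
#   # browse http://127.0.0.1:5000/models?q=claude&page=1
#   # POST /admin/refresh to start a scrape; POST /admin/stop to cancel it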