-
Notifications
You must be signed in to change notification settings - Fork 1
/
search.py
62 lines (55 loc) · 2.21 KB
/
search.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
import os
import requests
import pandas as pd
from serpapi import GoogleSearch
from dotenv import load_dotenv
from tqdm import tqdm
load_dotenv()
SUPPORTED_FORMATS = ('.png', '.jpg', '.jpeg', '.gif', '.bmp', '.webp')
MAX_RESULTS = 20
def upload_image(image_path):
try:
with open(image_path, "rb") as image_file:
response = requests.post(
"https://api.imgbb.com/1/upload",
files={"image": image_file},
params={"key": os.getenv('IMGBB_API_KEY')},
timeout=10
)
response.raise_for_status()
return response.json().get("data", {}).get("url", "")
except requests.exceptions.RequestException as e:
print(f"Network or request issue: {e}")
except Exception as e:
print(f"Unexpected error occurred: {e}")
return None
def google_lens_search(image_url):
try:
search = GoogleSearch({
"engine": "google_lens",
"url": image_url,
"no_cache": "true",
"api_key": os.getenv('SERPAPI_KEY')
})
results = search.get_dict()
thumbnails, links = zip(*[(match.get("thumbnail"), match.get("link")) for match in results.get("visual_matches", [])[:MAX_RESULTS]])
return list(thumbnails), list(links)
except Exception as e:
print(f"Search API error: {e}")
return [], []
def process_images(folder_path):
data = []
for filename in tqdm(os.listdir(folder_path)):
if filename.lower().endswith(SUPPORTED_FORMATS):
print(f"Processing {filename}...")
image_url = upload_image(os.path.join(folder_path, filename))
if image_url:
thumbnails, links = google_lens_search(image_url)
data.append([filename] + thumbnails + links)
else:
data.append([filename] + ["Upload failed"] * (2 * MAX_RESULTS))
column_names = ['Filename'] + [f"Thumbnail {i+1}" for i in range(MAX_RESULTS)] + [f"Link {i+1}" for i in range(MAX_RESULTS)]
df = pd.DataFrame(data, columns=column_names)
df.to_excel('results.xlsx', index=False)
print("All images processed and results are saved to results.xlsx.")
process_images(os.getenv('FOLDER_PATH'))