-
Notifications
You must be signed in to change notification settings - Fork 0
/
tuftpostbot.py
500 lines (417 loc) · 17.8 KB
/
tuftpostbot.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
import os
import sys
import json
import random
import tweepy
import flickrapi
import wget
import pathlib
from time import sleep
from dotenv import load_dotenv
from datetime import datetime
from PIL import Image
from PIL import ImageOps
from urllib import request
from fastai.vision.all import *
from fastai.text.all import *
from fastai.collab import *
from fastai.tabular.all import *
from discord_webhook import DiscordWebhook
from cohost.models.user import User
from cohost.models.block import MarkdownBlock
from atproto import Client
from atproto.exceptions import BadRequestError
from bskysession import *
base_posix_path = pathlib.PosixPath
if sys.platform.startswith("linux"):
pass
elif sys.platform.startswith("win32"):
pathlib.PosixPath = pathlib.WindowsPath
load_dotenv()
# API auth keys
CONS_KEY=os.getenv('TWT_CONSUMER_APIKEY')
CONS_SEC=os.getenv('TWT_CONSUMER_APISECRET')
AUTH_ACC=os.getenv('TWT_AUTH_ACCESSTOKEN')
AUTH_SEC=os.getenv('TWT_AUTH_SECRET')
BEARER=os.getenv('TWT_BEARER')
FLKR_KEY=os.getenv('FLICKR_KEY')
FLKR_SEC=os.getenv('FLICKR_SECRET')
BSKY_UNAME=str(os.getenv('BSKY_UNAME'))
BSKY_PASS=str(os.getenv('BSKY_PASS'))
# cohost env vars
CH_UNAME=os.getenv('COHO_UNAME')
CH_PW=os.getenv('COHO_PW')
CH_PAGE=os.getenv('COHO_PAGE')
# init
istuft = 0
probability = 0
owner_name = 0
backup_used_flag = False
# config
CONFIDENCE_THRESHOLD = 0.50
ATTEMPTS = 50
FETCH_COUNT = 15 #15
PAGE_RANGE = 256 #256
BLOCKLIST = ["61021753@N02", "101072775@N04", "120795404@N04"]
LOGFILE = "titpostbotlog.txt"
EXTRA_ARGS = 'url_o, owner_name, path_alias'
TAGS = 'tufted titmouse'
RESOLUTION = 1600 #pixels, width
REGISTRY_FILE="tuftregistry.txt"
DEFAULTMSG = (f"#Tuftpostbot Tuftie: {istuft}({probability}). Photo by {owner_name}")
WEBHOOK_URL = "https://discord.com/api/webhooks/1009424824399056896/pwF8xcTBfpN25d0RxC7SZgaixE01Yadpjq2N-IFT9wk8x-02zUNrZ5vWCn57ZcCHyZkk"
ENABLE_WEBHOOK = True
ENABLE_BSKY=bool(os.getenv('ENABLE_BSKY'))
ENABLE_COHOST=bool(os.getenv('ENABLE_COHOST'))
BACKUP_TUFT_DIR = "fallbacktuft"
BACKUP_METAFILE = "fallbackmeta.json"
# WEBHOOK = TUFTED TIDDIES SERVER
# references
# v1.1 api
auth = tweepy.OAuthHandler(CONS_KEY, CONS_SEC)
auth.set_access_token(AUTH_ACC, AUTH_SEC)
api = tweepy.API(auth, wait_on_rate_limit=True)
# v2.0 api
twclient = tweepy.Client(BEARER, CONS_KEY, CONS_SEC, AUTH_ACC, AUTH_SEC, wait_on_rate_limit=True)
# flickr api
flickr = flickrapi.FlickrAPI(FLKR_KEY, FLKR_SEC, format='parsed-json')
#bsky api
if ENABLE_BSKY:
bsky_client = Client()
session_string = getSessionString()
try:
bsky_client.login(session_string=session_string)
except BadRequestError as e:
print(f"Bsky login failed: {e}")
else:
print("Bsky login succesful!")
# twitter login
try:
api.verify_credentials()
print("Authentication OK")
except Exception as e:
print(f"Error during authentication: {e}")
# utility functions
def getTime():
dateTimeObj = datetime.now()
timestampStr = dateTimeObj.strftime("[%d-%m-%Y %H:%M:%S]")
return(timestampStr)
def writeToLog(message):
output = open(str(LOGFILE), "a")
output.write(getTime() + " " + str(message) + "\n")
output.close()
def deleteAllTempImages(folder_path):
for file in os.scandir(folder_path):
os.remove(file.path)
def deleteSingleImage(folder_path, filename):
full_path = folder_path+"/"+filename
#print(f"deleted {full_path} :D")
os.remove(full_path)
def findStringInNestedList(search_list, search_string):
for sublist in search_list:
try:
if search_string in sublist:
return search_list.index(sublist), sublist.index(search_string)
except TypeError:
print("Index not found!")
# check if image exists in registry; returns True if already exists.
def checkImageIDInRegistry(string):
try:
with open(REGISTRY_FILE, "r") as registry:
if string in set(registry.read().split('\n')):
#print(f"Found {string}!")
#writeToLog("checkImageIDInRegistry: Found match. Ignoring!")
return True
else:
#print(f"Could not find {string}!")
return False
except FileNotFoundError:
print(f"File not found. Creating {REGISTRY_FILE}")
writeToLog("checkImageIDInRegistry: Registry file not found. Creating...")
newfile = open(REGISTRY_FILE, "x")
newfile.close()
return False
def writeImageIDToRegistry(string):
try:
if checkImageIDInRegistry(string) == False:
with open(REGISTRY_FILE, "a") as registry:
registry.write(string+"\n")
print(f"Wrote {string} to file")
writeToLog("writeImageIDToRegistry: Wrote string " + string + " to registry.")
else:
print(f"Cannot write {string} to registry: already exists")
except FileNotFoundError:
print(f"File {REGISTRY_FILE} not found. Creating and appending image ID.")
writeToLog("writeImageIDToRegistry: Registry file not found. Creating...")
with open(REGISTRY_FILE, "a") as newregistry:
newregistry.write(string)
print(f"Wrote {string} to new file")
# this needs to be up here because fastai is a dummy
def is_tufter(filename):
return filename[0].isupper()
# always keep this below def is_tufter() to avoid bugs
learn = load_learner('tuftmodel_v8_10ep_lr0.001.pkl')
#main functions
def findBirdImage(search_tags, extra_arguments, image_fetch_count):
page_number = random.randint(1, PAGE_RANGE)
search_arguments = [extra_arguments]
#print(f"Page: {page_number}.")
search_query = flickr.photos.search(tags=search_tags, extras=search_arguments, per_page=image_fetch_count, page=page_number)
return search_query
# filter based on functionality; filtering on bird type comes later
def filterSearchResults(search_query):
image_url_data = ""
photo_id = ""
photo_owner_id = ""
photo_owner_name = ""
rejected = 0
b_pathalias = False
b_returned_image = False
for v in search_query["photos"]["photo"]:
temp_image_id = v["id"]
if not checkImageIDInRegistry(v["id"]):
if not v["owner"] in BLOCKLIST:
if "url_o" in v:
image_url_data = v["url_o"]
b_returned_image = True
if "owner" in v:
photo_owner_id = v["owner"]
photo_id = v["id"]
if "pathalias" in v:
if v["pathalias"] != None:
photo_owner_name = v["pathalias"]
f_pathAlias = True
else:
photo_owner_name = v["ownername"]
f_pathAlias = False
else:
rejected = rejected + 1
b_returned_image = False
else:
print(f"Blocked image from {v['owner']}")
rejected = rejected + 1
b_returned_image = False
else:
#print(f"ImageID {temp_image_id} already posted. Ignoring.")
writeToLog("ImageID " + temp_image_id + " already posted. Ignoring.")
b_returned_image = False
if len(image_url_data) == 0:
return ([], False)
data_list_full = [image_url_data, photo_owner_name, photo_id, photo_owner_id]
return(data_list_full, b_returned_image)
def collectInitialImageDataSet(count, max_requests):
iterator = 0
foundImages = 0
result_data_set = []
while foundImages < count:
sleep(1)
data_set, b_returned_image = filterSearchResults(findBirdImage(TAGS, EXTRA_ARGS, FETCH_COUNT))
if b_returned_image == False:
# no images found
iterator += 1
elif b_returned_image == True:
# found image
foundImages += 1
print(f"Found {foundImages} images...")
writeToLog(f"Found {foundImages} images...")
iterator += 1
result_data_set.append(data_set)
if iterator >= max_requests:
break
result_string = str(f"Found {count} images in {iterator}/{max_requests} attempts.")
print(result_string)
writeToLog(result_string)
return result_data_set
def downloadImagesFromURL(data_set, destination_path):
list_filenames = []
if len(data_set) < 1:
print("Dataset empty! AAAAAAAA")
writeToLog("dataset empty! AAAAAAA")
# TODO handle exception
for _, url in enumerate(data_set):
file_extension = str(url[0][-4:])
file_name = url[2]
file_name_full = file_name+file_extension
dl_image = urllib.request.urlretrieve(url[0], filename=destination_path+"/"+file_name_full)
list_filenames.append(file_name_full)
return list_filenames
# resize before using ML inference; operates faster on smaller images (if images are larger than 1600px)
def resizeImages(list_filenames, filepath, target_path, width):
for i, file in enumerate(list_filenames):
full_path = filepath+"/"+file
filename_no_extension = file[:-4]
image = Image.open(full_path)
image = ImageOps.exif_transpose(image) # if image is rotated; get correct rotation from EXIF metadata; if data is not present, just get a copy of 'image'
width_percentage = (width/float(image.size[0]))
height_size = int((float(image.size[1])*float(width_percentage)))
image = image.resize((width, height_size), Image.ANTIALIAS)
image.convert('RGB').save((target_path + "/" + "rs_" + filename_no_extension+".jpg"), format="JPEG")
def checkTufts(filepath, image_data_list):
for file in os.listdir(filepath):
img = PILImage.create(str(filepath)+"/"+str(file))
is_tufter,_,probs = learn.predict(img)
if probs[1].item() < CONFIDENCE_THRESHOLD:
writeToLog(f"{file} rejected, {probs[1].item()}")
deleteSingleImage(filepath, file)
image_id = file.replace("rs_", "").replace(".jpg", "")
index_a, index_b = findStringInNestedList(image_data_list, image_id)
probability = '{:.4f}'.format(probs[1].item())
image_data_list[index_a].append(probability)
image_data_list[index_a].append(str(is_tufter))
del image_data_list[index_a]
else:
writeToLog(f"{file} accepted, {probs[1].item()}")
image_id = file.replace("rs_", "").replace(".jpg", "")
index_a, index_b = findStringInNestedList(image_data_list, image_id)
probability = '{:.4f}'.format(probs[1].item())
image_data_list[index_a].append(probability)
image_data_list[index_a].append(str(is_tufter))
if len(image_data_list) == 0:
writeToLog("CheckTufts: dataset empty!")
print("CheckTufts: dataset empty!")
final_data_table = image_data_list
return final_data_table
def pickBackupTuftie():
# select one of the entries in the metadata file at random
with open(BACKUP_METAFILE) as file:
data = json.load(file)
keys = list(data)
index = random.randint(0, len(data)-1)
result_key = keys[index]
result_data = data[result_key]
# construct data table
# format: ['url', 'owner', 'filename', 'owner-id', 'probability', 'istuft true/false']
fallbackDataTable = list(result_data.values())
print(fallbackDataTable)
return fallbackDataTable
def pickBestTuftieFromResults(input_list, b_writeRegistry):
writeToLog(f"input list length: {len(input_list)}. list: {input_list}")
print(f"input list length: {len(input_list)}. list: {input_list}")
try:
index = random.randint(0, len(input_list)-1)
result_list = input_list[index]
picked_image_id = input_list[index][2]
print(f"index: {index}. results: {result_list}. ID: {picked_image_id}")
writeToLog(f"index: {index}. results: {result_list}. ID: {picked_image_id}")
if b_writeRegistry == True:
writeImageIDToRegistry(picked_image_id)
test_value = result_list[4]
print(test_value)
print(f"result_list: {result_list}")
writeToLog(f"result list: {result_list}")
return result_list
except Exception as e:
print(f"Exception {type(e).__name__} occurred in pickBestTuftieFromResults: {repr(e)}")
writeToLog(f"Exception {type(e).__name__} occurred in pickBestTuftieFromResults: {repr(e)}")
global backup_used_flag
backup_used_flag = True
#backup_tuft = ['https://live.staticflickr.com/65535/49872212437_1db03f17d4_o.jpg', 'tuftpostbot5000', 'backuptuft', '12345', '4325.000', 'YES']
backup_tuft = pickBackupTuftie()
return backup_tuft
def postBirdToTwitter(picked_image, message="default", b_should_post=True):
owner_name = picked_image[1]
filename = picked_image[2]
owner_id = picked_image[3]
istuft = picked_image[5]
media_id_list = []
media_url_original = picked_image[0]
try:
probability = picked_image[4]
except IndexError:
print("Can't find probability somehow, using fallback data")
owner_name = "tuftpostbot5000"
filename = "backuptuft"
probability = "OVER 9000"
istuft = "YEEHAW"
if backup_used_flag == True:
# using fallback tufterino
print("WARNING: BACKUP IMAGE USED.")
writeToLog("WARNING: BACKUP IMAGE USED.")
file_path = "fallbacktuft"
else:
file_path = "resized"
image_name = "rs_"+filename+".jpg"
full_path = file_path+"/"+image_name
if message == "default":
status_text_twt = (f"#Tuftpostbot Tuftie: {istuft}({probability}). Photo by {owner_name}. Tuftpostbot is now also on blue sky: titmou.se/sky")
status_text_other = (f"#Tuftpostbot Tuftie: {istuft}({probability}). Photo by {owner_name}.")
#status_text = DEFAULTMSG
else:
status_text_twt = (f"#Tuftpostbot {message}. Tuftie: {istuft}({probability}). Photo by {owner_name}. Tuftpostbot is now also on blue sky: titmou.se/sky")
status_text_other = (f"#Tuftpostbot {message}. Tuftie: {istuft}({probability}). Photo by {owner_name}.")
if b_should_post:
#send to twitter
#media_info = api.simple_upload(filename=full_path)
#media_id_list.append(media_info.media_id)
media_info = api.media_upload(filename=full_path)
posted_status_v2 = twclient.create_tweet(text=status_text_twt, media_ids=[media_info.media_id])
#posted_status_info = api.update_status(status=status_text, media_ids=media_id_list)
#media_id_list.clear()
print(f"Sent {status_text_twt} to Twitter!")
writeToLog(f"Sent {status_text_twt} to Twitter!")
#media_url = posted_status_info.entities["media"][0]["media_url"]
tweet_id = str(posted_status_v2.data["id"])
tweet_url = "https://vxtwitter.com/asoftbird/status/"+tweet_id
if ENABLE_WEBHOOK:
#send to discord webhook
#discord_text = (f"Tuftie: {istuft}({probability}). {picked_image[0]}")
discord_text = tweet_url
webhook = DiscordWebhook(url=WEBHOOK_URL, content=discord_text)
response = webhook.execute()
print(f"Sent {discord_text} to Discord!")
writeToLog(f"Sent {discord_text} to Discord!")
if ENABLE_COHOST:
#cohost stuff
user = User.login(CH_UNAME, CH_PW)
project = user.getProject(CH_PAGE)
# newpost = project.post(status_text, blocks=[MarkdownBlock(f"{tweet_url}")], tags=['tuftpostbot']) # 'tufted titmouse', 'automated posting', 'bot'
newpost = project.post(status_text_other, blocks=[MarkdownBlock(f"![]({media_url_original})")], tags=['tuftpostbot']) # 'tufted titmouse', 'automated posting', 'bot'
print(f"Sent {status_text_other} to Cohost as well (hopefully)!")
writeToLog(f"Sent {status_text_other} to Cohost as well (hopefully)!")
if ENABLE_BSKY:
with open(full_path, 'rb') as f:
image_data = f.read()
bsky_client.send_image(text=status_text_other, image=image_data, image_alt=status_text_other)
print(f"Sent {status_text_other} to bluesky!")
writeToLog(f"Sent {status_text_other} to bluesky!")
else:
print(f"Did not send to twitter/dc: NOPOST flag used. Text: {status_text_twt}")
writeToLog(f"Did not send to twitter/dc: NOPOST flag used. Text: {status_text_twt}")
# TODO:
# keep files in /resized/ around so there's a supply of tufterinos available
# clear temp folders before loading new images
deleteAllTempImages("ids")
deleteAllTempImages("resized")
if "NOPOST" in sys.argv:
b_should_post = False
b_writeRegistry = False
message = "default"
else:
b_should_post = True
b_writeRegistry = True
if len(sys.argv) <=1:
print("starting without arguments")
writeToLog("starting without arguments")
message = "default"
else:
message = str(sys.argv[1])
print(f"Using custom message '{message}'")
writeToLog(f"Using custom message '{message}'")
chance = random.randint(0, 500)
print(f"\n Looking for new tufties! Rolled {chance}\n")
writeToLog(f"Looking for tufties! Rolled {chance}")
if chance != 42:
initial_data_set = (collectInitialImageDataSet(5, ATTEMPTS))
downloaded_filename_list = downloadImagesFromURL(initial_data_set, "ids")
resizeImages(downloaded_filename_list, "ids", "resized", RESOLUTION)
result_list = checkTufts("resized", initial_data_set)
print(result_list)
pick = pickBestTuftieFromResults(result_list, b_writeRegistry)
else:
print("\n Rolled a 42! Posting shitpost tuftie!\n")
writeToLog("Rolled a 42! Posting shitpost tuftie!")
# we do a lil shitposting
pick = pickBackupTuftie()
print(f"Picked {pick} as #1 best tuftie of the year!")
writeToLog(pick)
postBirdToTwitter(pick, message, b_should_post)