From fbaf714fb52da66febb137d798b68ba209c2a21c Mon Sep 17 00:00:00 2001 From: Kiran Jonnalagadda Date: Mon, 2 Dec 2024 14:46:06 +0530 Subject: [PATCH 1/3] Add Bluesky support --- .gitignore | 3 + README.md | 2 +- hasjob/models/jobpost.py | 2 +- hasjob/socialmedia.py | 131 ++++++++++++++++++++++++++++++++++++ hasjob/twitter.py | 47 ------------- hasjob/views/listing.py | 23 ++++++- instance/settings-sample.py | 4 ++ requirements.txt | 1 + 8 files changed, 163 insertions(+), 50 deletions(-) create mode 100644 hasjob/socialmedia.py delete mode 100644 hasjob/twitter.py diff --git a/.gitignore b/.gitignore index 524ed67ff..b0c1b09ed 100644 --- a/.gitignore +++ b/.gitignore @@ -9,6 +9,9 @@ test.db .settings .sass-cache .webassets-cache +.venv +.env +.envrc error.log error.log.* .coverage diff --git a/README.md b/README.md index 554bedb20..6b99540a1 100644 --- a/README.md +++ b/README.md @@ -174,7 +174,7 @@ gid = chdir = /path/to/hasjob/git/repo/folder virtualenv = /path/to/virtualenv plugins-dir = /usr/lib/uwsgi/plugins -plugins = python37 +plugins = python311 pp = .. wsgi-file = wsgi.py callable = application diff --git a/hasjob/models/jobpost.py b/hasjob/models/jobpost.py index 145421fe0..802f66b0a 100644 --- a/hasjob/models/jobpost.py +++ b/hasjob/models/jobpost.py @@ -187,7 +187,7 @@ class JobPost(BaseMixin, Model): company_name = sa.orm.mapped_column(sa.Unicode(80), nullable=False) company_logo = sa.orm.mapped_column(sa.Unicode(255), nullable=True) company_url = sa.orm.mapped_column(sa.Unicode(255), nullable=False, default='') - twitter = sa.orm.mapped_column(sa.Unicode(15), nullable=True) + twitter = sa.orm.mapped_column(sa.Unicode(15), nullable=True) # Deprecated #: XXX: Deprecated field, used before user_id was introduced fullname = sa.orm.mapped_column(sa.Unicode(80), nullable=True) email = sa.orm.mapped_column(sa.Unicode(80), nullable=False) diff --git a/hasjob/socialmedia.py b/hasjob/socialmedia.py new file mode 100644 index 000000000..3ad7e01db --- /dev/null +++ b/hasjob/socialmedia.py @@ -0,0 +1,131 @@ +import re + +from atproto import ( + Client as BlueskyClient, + Session as BlueskySession, + SessionEvent as BlueskySessionEvent, + client_utils as atproto_client_utils, +) +from atproto.exceptions import AtProtocolError +from tweepy import API, OAuthHandler + +from baseframe import cache + +from . import app, rq + + +@rq.job('hasjob') +def tweet( + title: str, + url: str, + location: str | None = None, + parsed_location=None, + username: str | None = None, +) -> None: + auth = OAuthHandler( + app.config['TWITTER_CONSUMER_KEY'], app.config['TWITTER_CONSUMER_SECRET'] + ) + auth.set_access_token( + app.config['TWITTER_ACCESS_KEY'], app.config['TWITTER_ACCESS_SECRET'] + ) + api = API(auth) + urllength = 23 # Current Twitter standard for HTTPS (as of Oct 2014) + maxlength = 140 - urllength - 1 # == 116 + if username: + maxlength -= len(username) + 2 + locationtag = '' + if parsed_location: + locationtags = [] + for token in parsed_location.get('tokens', []): + if 'geoname' in token and 'token' in token: + locname = token['token'].strip() + if locname: + locationtags.append('#' + locname.title().replace(' ', '_')) + locationtag = ' '.join(locationtags) + if locationtag: + maxlength -= len(locationtag) + 1 + if not locationtag and location: + # Make a hashtag from the first word in the location. This catches + # locations like 'Anywhere' which have no geonameid but are still valid + locationtag = '#' + re.split(r'\W+', location)[0] + maxlength -= len(locationtag) + 1 + + if len(title) > maxlength: + text = title[: maxlength - 1] + '…' + else: + text = title[:maxlength] + text = text + ' ' + url # Don't shorten URLs, now that there's t.co + if locationtag: + text = text + ' ' + locationtag + if username: + text = text + ' @' + username + api.update_status(text) + + +def get_bluesky_session() -> str | None: + session_string = cache.get('hasjob:bluesky_session') + if not isinstance(session_string, str) or not session_string: + return None + return session_string + + +def save_bluesky_session(session_string: str) -> None: + cache.set('hasjob:bluesky_session', session_string) # No timeout + + +def on_bluesky_session_change( + event: BlueskySessionEvent, session: BlueskySession +) -> None: + if event in (BlueskySessionEvent.CREATE, BlueskySessionEvent.REFRESH): + save_bluesky_session(session.export()) + + +def init_bluesky_client() -> BlueskyClient: + client = BlueskyClient() # Only support the default `bsky.social` domain for now + client.on_session_change(on_bluesky_session_change) + + session_string = get_bluesky_session() + if session_string: + try: + client.login(session_string=session_string) + return client + except (ValueError, AtProtocolError): # Invalid session string + pass + # Fallback to a fresh login + client.login(app.config['BLUESKY_USERNAME'], app.config['BLUESKY_PASSWORD']) + return client + + +@rq.job('hasjob') +def bluesky_post( + title: str, + url: str, + location: str | None = None, + parsed_location=None, +): + locationtags = [] + if parsed_location: + for token in parsed_location.get('tokens', []): + if 'geoname' in token and 'token' in token: + locname = token['token'].strip() + if locname: + locationtags.append(locname.title().replace(' ', '_')) + if not locationtags and location: + # Make a hashtag from the first word in the location. This catches + # locations like 'Anywhere' which have no geonameid but are still valid + locationtag = re.split(r'\W+', location)[0] + locationtags.append(locationtag) + + maxlength = 300 # Bluesky allows 300 characters + if locationtags: + # Subtract length of all tags, plus length of visible `#`s and one space + maxlength -= len(' '.join(locationtags)) + len(locationtags) + 1 + + content = atproto_client_utils.TextBuilder() + content.link(title[: maxlength - 1] + '…' if len(title) > maxlength else title, url) + if locationtags: + for loc in locationtags: + content.text(' ') + content.tag('#' + loc, loc) + client = init_bluesky_client() + client.send_post(content) diff --git a/hasjob/twitter.py b/hasjob/twitter.py deleted file mode 100644 index cddb19a95..000000000 --- a/hasjob/twitter.py +++ /dev/null @@ -1,47 +0,0 @@ -import re - -from tweepy import API, OAuthHandler - -from . import app, rq - - -@rq.job('hasjob') -def tweet(title, url, location=None, parsed_location=None, username=None): - auth = OAuthHandler( - app.config['TWITTER_CONSUMER_KEY'], app.config['TWITTER_CONSUMER_SECRET'] - ) - auth.set_access_token( - app.config['TWITTER_ACCESS_KEY'], app.config['TWITTER_ACCESS_SECRET'] - ) - api = API(auth) - urllength = 23 # Current Twitter standard for HTTPS (as of Oct 2014) - maxlength = 140 - urllength - 1 # == 116 - if username: - maxlength -= len(username) + 2 - locationtag = '' - if parsed_location: - locationtags = [] - for token in parsed_location.get('tokens', []): - if 'geoname' in token and 'token' in token: - locname = token['token'].strip() - if locname: - locationtags.append('#' + locname.title().replace(' ', '')) - locationtag = ' '.join(locationtags) - if locationtag: - maxlength -= len(locationtag) + 1 - if not locationtag and location: - # Make a hashtag from the first word in the location. This catches - # locations like 'Anywhere' which have no geonameid but are still valid - locationtag = '#' + re.split(r'\W+', location)[0] - maxlength -= len(locationtag) + 1 - - if len(title) > maxlength: - text = title[: maxlength - 1] + '…' - else: - text = title[:maxlength] - text = text + ' ' + url # Don't shorten URLs, now that there's t.co - if locationtag: - text = text + ' ' + locationtag - if username: - text = text + ' @' + username - api.update_status(text) diff --git a/hasjob/views/listing.py b/hasjob/views/listing.py index 847d96710..d923d47fa 100644 --- a/hasjob/views/listing.py +++ b/hasjob/views/listing.py @@ -48,8 +48,8 @@ viewstats_by_id_hour, ) from ..nlp import identify_language +from ..socialmedia import bluesky_post, tweet from ..tagging import add_to_boards, tag_jobpost, tag_locations -from ..twitter import tweet from ..uploads import UploadNotAllowed, uploaded_logos from ..utils import common_legal_names, get_word_bag, random_long_key, redactemail from .helper import ( @@ -1063,6 +1063,27 @@ def confirm_email(domain, hashid, key): dict(post.parsed_location or {}), username=post.twitter, ) + if app.config['BLUESKY_ENABLED']: + if post.headlineb: + bluesky_post.queue( + post.headline, + post.url_for(b=0, _external=True), + post.location, + dict(post.parsed_location or {}), + ) + bluesky_post.queue( + post.headlineb, + post.url_for(b=1, _external=True), + post.location, + dict(post.parsed_location or {}), + ) + else: + bluesky_post.queue( + post.headline, + post.url_for(_external=True), + post.location, + dict(post.parsed_location or {}), + ) add_to_boards.queue(post.id) flash( "Congratulations! Your job post has been published. As a bonus for being an employer on Hasjob, " diff --git a/instance/settings-sample.py b/instance/settings-sample.py index a3863452c..1c1f6d6ac 100644 --- a/instance/settings-sample.py +++ b/instance/settings-sample.py @@ -55,6 +55,10 @@ TWITTER_CONSUMER_SECRET = '' # nosec B105 TWITTER_ACCESS_KEY = '' TWITTER_ACCESS_SECRET = '' # nosec B105 +#: Bluesky integration +BLUESKY_ENABLED = False +BLUESKY_USERNAME = '' # Login username +BLUESKY_PASSWORD = '' # App password # nosec B105 #: Bit.ly integration for short URLs BITLY_USER = '' BITLY_KEY = '' diff --git a/requirements.txt b/requirements.txt index 1bf9cc8bf..3f20581c8 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,3 +1,4 @@ +atproto git+https://github.com/hasgeek/baseframe#egg=baseframe bleach git+https://github.com/hasgeek/coaster#egg=coaster From ee2f142c7bb092fd6006016886989d909601ad5e Mon Sep 17 00:00:00 2001 From: Kiran Jonnalagadda Date: Mon, 2 Dec 2024 15:18:30 +0530 Subject: [PATCH 2/3] Include employer name, skip A/B headline dupes --- hasjob/views/listing.py | 26 ++++++-------------------- 1 file changed, 6 insertions(+), 20 deletions(-) diff --git a/hasjob/views/listing.py b/hasjob/views/listing.py index d923d47fa..281c0e6f1 100644 --- a/hasjob/views/listing.py +++ b/hasjob/views/listing.py @@ -1064,26 +1064,12 @@ def confirm_email(domain, hashid, key): username=post.twitter, ) if app.config['BLUESKY_ENABLED']: - if post.headlineb: - bluesky_post.queue( - post.headline, - post.url_for(b=0, _external=True), - post.location, - dict(post.parsed_location or {}), - ) - bluesky_post.queue( - post.headlineb, - post.url_for(b=1, _external=True), - post.location, - dict(post.parsed_location or {}), - ) - else: - bluesky_post.queue( - post.headline, - post.url_for(_external=True), - post.location, - dict(post.parsed_location or {}), - ) + bluesky_post.queue( + f'{post.headline} —{post.company_name}', + post.url_for(_external=True), + post.location, + dict(post.parsed_location or {}), + ) add_to_boards.queue(post.id) flash( "Congratulations! Your job post has been published. As a bonus for being an employer on Hasjob, " From 210d048712a0bdb3fd8bf172e13e810e0541e5de Mon Sep 17 00:00:00 2001 From: Kiran Jonnalagadda Date: Mon, 2 Dec 2024 15:29:41 +0530 Subject: [PATCH 3/3] Include employer name and browse URL --- hasjob/socialmedia.py | 10 ++++++++++ hasjob/views/listing.py | 4 +++- 2 files changed, 13 insertions(+), 1 deletion(-) diff --git a/hasjob/socialmedia.py b/hasjob/socialmedia.py index 3ad7e01db..6d294f7cf 100644 --- a/hasjob/socialmedia.py +++ b/hasjob/socialmedia.py @@ -102,6 +102,8 @@ def bluesky_post( url: str, location: str | None = None, parsed_location=None, + employer: str | None = None, + employer_url: str | None = None, ): locationtags = [] if parsed_location: @@ -117,12 +119,20 @@ def bluesky_post( locationtags.append(locationtag) maxlength = 300 # Bluesky allows 300 characters + if employer: + maxlength -= len(employer) + 2 # Minus employer name and prefix if locationtags: # Subtract length of all tags, plus length of visible `#`s and one space maxlength -= len(' '.join(locationtags)) + len(locationtags) + 1 content = atproto_client_utils.TextBuilder() content.link(title[: maxlength - 1] + '…' if len(title) > maxlength else title, url) + if employer: + content.text(' –') + if employer_url: + content.link(employer, employer_url) + else: + content.text(employer) if locationtags: for loc in locationtags: content.text(' ') diff --git a/hasjob/views/listing.py b/hasjob/views/listing.py index 281c0e6f1..d560ecaef 100644 --- a/hasjob/views/listing.py +++ b/hasjob/views/listing.py @@ -1065,10 +1065,12 @@ def confirm_email(domain, hashid, key): ) if app.config['BLUESKY_ENABLED']: bluesky_post.queue( - f'{post.headline} —{post.company_name}', + post.headline, post.url_for(_external=True), post.location, dict(post.parsed_location or {}), + employer=post.company_name, + employer_url=post.url_for('browse', _external=True), ) add_to_boards.queue(post.id) flash(