Skip to content

Commit

Permalink
Move from seatemperature.info to seatemperature.org
Browse files Browse the repository at this point in the history
  • Loading branch information
torbencarstens committed Dec 7, 2023
1 parent 2a0ac82 commit 68ab5aa
Show file tree
Hide file tree
Showing 3 changed files with 66 additions and 77 deletions.
75 changes: 0 additions & 75 deletions lake_scrapers/scrapers/seatemperatureinfo.py

This file was deleted.

64 changes: 64 additions & 0 deletions lake_scrapers/scrapers/seatemperatureorg.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,64 @@
import os
import re
from datetime import datetime

from lake_scrapers import convert_timestamp, LakeTemperatureItem
from lake_scrapers.scraper import Scraper


class SeaTemperatureOrgScraper(Scraper):
    """Scrape the current sea temperature from seatemperature.org pages.

    Each key of ``data`` is a page path relative to ``base_url``.  Its value
    holds the ``UUID`` reported for that location (read from the environment
    when the class body runs; ``None`` if the variable is unset) and the
    ``regex`` used to extract the temperature from the page text.
    """

    # Every configured page currently uses the same pattern, so it is
    # compiled once and shared.  The single ``.`` before ``C`` accepts
    # whatever one character sits between the number and the unit letter.
    _TEMPERATURE_REGEX = re.compile(
        r"^(?P<temperature>\d+(\.\d+)?).C\s+",
        re.IGNORECASE,
    )

    # The per-entry "regex" key is kept so a location can still override the
    # shared pattern without touching ``parse``.
    data = {
        "europe/italy/sorrento.htm": {
            "UUID": os.getenv("SORRENTO_UUID"),
            "regex": _TEMPERATURE_REGEX,
        },
        "europe/spain/santander.htm": {
            "UUID": os.getenv("SANTANDER_UUID"),
            "regex": _TEMPERATURE_REGEX,
        },
        "europe/greece/heraklion.htm": {
            "UUID": os.getenv("HERAKLION_UUID"),
            "regex": _TEMPERATURE_REGEX,
        },
        "north-america/canada/vancouver.htm": {
            "UUID": os.getenv("VANCOUVER_UUID"),
            "regex": _TEMPERATURE_REGEX,
        },
    }

    base_url = "https://www.seatemperature.org"
    # Derived from ``data`` so the two cannot drift apart; dicts preserve
    # insertion order, so the order matches the entries above.
    paths = list(data)

    def parse(self, response, **kwargs):
        """Build a ``LakeTemperatureItem`` from one location page.

        The request path selects the matching ``data`` entry, the text of
        the first ``<span>`` inside ``div#sea-temperature`` is matched
        against that entry's regex, and the item is stamped with the current
        time.  The temperature is passed on as the matched string.

        Raises:
            KeyError: the request path is not a key of ``data``.
            ValueError: the expected markup is missing or the text does not
                match the temperature pattern.
        """
        path = response.request.url.path.lstrip("/")
        site = self.data[path]

        soup = self.soup(response)
        container = soup.find("div", attrs={"id": "sea-temperature"})
        if container is None:
            raise ValueError(f"{path}: no div with id 'sea-temperature' found")

        span = container.find("span")
        if span is None:
            raise ValueError(f"{path}: no <span> inside div#sea-temperature")

        # ``.string`` can be None (presumably when the span does not hold a
        # single text node); fail with context instead of on ``.strip()``.
        text = span.string
        if text is None:
            raise ValueError(f"{path}: temperature <span> has no single text node")

        content = text.strip()
        match = site["regex"].search(content)
        if match is None:
            raise ValueError(
                f"{path}: could not extract a temperature from {content!r}"
            )
        temperature = match.group("temperature")

        timestamp = datetime.now().timestamp()
        timestamp = convert_timestamp(timestamp, is_timestamp=True)

        return LakeTemperatureItem(
            temperature=temperature, timestamp=timestamp, uuid=site["UUID"]
        )
4 changes: 2 additions & 2 deletions main.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
from lake_scrapers.scrapers.blaarmeersen import BlaarmeersenScraper
from lake_scrapers.scrapers.cuxhaven import CuxhavenScraper
from lake_scrapers.scrapers.pegelonline import PegelonlineScraper
from lake_scrapers.scrapers.seatemperatureinfo import SeaTemperatureInfoScraper
from lake_scrapers.scrapers.seatemperatureorg import SeaTemperatureOrgScraper
from lake_scrapers.scrapers.woog import WoogScraper


Expand All @@ -24,7 +24,7 @@ def process_item(item: LakeTemperatureItem, logger):
BlaarmeersenScraper,
CuxhavenScraper,
PegelonlineScraper,
SeaTemperatureInfoScraper,
SeaTemperatureOrgScraper,
WoogScraper,
]
# SCRAPER_CLASSES = [WoogSpider]
Expand Down

0 comments on commit 68ab5aa

Please sign in to comment.