From 22a23862b475ba7727eff52b176e28278d4c8a04 Mon Sep 17 00:00:00 2001
From: Joakim Soderlund
Date: Fri, 2 Oct 2015 13:00:55 +0200
Subject: [PATCH] Add fetcher for Fimfiction

---
Review notes (free text placed here, between the "---" line and the
diffstat, is not part of the commit message or of the diff):

* This patch was recovered from a copy whose line breaks had been
  collapsed and whose angle-bracketed text had been stripped. Line
  structure and indentation are reconstructed from Python syntax and
  from the hunk headers (5 + 74 = 79 added lines). TODO: confirm the
  exact whitespace against commit 22a2386 before applying.
* The author's e-mail address is missing from the "From:" header and
  cannot be recovered from this copy. TODO: restore it.
* fetch_data, chapter check: the marker literal survived only as two
  line breaks. It is written as b'\n\n' below so the code parses, but
  it was presumably an HTML marker. TODO: restore the real value.
* fetch_data, completeness check: the marker literal survived only as
  b'', which would make the check a no-op. It is written as b'</html>'
  below because the download is requested with html=True. This is a
  reconstruction. TODO: confirm.

 fimfarchive/fetchers.py | 79 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 79 insertions(+)

diff --git a/fimfarchive/fetchers.py b/fimfarchive/fetchers.py
index d605b45..b54c228 100644
--- a/fimfarchive/fetchers.py
+++ b/fimfarchive/fetchers.py
@@ -22,6 +22,11 @@ Fetchers for Fimfarchive.
 #
 
 
+import requests
+
+from fimfarchive.exceptions import InvalidStoryError, StorySourceError
+
+
 class Fetcher:
     """
     Abstract base class for story fetchers.
@@ -95,3 +100,77 @@ class Fetcher:
             StorySourceError: If source does not return any data.
         """
         raise NotImplementedError()
+
+
+class FimfictionFetcher(Fetcher):
+    """
+    Fetcher for Fimfiction.
+    """
+    data_path = 'https://www.fimfiction.net/download_story.php'
+    meta_path = 'https://www.fimfiction.net/api/story.php'
+
+    def close(self):
+        pass
+
+    def get(self, url, **kwargs):
+        """
+        Performs an HTTP GET request.
+
+        Args:
+            url: Target of the HTTP request.
+            **kwargs: HTTP query parameters.
+
+        Returns:
+            Response: A new `Response` object.
+
+        Raises:
+            StorySourceError: If the server does not return HTTP 200 OK.
+        """
+        try:
+            response = requests.get(url, params=kwargs)
+        except IOError as e:
+            raise StorySourceError("Could not read from server.") from e
+
+        if not response.ok:
+            raise StorySourceError(
+                "Server responded with HTTP {} {}."
+                .format(response.status_code, response.reason)
+            )
+
+        return response
+
+    def fetch_data(self, pk):
+        response = self.get(self.data_path, story=pk, html=True)
+        data = response.content
+
+        if len(data) == 0:
+            raise InvalidStoryError("Server returned empty response body.")
+
+        if b'\n\n' not in data:
+            raise InvalidStoryError("Server did not return any chapters.")
+
+        if not data.endswith(b'</html>'):
+            raise StorySourceError("Server returned incomplete response.")
+
+        return data
+
+    def fetch_meta(self, pk):
+        response = self.get(self.meta_path, story=pk)
+
+        try:
+            meta = response.json()
+        except ValueError as e:
+            raise StorySourceError("Server did not return valid JSON.") from e
+
+        if 'error' in meta:
+            message = meta['error']
+
+            if message == 'Invalid story id':
+                raise InvalidStoryError("Story does not exist.")
+            else:
+                raise StorySourceError(message)
+
+        if 'story' not in meta:
+            raise StorySourceError("Server did not return a story object.")
+
+        return meta['story']