1.3. Dependency Injection
Dependency injection, as a software design pattern, has number of advantages that are common for each language (including Python):
Dependency Injection decreases coupling between a class and its dependency.
Because dependency injection doesn't require any change in code behavior it can be applied to legacy code as a refactoring. The result is clients that are more independent and that are easier to unit test in isolation using stubs or mock objects that simulate other objects not under test. This ease of testing is often the first benefit noticed when using dependency injection.
Dependency injection can be used to externalize a system's configuration details into configuration files allowing the system to be reconfigured without recompilation (rebuilding). Separate configurations can be written for different situations that require different implementations of components. This includes, but is not limited to, testing.
Reduction of boilerplate code in the application objects since all work to initialize or set up dependencies is handled by a provider component.
Dependency injection allows a client to remove all knowledge of a concrete implementation that it needs to use. This helps isolate the client from the impact of design changes and defects. It promotes reusability, testability and maintainability.
Dependency injection allows a client the flexibility of being configurable. Only the client's behavior is fixed. The client may act on anything that supports the intrinsic interface the client expects.
Dependency injection:
from dataclasses import dataclass
from datetime import timedelta
from typing import Any
@dataclass
class Cache:
expiration: timedelta = timedelta(days=30)
location: str | None = None
def get(self, key: str) -> Any:
raise NotImplementedError
def set(self, key: str, value: Any) -> None:
raise NotImplementedError
def is_valid(self, key) -> bool:
raise NotImplementedError
class CacheFilesystem(Cache):
"""Cache using files"""
class CacheMemory(Cache):
"""Cache using memory"""
class CacheDatabase(Cache):
"""Cache using database"""
@dataclass
class HTTP:
_cache: CacheInterface
def _fetch(self, url):
return ...
def get(self, url):
if self._cache.is_valid(url):
# Use cached data
self._cache.get(url)
else:
data = self._fetch(url)
self._cache.set(url, data)
if __name__ == '__main__':
database = CacheDatabase(location='sqlite3:///tmp/http-cache.sqlite3')
filesystem = CacheFilesystem(location='/tmp/')
memory = CacheMemory(expiration=timedelta(hours=2))
http1 = HTTP(_cache=database)
http1.get('https://python3.info')
http2 = HTTP(_cache=filesystem)
http2.get('https://python3.info')
http3 = HTTP(_cache=memory)
http3.get('https://python3.info')
import os
from dataclasses import dataclass, field
from hashlib import sha1
from datetime import timedelta, datetime
from http import HTTPStatus
import requests
class CacheInterface:
def _get_location(self, key: str) -> str:
raise NotImplementedError
def get(self, key: str) -> str:
raise NotImplementedError
def set(self, key: str, value: str) -> None:
raise NotImplementedError
def clear(self, key: str) -> None:
raise NotImplementedError
def is_valid(self, key: str) -> bool:
raise NotImplementedError
@dataclass
class CacheMemory(CacheInterface):
expiration: timedelta = timedelta(seconds=30)
_data: dict[str, str] = field(default_factory=dict)
def is_valid(self, key: str) -> bool:
return key in self._data
def set(self, key: str, value: str) -> None:
self._data[key] = value
def get(self, key: str) -> str:
return self._data[key]
@dataclass
class CacheFilesystem(CacheInterface):
location: str = "/tmp/cache/"
expiration: timedelta = timedelta(seconds=30)
def __post_init__(self):
if os.path.isfile(self.location):
os.remove(self.location)
if not os.path.isdir(self.location):
os.makedirs(self.location, exist_ok=True)
def _get_location(self, key: str) -> str:
filename = sha1(key.encode()).hexdigest()
return os.path.join(self.location, filename)
def is_valid(self, key: str) -> bool:
location = self._get_location(key)
if not os.path.isfile(location):
return False
timestamp = os.path.getmtime(location)
modification_date = datetime.fromtimestamp(timestamp)
last_update = datetime.now() - modification_date
return last_update < self.expiration:
def get(self, key: str) -> str:
location = self._get_location(key)
with open(location) as file:
return file.read()
def set(self, key: str, value: str) -> None:
location = self._get_location(key)
with open(location, mode="w") as file:
file.write(value)
@dataclass
class HTTPGateway:
_cache: CacheInterface = CacheMemory
def get(self, url):
if self._cache.is_valid(url):
return self._cache.get(url)
else:
data = self._fetch(url)
self._cache.set(url, data)
return data
def _fetch(self, url):
response = requests.get(url)
if response.status_code == HTTPStatus.OK:
return response.text
else:
raise ConnectionError()
@dataclass
class CacheDatabase(CacheInterface):
location: str
if __name__ == '__main__':
cache = CacheFilesystem(location="/tmp/cache/", expiration=timedelta(seconds=1))
http = HTTPGateway(cache)
URL = 'https://python3.info/_static/iris-clean.csv'
data = http.get(URL)
print(data)