Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

lfs: add tests for rate limit retries #341

Merged
merged 2 commits into from
Mar 16, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -39,6 +39,7 @@ Source = "https://github.com/iterative/scmrepo"

[project.optional-dependencies]
tests = [
"aioresponses==0.7.6",
"pytest==8.1.1",
"pytest-sugar==1.0.0",
"pytest-cov==4.1.0",
Expand Down
2 changes: 1 addition & 1 deletion src/scmrepo/git/lfs/client.py
Original file line number Diff line number Diff line change
Expand Up @@ -86,7 +86,7 @@ def loop(self):
def from_git_url(cls, git_url: str) -> "LFSClient":
if git_url.startswith(("ssh://", "git@")):
return _SSHLFSClient.from_git_url(git_url)
if git_url.startswith("https://"):
if git_url.startswith(("http://", "https://")):
return _HTTPLFSClient.from_git_url(git_url)
raise NotImplementedError(f"Unsupported Git URL: {git_url}")

Expand Down
212 changes: 210 additions & 2 deletions tests/test_lfs.py
Original file line number Diff line number Diff line change
@@ -1,16 +1,27 @@
# pylint: disable=redefined-outer-name
import io
from collections import defaultdict
from collections.abc import Sequence
from http import HTTPStatus
from time import time
from typing import Callable

import pytest
from aiohttp import ClientResponseError
from aioresponses import CallbackResult, aioresponses
from pytest_mock import MockerFixture
from pytest_test_utils import TempDirFactory, TmpDir
from yarl import URL

from scmrepo.git import Git
from scmrepo.git.lfs import LFSStorage, Pointer, smudge
from scmrepo.git.lfs import LFSClient, LFSStorage, Pointer, smudge

FOO_OID = "2c26b46b68ffc68ff99b453c1d30413413422d706483bfa0f98a5e886266e7ae"
FOO_SIZE = 3
FOO_POINTER = (
f"version https://git-lfs.github.com/spec/v1\noid sha256:{FOO_OID}\nsize 3\n"
f"version https://git-lfs.github.com/spec/v1\n"
f"oid sha256:{FOO_OID}\n"
f"size {FOO_SIZE}\n"
).encode()


Expand Down Expand Up @@ -74,3 +85,200 @@ def test_lfs(tmp_dir: TmpDir, scm: Git, lfs_objects: TmpDir):
assert fobj.read() == FOO_POINTER
with fs.open("foo.lfs", "rb", raw=False) as fobj:
assert fobj.read() == b"foo"


class CallbackResultRecorder:
    """Keep a per-URL log of the canned results handed out by mock callbacks.

    Each callback produced by :meth:`record` appends its result to the log
    entry for the URL it was invoked with, so a test can later inspect the
    exact sequence of responses that were served for that URL.
    """

    def __init__(self) -> None:
        # Maps ``str(url)`` to the results served for it, in serving order.
        self._results: dict[str, list[CallbackResult]] = defaultdict(list)

    def record(self, result: CallbackResult) -> Callable[..., CallbackResult]:
        """Return a callback that logs and then returns *result*.

        Args:
            result: The canned result the callback hands back on every call.

        Returns:
            A callable taking the request URL (plus arbitrary keyword
            arguments, which are ignored) that appends *result* to the log
            for that URL and returns it.
        """

        def _callback(url: URL, **_) -> CallbackResult:
            self._results[str(url)].append(result)
            return result

        return _callback

    def __getitem__(self, url: str) -> Sequence[CallbackResult]:
        """Return the results served so far for *url*, oldest first.

        A URL that was never requested yields an empty list. The lookup goes
        through ``dict.get`` so that merely reading an unknown URL does not
        create an entry in the underlying ``defaultdict``, and a copy is
        returned so callers cannot alter the recorded history.
        """
        return list(self._results.get(url, ()))


class LFSServerMock:
    """Register canned LFS batch and object responses on a mocker.

    Every response is wrapped with the recorder's ``record`` callback before
    being registered, so the responses that actually get served can be
    inspected through the recorder afterwards.
    """

    def __init__(
        self,
        mocker: aioresponses,
        recorder: CallbackResultRecorder,
        batch_url: str,
        objects_url: str,
    ) -> None:
        self.batch_url = batch_url
        self.objects_url = objects_url
        self._recorder = recorder
        self._mocker = mocker

    def get_object_url(self, oid: str) -> str:
        """Return the download URL for *oid* beneath ``objects_url``."""
        return "{}/{}".format(self.objects_url, oid)

    def _rate_limited(
        self, header: str, value: Callable[[], str]
    ) -> Callable[..., CallbackResult]:
        """Build a recorded 429 callback carrying a single rate-limit header.

        ``value`` is called here, once, when the response is built; a
        response registered with ``repeat=True`` therefore serves the same
        header value every time.
        """
        response = CallbackResult(
            status=HTTPStatus.TOO_MANY_REQUESTS,
            headers={header: value()},
            reason="Too many requests",
        )
        return self._recorder.record(response)

    def mock_batch_200(self, pointer: Pointer) -> None:
        """Register a successful batch response describing *pointer*.

        The response advertises one object whose ``download`` action points
        at :meth:`get_object_url` for the pointer's oid.
        """
        download_action = {"href": self.get_object_url(pointer.oid)}
        object_entry = {
            "oid": pointer.oid,
            "size": pointer.size,
            "authenticated": True,
            "actions": {"download": download_action},
        }
        response = CallbackResult(
            status=HTTPStatus.OK,
            headers={"Content-Type": "application/vnd.git-lfs+json"},
            payload={
                "transfer": "basic",
                "objects": [object_entry],
                "hash_algo": "sha256",
            },
        )
        self._mocker.post(self.batch_url, callback=self._recorder.record(response))

    def mock_batch_429(
        self, header: str, value: Callable[[], str], *, repeat: bool = False
    ) -> None:
        """Register a 429 response for POSTs to the batch URL.

        Args:
            header: Name of the rate-limit header to send.
            value: Zero-argument callable producing the header value.
            repeat: Forwarded to the mocker's ``repeat`` option.
        """
        self._mocker.post(
            self.batch_url,
            callback=self._rate_limited(header, value),
            repeat=repeat,
        )

    def mock_object_200(self, oid: str) -> None:
        """Register a successful GET response for the object *oid*."""
        response = CallbackResult(
            status=HTTPStatus.OK,
            body=f"object {oid} data",
        )
        self._mocker.get(
            self.get_object_url(oid),
            callback=self._recorder.record(response),
        )

    def mock_object_429(
        self,
        oid: str,
        header: str,
        value: Callable[[], str],
        *,
        repeat: bool = False,
    ) -> None:
        """Register a 429 response for GETs of the object *oid*.

        Args:
            oid: Object id whose download URL is mocked.
            header: Name of the rate-limit header to send.
            value: Zero-argument callable producing the header value.
            repeat: Forwarded to the mocker's ``repeat`` option.
        """
        self._mocker.get(
            self.get_object_url(oid),
            callback=self._rate_limited(header, value),
            repeat=repeat,
        )


@pytest.mark.parametrize(
    "rate_limit_header, rate_limit_value",
    [
        ("Retry-After", lambda: "1"),
        ("RateLimit-Reset", lambda: str(int(time()) + 1)),
        ("X-RateLimit-Reset", lambda: str(int(time()) + 1)),
    ],
)
def test_rate_limit_retry(
    storage: LFSStorage, rate_limit_header: str, rate_limit_value: Callable[[], str]
):
    """A single 429 on each endpoint is followed by a successful retry.

    Both the batch URL and the object URL first answer 429 with the
    parametrized rate-limit header and then 200; the recorder must show
    exactly that sequence for each URL once the download returns.
    """
    client = LFSClient.from_git_url("http://git.example.com/namespace/project.git")
    recorder = CallbackResultRecorder()
    pointer = Pointer(oid=FOO_OID, size=FOO_SIZE)

    with aioresponses() as mocked:
        lfs_server = LFSServerMock(
            mocked,
            recorder,
            f"{client.url}/objects/batch",
            "http://git-lfs.example.com",
        )
        # Registration order matters: the 429 must be queued before the 200.
        lfs_server.mock_batch_429(rate_limit_header, rate_limit_value)
        lfs_server.mock_batch_200(pointer)
        lfs_server.mock_object_429(FOO_OID, rate_limit_header, rate_limit_value)
        lfs_server.mock_object_200(FOO_OID)

        client.download(storage, [pointer])

        batch_statuses = [r.status for r in recorder[lfs_server.batch_url]]
        assert batch_statuses == [429, 200]

        object_statuses = [
            r.status for r in recorder[lfs_server.get_object_url(FOO_OID)]
        ]
        assert object_statuses == [429, 200]


@pytest.mark.parametrize(
    "rate_limit_header, rate_limit_value",
    [
        ("Retry-After", lambda: "1"),
        ("RateLimit-Reset", lambda: str(int(time()) + 1)),
        ("X-RateLimit-Reset", lambda: str(int(time()) + 1)),
    ],
)
def test_rate_limit_max_retries_batch(
    storage: LFSStorage, rate_limit_header: str, rate_limit_value: Callable[[], str]
):
    """A batch endpoint that always answers 429 makes the download fail.

    The download must raise ``ClientResponseError`` and the recorder must
    show five 429 responses for the batch URL.
    """
    client = LFSClient.from_git_url("http://git.example.com/namespace/project.git")
    recorder = CallbackResultRecorder()
    pointer = Pointer(oid=FOO_OID, size=FOO_SIZE)

    with aioresponses() as mocked:
        lfs_server = LFSServerMock(
            mocked,
            recorder,
            f"{client.url}/objects/batch",
            "http://git-lfs.example.com",
        )
        lfs_server.mock_batch_429(rate_limit_header, rate_limit_value, repeat=True)

        with pytest.raises(ClientResponseError, match="Too many requests"):
            client.download(storage, [pointer])

        # NOTE(review): 5 presumably mirrors the client's retry limit — confirm.
        batch_statuses = [r.status for r in recorder[lfs_server.batch_url]]
        assert batch_statuses == [429] * 5


@pytest.mark.parametrize(
    "rate_limit_header, rate_limit_value",
    [
        ("Retry-After", lambda: "1"),
        ("RateLimit-Reset", lambda: str(int(time()) + 1)),
        ("X-RateLimit-Reset", lambda: str(int(time()) + 1)),
    ],
)
def test_rate_limit_max_retries_objects(
    storage: LFSStorage, rate_limit_header: str, rate_limit_value: Callable[[], str]
):
    """An object endpoint that always answers 429 makes the download fail.

    The batch request succeeds once, every object GET answers 429, the
    download must raise ``ClientResponseError``, and the recorder must show
    one 200 for the batch URL and five 429 responses for the object URL.
    """
    client = LFSClient.from_git_url("http://git.example.com/namespace/project.git")
    recorder = CallbackResultRecorder()
    pointer = Pointer(oid=FOO_OID, size=FOO_SIZE)

    with aioresponses() as mocked:
        lfs_server = LFSServerMock(
            mocked,
            recorder,
            f"{client.url}/objects/batch",
            "http://git-lfs.example.com",
        )
        lfs_server.mock_batch_200(pointer)
        lfs_server.mock_object_429(
            FOO_OID, rate_limit_header, rate_limit_value, repeat=True
        )

        with pytest.raises(ClientResponseError, match="Too many requests"):
            client.download(storage, [pointer])

        batch_statuses = [r.status for r in recorder[lfs_server.batch_url]]
        assert batch_statuses == [200]

        # NOTE(review): 5 presumably mirrors the client's retry limit — confirm.
        object_statuses = [
            r.status for r in recorder[lfs_server.get_object_url(FOO_OID)]
        ]
        assert object_statuses == [429] * 5
Loading