07:13:24 softwareheritage@belvedere:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/keybase/client' and ovs.type='git' order by date desc limit 4;
11:02:07 softwareheritage@belvedere:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/torvalds/linux' and ovs.type='git' order by date desc limit 2;
11:28:34 softwareheritage@belvedere:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/rdicosmo/parmap' and ovs.type='git' order by date desc limit 2;
11:42:22 softwareheritage@belvedere:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/hylang/hy' and ovs.type='git' order by date desc limit 2;
13:06:38 softwareheritage@belvedere:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/hylang/hyrule' and ovs.type='git' order by date desc limit 2;
11:59:20 softwareheritage@belvedere:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/kubernetes/kubernetes' and ovs.type='git' order by date desc limit 2;
13:15:44 softwareheritage@belvedere:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/NixOS/nixpkgs' and ovs.type='git' order by date desc limit 2;
dulwich 0.20.25 # ----------------> assuming it's ok to diverge a bit
(ve) swhworker@worker0:~$ pip list | grep swh.loader.git
swh.loader.git 1.0.1
(ve) swhworker@worker0:~/ve$ time swh loader -C /etc/softwareheritage/loader_git.yml run git https://github.com/keybase/client
INFO:swh.loader.git.loader.GitLoader:Load origin 'https://github.com/keybase/client' with type 'git'
Enumerating objects: 868404, done.
Counting objects: 100% (169/169), done.
Compressing objects: 100% (74/74), done.
Total 868404 (delta 104), reused 133 (delta 93), pack-reused 868235
INFO:swh.loader.git.loader.GitLoader:Listed 19852 refs for repo https://github.com/keybase/client
{'status': 'eventful'}
real 183m33.441s
user 56m13.315s
sys 3m4.313s
#+end_src
A second visit was then run, which finished with the same snapshot:
#+begin_src sh
(ve) swhworker@worker0:~/ve$ time swh loader -C /etc/softwareheritage/loader_git.yml run git https://github.com/keybase/client
INFO:swh.loader.git.loader.GitLoader:Load origin 'https://github.com/keybase/client' with type 'git'
INFO:swh.loader.git.loader.GitLoader:Listed 19852 refs for repo https://github.com/keybase/client
{'status': 'uneventful'}
real 0m18.420s
user 0m11.367s
sys 0m0.146s
#+end_src
The resulting snapshot is: \xcddaccc0a2d452098701dec921731e8c96630e2b
#+begin_src sql
07:15:14 swh@db1:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/keybase/client' and ovs.type='git' order by date desc limit 4;
11:59:26 swh@db1:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/torvalds/linux' and ovs.type='git' order by date desc limit 2;
11:42:11 swh@db1:5432=> select * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/rdicosmo/parmap' and ovs.type='git' order by date desc limit 2;
11:42:14 swh@db1:5432=> select * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/hylang/hy' and ovs.type='git' order by date desc limit 2;
13:03:26 swh@db1:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/hylang/hyrule' and ovs.type='git' order by date desc limit 2;
11:59:29 swh@db1:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/kubernetes/kubernetes' and ovs.type='git' order by date desc limit 2;
09:57:29 swh@db1:5432=> select now(), * from origin o inner join origin_visit_status ovs on o.id=ovs.origin where o.url = 'https://github.com/NixOS/nixpkgs' and ovs.type='git' order by date desc limit 2;