1
1
#! /bin/bash
2
2
PDT=201905
3
+ PDTdash=2019-05-01
3
4
DT=201910
4
5
# Get updated repos only: updated since last gathering
5
6
# python3 ghUpdatedRepos.py 2018-12-01 gh201813 repos &> ghReposList201813.updt &
6
- python3 ghUpdatedRepos.py 2019-05-01 gh$DT repos &> ghReposList$DT.updt &
7
+ cat tokens_date | while read r ; do echo $r | python3 ghUpdatedRepos.new.py gh$DT repos &> ghReposList$(echo $r | cut -d ' ' -f2).updt & done
7
8
8
9
# BB: need to extract all, no way to check for updated ones
9
10
# python3 bbRepos.py 1980-01-01 bitbucket$DT 2013-00-01 &> bbRepos${DT}0.out &
@@ -15,7 +16,7 @@ python3 ghUpdatedRepos.py 2019-05-01 gh$DT repos &> ghReposList$DT.updt &
15
16
# python3 bbRepos.py 2017-05-03 bitbucket$DT 2018-05-03 &> bbRepos${DT}6.out &
16
17
# python3 bbRepos.py 2018-05-03 bitbucket$DT 2022-05-03 &> bbRepos${DT}7.out &
17
18
# get only new, use heads for existing repos
18
- python3 bbRepos.py 2019-02-01 bitbucket$DT 2022-05-03 &> bbRepos${DT}0.out &
19
+ python3 bbRepos.py $PDTdash bitbucket$DT 2022-05-03 &> bbRepos${DT}0.out &
19
20
20
21
21
22
# SF
@@ -64,9 +65,9 @@ done | gzip > cgit.kde.org.$DT.heads &
64
65
# https://gitlab.gnome.org/explore/projects?page=300&sort=latest_activity_desc
65
66
# insert username/password to prevent password requests
66
67
for p in {1..300}
67
- do wget "https://gitlab.gnome.org/explore/projects?page=$p" -O - 2> /dev/null | perl -ane 'chop();if (m|^<a class="text-plain" href="|){s|<a class="text-plain" href="||;s|".*||;s|^/||;print "https://a:a@gitlab.gnome.org/$_\n"}'
68
+ do wget "https://gitlab.gnome.org/explore/projects?page=$p" -O - 2> /dev/null | perl -ane 'chop();if (m|^<a class="text-plain" href="|){s|<a class="text-plain" href="||;s|".*||;s|^/||;print "https://a:a\@gitlab.gnome.org/$_\n"}'
68
69
done | sort -u > gitlab.gnome.org.$DT
69
- cat gitlab.gnome.org.$DT | while read r; do a=$(git ls-remote $r | awk '{print ";"$1}'); echo $r$a | sed 's/ //g'; done | gzip > gitlab.gnome.org.heads.$DT &
70
+ cat gitlab.gnome.org.$DT | while read r; do a=$(git ls-remote $r | awk '{print ";"$1}'); echo $r$a | sed 's/ //g'; done | gzip > gitlab.gnome.org.$DT.heads &
70
71
71
72
72
73
# pages 1-1530
@@ -132,13 +133,13 @@ cat git.kernel.org.$DT | while read r; do a=$(git ls-remote $r | awk '{print ";"
132
133
133
134
134
135
wget http://git.savannah.gnu.org/cgit -O git.savannah.gnu.org.html
135
- perl -ane "while (m|<td class='sublevel-repo'><a title='[^']*' href='([^']*)'|g){print \"https://git.savannah.gnu.org\$1\n\";}" < git.savannah.gnu.org.html | sed 's|/cgit/|/git/|' | sort -u | > git.savannah.gnu.org.$DT
136
+ perl -ane "while (m|<td class='sublevel-repo'><a title='[^']*' href='([^']*)'|g){print \"https://git.savannah.gnu.org\$1\n\";}" < git.savannah.gnu.org.html | sed 's|/cgit/|/git/|' | sort -u > git.savannah.gnu.org.$DT
136
137
cat git.savannah.gnu.org.$DT | while read r; do a=$(git ls-remote $r | awk '{print ";"$1}'); echo $r$a | sed 's/ //g'; done | gzip > git.savannah.gnu.org.$DT.heads &
137
138
138
139
wait
139
140
140
141
# Get update repos for GL
141
- python3 listU.py gl$DT repos '{ "last_activity_at" : { "$gt" : "2019-02-01" }}' http_url_to_repo | sed "s|^b'||;s|'$||" > gl$DT.new
142
+ python3 listU.py gl$DT repos '{ "last_activity_at" : { "$gt" : "'"$PDTdash"'" }}' http_url_to_repo | sed "s|^b'||;s|'$||" > gl$DT.new
142
143
cat gl$DT.new | sed 's|https://gitlab.com/|gl:|' | while read r; do a=$(git ls-remote $r | awk '{print ";"$1}'); echo $r$a | sed 's/ //g';
143
144
done | gzip > gl$DT.new.heads &
144
145
@@ -152,7 +153,7 @@ do cat gh$DT.u.$j | while read r; do
152
153
done
153
154
154
155
# Get updated bb (do heads on all 2M?)
155
- python3 listU.py bitbucket$DT repos '{ "updated_on" : { "$gt" : "2019-02-01" } }' full_name | \
156
+ python3 listU.py bitbucket$DT repos '{ "updated_on" : { "$gt" : "'"$PDTdash"'" } }' full_name | \
156
157
sed "s|^b'||;s|'$||" | sort -u > bitbucket$DT.new
157
158
split -n l/10 -da1 bitbucket$DT.new bitbucket$DT.new.
158
159
for j in {0..8}
0 commit comments