The script comes from https://www.jianshu.com/p/67d827fbb4e8
Add some modifications to solve the problem of incomplete downloading when a group contains too many items.
from urllib.request import urlopen import json import subprocess, shlex import time import os gitlabToken = 'token' gitlabAddr = 'gitlab.com' # gitlab address targets = ['intel'] # The group or subgroup it belongs to, you can also fill in its ID (ps: leave it empty to clone all groups, use with caution) withShared = 'false' # Whether to include shared projects, the default is false (ps: true will pull projects belonging to other groups) max_projects = '100' #The script can only read one page and set the maximum number of projects. The excess parts will not be downloaded. #-------------------------- counter = 0 procs = [] def get_next(group_id): global counter global procs print('get_next group_id:', group_id) url = gen_next_url(group_id) allProjects = urlopen(url) allProjectsDict = json.loads(allProjects.read().decode()) if len(allProjectsDict) == 0: return for thisProject in allProjectsDict: try: thisProjectURL = thisProject['http_url_to_repo'] thisProjectPath = thisProject['path_with_namespace'] if os.path.exists(thisProjectPath): command = shlex.split('git -C "%s" pull' % (thisProjectPath)) else: print("============ Start cloning %s %s ===========" % (group_id, thisProject['name'])) print('Execute: git clone %s %s' % (thisProjectURL, thisProjectPath)) command = shlex.split('git clone %s %s' % (thisProjectURL, thisProjectPath)) proc = subprocess.Popen(command) procs.append(proc) time.sleep(1) counter + = 1 except Exception as e: print("Error on %s: %s" % (thisProjectURL, e.strerror)) print("============ Waiting for the end of child thread execution ===========") for p in procs: p.wait() p.kill() print("=========== Sub-thread execution ends ===========") return def have_next_projects(group_id): url = gen_next_url(group_id) allProjects = urlopen(url) allProjectsDict = json.loads(allProjects.read().decode()) if len(allProjectsDict) == 0: return False return True def get_sub_groups(parent_id): url = gen_subgroups_url(parent_id) allProjects = urlopen(url) allProjectsDict = json.loads(allProjects.read().decode()) sub_ids = [] if len(allProjectsDict) == 0: return sub_ids for thisProject in allProjectsDict: try: id = thisProject['id'] sub_ids.append(id) except Exception as e: print("Error on %s: %s" % (id, e.strerror)) return sub_ids def cal_next_sub_groupids(parent_id): parent = '' parent = parent_id is_start = 1 parent_list = [] sub_ids = get_sub_groups(parent_id) print('cal_next_sub_groupids sub_ids and parent_id:',sub_ids, parent_id) ok = have_next_projects(parent_id) print('have_next_projects result:', ok) if len(sub_ids)!=0 and ok == False: for i in range(len(sub_ids)): print('cal_next_sub_groupids sub_ids[i]:', sub_ids[i]) parent = sub_ids[i] a = cal_next_sub_groupids(sub_ids[i]) return a if len(sub_ids) !=0 and ok == True: for i in range(len(sub_ids)): print('cal_next_sub_groupids parent:', parent) parent = sub_ids[i] parent_list.append(sub_ids[i]) a = cal_next_sub_groupids(sub_ids[i]) parent_list.extend(a) if len(sub_ids) == 0 and ok == True: print('cal_next_sub_groupids is_start:',is_start) parent_list.append(parent) return parent_list if len(sub_ids) ==0 and ok == False: return parent_list return parent_list def download_code(parent_id): data =cal_next_sub_groupids(parent_id) print('download_code result: ',data) for group_id in data: get_next(group_id) return def gen_next_url(target_id): return "https://%s/api/v4/groups/%s/projects?per_page=%s & amp;private_token=%s & amp;with_shared=%s & amp;order_by=updated_at" % (max_projects, gitlabAddr , target_id, gitlabToken, withShared) def gen_subgroups_url(target_id): return "https://%s/api/v4/groups/%s/subgroups?private_token=%s" % (gitlabAddr, target_id, gitlabToken) def gen_global_url(): return "http://%s/api/v4/projects?private_token=%s" % (gitlabAddr, gitlabToken) def download_global_code(): global counter global procs url = gen_global_url() allProjects = urlopen(url) allProjectsDict = json.loads(allProjects.read().decode()) if len(allProjectsDict) == 0: return for thisProject in allProjectsDict: try: thisProjectURL = thisProject['http_url_to_repo'] thisProjectPath = thisProject['path_with_namespace'] print(thisProjectURL + ' ' + thisProjectPath) if os.path.exists(thisProjectPath): command = shlex.split('git -C "%s" pull' % (thisProjectPath)) else: print("============ Start cloning %s %s ===========" % (group_id, thisProject['name'])) print('Execute: git clone %s %s' % (thisProjectURL, thisProjectPath)) command = shlex.split('git clone %s %s' % (thisProjectURL, thisProjectPath)) proc = subprocess.Popen(command) procs.append(proc) time.sleep(1) counter + = 1 except Exception as e: print("Error on %s: %s" % (thisProjectURL, e.strerror)) print("============ Waiting for the end of child thread execution ===========") for p in procs: p.wait() p.kill() print("=========== Sub-thread execution ends ===========") return def download_targets_code(): for target in targets: url = "https://%s/api/v4/groups?private_token=%s & amp;search=%s" % (gitlabAddr, gitlabToken, target) allProjects = urlopen(url) allProjectsDict = json.loads(allProjects.read().decode()) if len(allProjectsDict) == 0: return target_id = '' for thisProject in allProjectsDict: try: this_name = thisProject['name'] if target == this_name: target_id = thisProject['id'] break except Exception as e: print("Error on %s: %s" % (this_name, e.strerror)) download_code(target_id) return def main(): if len(targets) == 0: download_global_code() else: download_targets_code() print("============ Execution ends, number of cloned items: %s ===========" % (counter)) return main()