1
0
Fork 0
mirror of https://github.com/clockfort/GitHub-Backup.git synced 2025-03-23 00:00:05 +01:00
GitHub-Backup/github-backup.py

148 lines
4.7 KiB
Python
Raw Normal View History

2012-06-23 14:59:50 -04:00
#!/usr/bin/env python
2013-08-02 01:21:55 +02:00
"""
Authors: Anthony Gargiulo (anthony@agargiulo.com)
Steffen Vogel (post@steffenvogel.de)
Created: Fri Jun 15 2012
"""
2019-05-05 01:56:22 +02:00
from pygithub3 import Github
from argparse import ArgumentParser
import subprocess
import os
2019-05-05 01:56:22 +02:00
def main():
2019-05-05 01:48:21 +02:00
parser = init_parser()
args = parser.parse_args()
2019-05-05 01:48:21 +02:00
if not args.git:
args.git = []
2019-05-05 01:48:21 +02:00
# Process args
if args.cron:
args.git.append("--quiet")
2013-08-02 01:21:55 +02:00
2019-05-05 01:48:21 +02:00
# Make the connection to Github here.
2019-05-05 01:56:22 +02:00
config = {'user': args.username}
2019-05-05 01:48:21 +02:00
args.backupdir = args.backupdir.rstrip("/")
2019-05-05 01:48:21 +02:00
if (args.token):
config['token'] = args.token
2019-05-05 01:48:21 +02:00
if (args.password):
config['password'] = args.password
config['login'] = args.username
2019-05-05 01:48:21 +02:00
# if both password and token are specified, the token will be
# used, according to pygithub3 sources
# however, the username isn't required when using a token
if (args.token):
config['token'] = args.token
2013-10-15 01:07:34 +11:00
2019-05-05 01:48:21 +02:00
gh = Github(**config)
2019-05-05 01:48:21 +02:00
# Get all repos
2019-05-05 01:56:22 +02:00
users = {}
2019-05-05 01:48:21 +02:00
user_repos = gh.repos.list(user=args.username).all()
for repo in user_repos:
if repo.owner.login not in users:
users[repo.owner.login] = gh.users.get(repo.owner.login)
2019-02-02 21:27:20 +01:00
2019-05-05 01:48:21 +02:00
repo.user = users[repo.owner.login]
2019-05-05 01:56:22 +02:00
fullrepo = gh.repos.get(repo.owner.login, repo.name)
is_fork = hasattr(fullrepo, 'parent') and hasattr(fullrepo, 'source')
if not (args.skip_forks and is_fork):
2019-05-05 01:48:21 +02:00
process_repo(repo, args)
2013-08-02 01:21:55 +02:00
def init_parser():
2019-05-05 01:48:21 +02:00
"""
set up the argument parser
"""
parser = ArgumentParser(description="makes a backup of all of a github user's repositories")
parser.add_argument("username", help="A Github username")
parser.add_argument("backupdir", help="The folder where you want your backups to go")
parser.add_argument("-c", "--cron", help="Use this when running from a cron job", action="store_true")
parser.add_argument("-m", "--mirror", help="Create a bare mirror", action="store_true")
parser.add_argument("-f", "--skip-forks", help="Skip forks", action="store_true")
parser.add_argument("-g", "--git", nargs="+", help="Pass extra arguments to git", default="", metavar="ARGS")
parser.add_argument("-S", "--ssh", help="Use SSH protocol", action="store_true")
parser.add_argument("-s", "--suffix", help="Add suffix to repository directory names", default="")
parser.add_argument("-p", "--password", help="Authenticate with Github API")
parser.add_argument("-P", "--prefix", help="Add prefix to repository directory names", default="")
parser.add_argument("-t", "--token", help="Authenticate with Github API using OAuth token", default="")
parser.add_argument("-o", "--organization", help="Backup Organizational repositories", metavar="ORG")
return parser
2019-05-05 01:56:22 +02:00
2012-06-23 15:49:34 -04:00
def process_repo(repo, args):
2019-05-05 01:48:21 +02:00
if not args.cron:
2019-05-05 01:56:22 +02:00
print("Processing repo: %s" % (repo.full_name))
2012-06-23 15:49:34 -04:00
2019-05-05 01:48:21 +02:00
dir = "%s/%s" % (args.backupdir, repo.name + args.suffix)
config = "%s/%s" % (dir, "config" if args.mirror else ".git/config")
2019-05-05 01:48:21 +02:00
if not os.access(config, os.F_OK):
if not args.cron:
print("Repo doesn't exists, lets clone it")
2019-02-02 21:27:20 +01:00
2019-05-05 01:48:21 +02:00
clone_repo(repo, dir, args)
else:
if not args.cron:
print("Repo already exists, let's try to update it instead")
2013-08-02 01:21:55 +02:00
2019-05-05 01:48:21 +02:00
update_repo(repo, dir, args)
2013-08-02 00:50:54 +02:00
2019-02-02 21:27:20 +01:00
def clone_repo(repo, dir, args):
2019-05-05 01:48:21 +02:00
if args.mirror:
git("clone", ["--mirror", repo.git_url, dir], args.git, dir)
else:
git("clone", [repo.git_url, dir], args.git, dir)
2014-06-26 00:14:25 +02:00
2013-08-02 01:21:55 +02:00
def update_repo(repo, dir, args):
2019-05-05 01:48:21 +02:00
# GitHub => Local
2019-05-05 01:56:22 +02:00
# TODO: use subprocess package and fork git into
# background (major performance boost expected)
2019-05-05 01:48:21 +02:00
if args.mirror:
git("fetch", ["--prune"], args.git, dir)
else:
git("pull", gargs=args.git, gdir=dir)
# Fetch description and owner (useful for gitweb, cgit etc.)
if repo.description:
2019-05-05 01:56:22 +02:00
git("config", ["--local", "gitweb.description",
repo.description.encode("utf-8")], gdir=dir)
2019-05-05 01:48:21 +02:00
if repo.user.name and repo.user.email:
2019-05-05 01:56:22 +02:00
owner = "%s <%s>" % (repo.user.name.encode("utf-8"),
repo.user.email.encode("utf-8"))
git("config", ["--local", "gitweb.owner", owner], gdir=dir)
2019-05-05 01:48:21 +02:00
git("config", ["--local", "cgit.name", str(repo.name)], gdir=dir)
git("config", ["--local", "cgit.defbranch", str(repo.default_branch)], gdir=dir)
git("config", ["--local", "cgit.clone-url", str(repo.clone_url)], gdir=dir)
2019-05-05 01:56:22 +02:00
def git(gcmd, args=[], gargs=[], gdir=""):
2019-05-05 01:48:21 +02:00
cmd = ["git"]
if gdir:
cmd.append("--git-dir")
cmd.append(gdir)
cmd.append(gcmd)
cmd.extend(gargs)
cmd.extend(args)
2019-05-05 01:48:21 +02:00
subprocess.call(cmd)
if __name__ == "__main__":
2019-05-05 01:48:21 +02:00
main()