forked from importers/git-importer
		
	Compare commits
	
		
			20 Commits
		
	
	
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
|  | c8455c22dc | ||
|  | 94fdb3b442 | ||
|  | f2358446da | ||
| 9660e633af | |||
| 85b9ed5e75 | |||
| 86f82325d8 | |||
|  | 39ba616226 | ||
| 531dbc7c1b | |||
|  | 1318f9e0c4 | ||
|  | d563076d9e | ||
| b11b3f1adb | |||
|  | 479738d4b2 | ||
|  | 2d04136ca5 | ||
|  | 40ad64ddff | ||
|  | 6bd5d72100 | ||
|  | 022ae5ab58 | ||
|  | 2ff8ed76d0 | ||
|  | 5f228dc046 | ||
|  | 4e07d8272e | ||
|  | 2a3475ab6e | 
							
								
								
									
										2
									
								
								Makefile
									
									
									
									
									
								
							
							
						
						
									
										2
									
								
								Makefile
									
									
									
									
									
								
							| @@ -9,5 +9,5 @@ test: | |||||||
| update-packages: | update-packages: | ||||||
| 	f=$$(mktemp) ;\ | 	f=$$(mktemp) ;\ | ||||||
| 	osc api /source/openSUSE:Factory?view=info | grep -v lsrcmd5 | grep srcmd5= | sed -e 's,.*package=",,; s,".*,,' | grep -v : > $$f ;\ | 	osc api /source/openSUSE:Factory?view=info | grep -v lsrcmd5 | grep srcmd5= | sed -e 's,.*package=",,; s,".*,,' | grep -v : > $$f ;\ | ||||||
| 	echo _project >> $$f ;\ | 	echo _project >> $$f;\ | ||||||
| 	mv $$f packages | 	mv $$f packages | ||||||
|   | |||||||
							
								
								
									
										19
									
								
								README.md
									
									
									
									
									
								
							
							
						
						
									
										19
									
								
								README.md
									
									
									
									
									
								
							| @@ -1,5 +1,18 @@ | |||||||
| sudo zypper in python3-psycopg | Installation | ||||||
| sudo su - postgres | ------------ | ||||||
| # `createdb -O <LOCAL_USER> imported_git` |  | ||||||
|  |     sudo zypper in python3-psycopg | ||||||
|  |     sudo su - postgres | ||||||
|  |     createdb -O <LOCAL_USER> imported_git | ||||||
|  |  | ||||||
| To reset the database, drop table scheme | To reset the database, drop table scheme | ||||||
|  |  | ||||||
|  |  | ||||||
|  | Gitea parameters | ||||||
|  | ---------------- | ||||||
|  |  | ||||||
|  |   * `GITEA_HOST` - Gitea server host name. Default: src.opensuse.org | ||||||
|  |   * `GITEA_USER` - User name used to generate SSH links for push. Default: gitea | ||||||
|  |   * `GITEA_ORG`  - Target organization to push to. Default: rpm | ||||||
|  |   * `GITEA_DEFAULT_BRANCH` - Default branch of the created repository. Default: factory | ||||||
|  |  | ||||||
|   | |||||||
| @@ -42,8 +42,8 @@ PROJECTS = [ | |||||||
| ] | ] | ||||||
|  |  | ||||||
|  |  | ||||||
| def export_package(package, repodir, cachedir, gc): | def export_package(project, package, repodir, cachedir, gc): | ||||||
|     exporter = GitExporter(URL_OBS, "openSUSE:Factory", package, repodir, cachedir) |     exporter = GitExporter(URL_OBS, project, package, repodir, cachedir) | ||||||
|     exporter.set_gc_interval(gc) |     exporter.set_gc_interval(gc) | ||||||
|     exporter.export_as_git() |     exporter.export_as_git() | ||||||
|  |  | ||||||
| @@ -51,6 +51,12 @@ def export_package(package, repodir, cachedir, gc): | |||||||
| def main(): | def main(): | ||||||
|     parser = argparse.ArgumentParser(description="OBS history importer into git") |     parser = argparse.ArgumentParser(description="OBS history importer into git") | ||||||
|     parser.add_argument("packages", help="OBS package names", nargs="*") |     parser.add_argument("packages", help="OBS package names", nargs="*") | ||||||
|  |     parser.add_argument( | ||||||
|  |         "-p", | ||||||
|  |         "--project", | ||||||
|  |         default="openSUSE:Factory", | ||||||
|  |         help="Project to import/export, default is openSUSE:Factory", | ||||||
|  |     ) | ||||||
|     parser.add_argument( |     parser.add_argument( | ||||||
|         "-r", |         "-r", | ||||||
|         "--repodir", |         "--repodir", | ||||||
| @@ -110,10 +116,13 @@ def main(): | |||||||
|     if not args.cachedir: |     if not args.cachedir: | ||||||
|         args.cachedir = pathlib.Path("~/.cache/git-import/").expanduser() |         args.cachedir = pathlib.Path("~/.cache/git-import/").expanduser() | ||||||
|  |  | ||||||
|     importer = Importer(URL_OBS, "openSUSE:Factory", args.packages) |     importer = Importer(URL_OBS, args.project, args.packages) | ||||||
|     importer.import_into_db() |     importer.import_into_db() | ||||||
|     for package in args.packages: |     for package in args.packages: | ||||||
|         export_package(package, args.repodir, args.cachedir, args.gc) |         if not importer.package_with_scmsync(package): | ||||||
|  |             export_package(args.project, package, args.repodir, args.cachedir, args.gc) | ||||||
|  |         else: | ||||||
|  |             logging.debug(f"{args.project}/{package} has scmsync links - skipping export") | ||||||
|  |  | ||||||
|  |  | ||||||
| if __name__ == "__main__": | if __name__ == "__main__": | ||||||
|   | |||||||
							
								
								
									
										37
									
								
								lib/git.py
									
									
									
									
									
								
							
							
						
						
									
										37
									
								
								lib/git.py
									
									
									
									
									
								
							| @@ -48,6 +48,7 @@ class Git: | |||||||
|     def open(self): |     def open(self): | ||||||
|         if not self.exists(): |         if not self.exists(): | ||||||
|             self.git_run(["init", "--object-format=sha256", "-b", "factory"]) |             self.git_run(["init", "--object-format=sha256", "-b", "factory"]) | ||||||
|  |         self.git_run(["config", "lfs.allowincompletepush", "true"]) | ||||||
|  |  | ||||||
|     def is_dirty(self): |     def is_dirty(self): | ||||||
|         """Check if there is something to commit""" |         """Check if there is something to commit""" | ||||||
| @@ -85,7 +86,7 @@ class Git: | |||||||
|         """Checkout into the branch HEAD""" |         """Checkout into the branch HEAD""" | ||||||
|         new_branch = False |         new_branch = False | ||||||
|         if branch not in self.branches(): |         if branch not in self.branches(): | ||||||
|             self.git_run(["branch", "-q", branch, "HEAD"]) |             self.git_run(["switch", "-q", "--orphan", branch]) | ||||||
|             new_branch = True |             new_branch = True | ||||||
|         else: |         else: | ||||||
|             ref = f"refs/heads/{branch}" |             ref = f"refs/heads/{branch}" | ||||||
| @@ -180,7 +181,13 @@ class Git: | |||||||
|     #                logging.warning(f"Error removing file {path}: {e}") |     #                logging.warning(f"Error removing file {path}: {e}") | ||||||
|  |  | ||||||
|     def add(self, filename): |     def add(self, filename): | ||||||
|         self.git_run(["add", filename]) |         self.git_run(["add", ":(literal)" + str(filename)]) | ||||||
|  |  | ||||||
|  |     def add_default_gitignore(self): | ||||||
|  |         if not (self.path / ".gitignore").exists(): | ||||||
|  |             with (self.path / ".gitignore").open("w") as f: | ||||||
|  |                 f.write(".osc\n") | ||||||
|  |             self.add(".gitignore") | ||||||
|  |  | ||||||
|     def add_default_lfs_gitattributes(self, force=False): |     def add_default_lfs_gitattributes(self, force=False): | ||||||
|         if not (self.path / ".gitattributes").exists() or force: |         if not (self.path / ".gitattributes").exists() or force: | ||||||
| @@ -235,7 +242,7 @@ class Git: | |||||||
|  |  | ||||||
|     def remove(self, file: pathlib.Path): |     def remove(self, file: pathlib.Path): | ||||||
|         self.git_run( |         self.git_run( | ||||||
|             ["rm", "-q", "-f", "--ignore-unmatch", file.name], |             ["rm", "-q", "-f", "--ignore-unmatch", ":(literal)" + file.name], | ||||||
|         ) |         ) | ||||||
|         patterns = self.get_specific_lfs_gitattributes() |         patterns = self.get_specific_lfs_gitattributes() | ||||||
|         if file.name in patterns: |         if file.name in patterns: | ||||||
| @@ -245,15 +252,27 @@ class Git: | |||||||
|     def add_gitea_remote(self, package): |     def add_gitea_remote(self, package): | ||||||
|         repo_name = package.replace("+", "_") |         repo_name = package.replace("+", "_") | ||||||
|         org_name = "rpm" |         org_name = "rpm" | ||||||
|  |         gitea_user = "gitea" | ||||||
|  |         gitea_host = "src.opensuse.org" | ||||||
|  |         default_branch = "factory" | ||||||
|  |  | ||||||
|  |         if os.getenv("GITEA_HOST"): | ||||||
|  |             gitea_host = getenv("GITEA_HOST") | ||||||
|  |         if os.getenv("GITEA_USER"): | ||||||
|  |             gitea_user = getenv("GITEA_USER") | ||||||
|  |         if os.getenv("GITEA_ORG"): | ||||||
|  |             org_name = getenv("GITEA_ORG") | ||||||
|  |         if os.getenv("GITEA_DEFAULT_BRANCH"): | ||||||
|  |             default_branch = getenv("GITEA_DEFAULT_BRANCH") | ||||||
|  |  | ||||||
|         if not os.getenv("GITEA_TOKEN"): |         if not os.getenv("GITEA_TOKEN"): | ||||||
|             logging.warning("Not adding a remote due to missing $GITEA_TOKEN") |             logging.warning("Not adding a remote due to missing $GITEA_TOKEN") | ||||||
|             return |             return | ||||||
|  |  | ||||||
|         url = f"https://src.opensuse.org/api/v1/org/{org_name}/repos" |         url = f"https://{gitea_host}/api/v1/org/{org_name}/repos" | ||||||
|         response = requests.post( |         response = requests.post( | ||||||
|             url, |             url, | ||||||
|             data={"name": repo_name}, |             data={"name": repo_name, "object_format_name": "sha256", "default_branch": default_branch}, | ||||||
|             headers={"Authorization": f"token {os.getenv('GITEA_TOKEN')}"}, |             headers={"Authorization": f"token {os.getenv('GITEA_TOKEN')}"}, | ||||||
|             timeout=10, |             timeout=10, | ||||||
|         ) |         ) | ||||||
| @@ -261,7 +280,7 @@ class Git: | |||||||
|         # 201 Created |         # 201 Created | ||||||
|         if response.status_code not in (201, 409): |         if response.status_code not in (201, 409): | ||||||
|             print(response.data) |             print(response.data) | ||||||
|         url = f"gitea@src.opensuse.org:{org_name}/{repo_name}.git" |         url = f"{gitea_user}@{gitea_host}:{org_name}/{repo_name}.git" | ||||||
|         self.git_run( |         self.git_run( | ||||||
|             ["remote", "add", "origin", url], |             ["remote", "add", "origin", url], | ||||||
|         ) |         ) | ||||||
| @@ -271,13 +290,11 @@ class Git: | |||||||
|             ["remote"], |             ["remote"], | ||||||
|             stdout=subprocess.PIPE, |             stdout=subprocess.PIPE, | ||||||
|         ).stdout.decode("utf-8"): |         ).stdout.decode("utf-8"): | ||||||
|             logger.warning("Not pushing to remote because no 'origin' configured") |             logging.warning("Not pushing to remote because no 'origin' configured") | ||||||
|             return |             return | ||||||
|  |  | ||||||
|         cmd = ["push"] |         cmd = ["push"] | ||||||
|         if force: |         if force: | ||||||
|             cmd.append("-f") |             cmd.append("-f") | ||||||
|         cmd.append("origin") |         cmd += ["origin", "--all"] | ||||||
|         cmd.append("refs/heads/factory") |  | ||||||
|         cmd.append("refs/heads/devel") |  | ||||||
|         self.git_run(cmd) |         self.git_run(cmd) | ||||||
|   | |||||||
| @@ -29,7 +29,7 @@ class GitExporter: | |||||||
|             self.git.open() |             self.git.open() | ||||||
|         else: |         else: | ||||||
|             self.git.create() |             self.git.create() | ||||||
|             self.git.add_gitea_remote(package) |             # self.git.add_gitea_remote(package) | ||||||
|         self.state_file = os.path.join(self.git.path, ".git", "_flat_state.yaml") |         self.state_file = os.path.join(self.git.path, ".git", "_flat_state.yaml") | ||||||
|         self.gc_interval = 200 |         self.gc_interval = 200 | ||||||
|         self.cachedir = cachedir |         self.cachedir = cachedir | ||||||
| @@ -86,6 +86,11 @@ class GitExporter: | |||||||
|             logging.debug(f"Committing {flat}") |             logging.debug(f"Committing {flat}") | ||||||
|             self.commit_flat(flat, branch_state) |             self.commit_flat(flat, branch_state) | ||||||
|  |  | ||||||
|  |         # make sure that we create devel branch | ||||||
|  |         if not branch_state["devel"]: | ||||||
|  |             logging.debug("force creating devel") | ||||||
|  |             self.git.set_branch_head("devel", self.git.branch_head("factory")) | ||||||
|  |  | ||||||
|         self.git.push(force=True) |         self.git.push(force=True) | ||||||
|  |  | ||||||
|     def run_gc(self): |     def run_gc(self): | ||||||
| @@ -150,6 +155,7 @@ class GitExporter: | |||||||
|  |  | ||||||
|         # create file if not existant |         # create file if not existant | ||||||
|         self.git.add_default_lfs_gitattributes(force=False) |         self.git.add_default_lfs_gitattributes(force=False) | ||||||
|  |         self.git.add_default_gitignore() | ||||||
|  |  | ||||||
|         to_download, to_delete = flat.commit.calc_delta(branch_state[flat.branch]) |         to_download, to_delete = flat.commit.calc_delta(branch_state[flat.branch]) | ||||||
|         for file in to_delete: |         for file in to_delete: | ||||||
|   | |||||||
| @@ -26,13 +26,16 @@ class Importer: | |||||||
|         # Import multiple Factory packages into the database |         # Import multiple Factory packages into the database | ||||||
|         self.packages = packages |         self.packages = packages | ||||||
|         self.project = project |         self.project = project | ||||||
|  |         self.scmsync_cache = dict() | ||||||
|  |         self.packages_with_scmsync = set() | ||||||
|  |  | ||||||
|         self.db = DB() |         self.db = DB() | ||||||
|         self.obs = OBS(api_url) |         self.obs = OBS(api_url) | ||||||
|         assert project == "openSUSE:Factory" |         assert not self.has_scmsync(project) | ||||||
|         self.refreshed_packages = set() |         self.refreshed_packages = set() | ||||||
|         self.gone_packages_set = None |         self.gone_packages_set = None | ||||||
|  |  | ||||||
|  |  | ||||||
|     def import_request(self, number): |     def import_request(self, number): | ||||||
|         self.obs.request(number).import_into_db(self.db) |         self.obs.request(number).import_into_db(self.db) | ||||||
|  |  | ||||||
| @@ -213,6 +216,10 @@ class Importer: | |||||||
|             return |             return | ||||||
|         logging.debug(f"Refresh {project}/{package}") |         logging.debug(f"Refresh {project}/{package}") | ||||||
|         self.refreshed_packages.add(key) |         self.refreshed_packages.add(key) | ||||||
|  |         if self.has_scmsync(project) or self.has_scmsync(key): | ||||||
|  |             self.packages_with_scmsync.add(package) | ||||||
|  |             logging.debug(f"{project}/{package} already in Git - skipping") | ||||||
|  |             return | ||||||
|         self.update_db_package(project, package) |         self.update_db_package(project, package) | ||||||
|         self.fetch_all_linked_packages(project, package) |         self.fetch_all_linked_packages(project, package) | ||||||
|  |  | ||||||
| @@ -255,3 +262,18 @@ class Importer: | |||||||
|                 for line in f.readlines(): |                 for line in f.readlines(): | ||||||
|                     self.gone_packages_set.add(line.strip()) |                     self.gone_packages_set.add(line.strip()) | ||||||
|         return key in self.gone_packages_set |         return key in self.gone_packages_set | ||||||
|  |  | ||||||
|  |     def has_scmsync(self, key): | ||||||
|  |         if key in self.scmsync_cache: | ||||||
|  |             return self.scmsync_cache[key] | ||||||
|  |  | ||||||
|  |         root = self.obs._meta(key) | ||||||
|  |         scmsync_exists = False | ||||||
|  |         if root is not None: | ||||||
|  |             scmsync_exists = root.find('scmsync') is not None | ||||||
|  |         self.scmsync_cache[key] = scmsync_exists | ||||||
|  |         return scmsync_exists | ||||||
|  |  | ||||||
|  |     def package_with_scmsync(self, package): | ||||||
|  |         return package in self.packages_with_scmsync | ||||||
|  |  | ||||||
|   | |||||||
| @@ -83,6 +83,7 @@ class LFSOid: | |||||||
|             self.register() |             self.register() | ||||||
|  |  | ||||||
|     def check(self): |     def check(self): | ||||||
|  |         return True | ||||||
|         url = f"http://localhost:9999/check/{self.sha256}/{self.size}" |         url = f"http://localhost:9999/check/{self.sha256}/{self.size}" | ||||||
|         response = requests.get( |         response = requests.get( | ||||||
|             url, |             url, | ||||||
|   | |||||||
							
								
								
									
										10
									
								
								lib/obs.py
									
									
									
									
									
								
							
							
						
						
									
										10
									
								
								lib/obs.py
									
									
									
									
									
								
							| @@ -73,11 +73,11 @@ class OBS: | |||||||
|         logging.debug(f"GET {url}") |         logging.debug(f"GET {url}") | ||||||
|         return ET.parse(osc.core.http_GET(url)).getroot() |         return ET.parse(osc.core.http_GET(url)).getroot() | ||||||
|  |  | ||||||
|     def _meta(self, project, package, **params): |     def _meta(self, key, **params): | ||||||
|         try: |         try: | ||||||
|             root = self._xml(f"source/{project}/{package}/_meta", **params) |             root = self._xml(f"source/{key}/_meta", **params) | ||||||
|         except HTTPError: |         except HTTPError: | ||||||
|             logging.error(f"Package [{project}/{package} {params}] has no meta") |             logging.error(f"Project/Package [{key} {params}] has no meta") | ||||||
|             return None |             return None | ||||||
|         return root |         return root | ||||||
|  |  | ||||||
| @@ -118,13 +118,13 @@ class OBS: | |||||||
|         return root |         return root | ||||||
|  |  | ||||||
|     def exists(self, project, package): |     def exists(self, project, package): | ||||||
|         root = self._meta(project, package) |         root = self._meta(f"{project}/{package}") | ||||||
|         if root is None: |         if root is None: | ||||||
|             return False |             return False | ||||||
|         return root.get("project") == project |         return root.get("project") == project | ||||||
|  |  | ||||||
|     def devel_project(self, project, package): |     def devel_project(self, project, package): | ||||||
|         root = self._meta(project, package) |         root = self._meta(f"{project}/{package}") | ||||||
|         devel = root.find("devel") |         devel = root.find("devel") | ||||||
|         if devel is None: |         if devel is None: | ||||||
|             return None |             return None | ||||||
|   | |||||||
| @@ -2,36 +2,58 @@ | |||||||
| import json | import json | ||||||
| from pathlib import Path | from pathlib import Path | ||||||
| import pika | import pika | ||||||
| import sys | import random | ||||||
|  | import time | ||||||
|  |  | ||||||
| MY_TASKS_DIR = Path(__file__).parent / "tasks" | MY_TASKS_DIR = Path(__file__).parent / "tasks" | ||||||
|  |  | ||||||
| connection = pika.BlockingConnection(pika.URLParameters("amqps://opensuse:opensuse@rabbit.opensuse.org")) |  | ||||||
| channel = connection.channel() |  | ||||||
|  |  | ||||||
| channel.exchange_declare(exchange='pubsub', exchange_type='topic', passive=True, durable=True) | def listen_events(): | ||||||
|  |     connection = pika.BlockingConnection( | ||||||
|  |         pika.URLParameters("amqps://opensuse:opensuse@rabbit.opensuse.org") | ||||||
|  |     ) | ||||||
|  |     channel = connection.channel() | ||||||
|  |  | ||||||
| result = channel.queue_declare("", exclusive=True) |     channel.exchange_declare( | ||||||
| queue_name = result.method.queue |         exchange="pubsub", exchange_type="topic", passive=True, durable=False | ||||||
|  |     ) | ||||||
|  |  | ||||||
| channel.queue_bind(exchange='pubsub', |     result = channel.queue_declare("", exclusive=True) | ||||||
|                    queue=queue_name,routing_key='#') |     queue_name = result.method.queue | ||||||
|  |  | ||||||
| print(' [*] Waiting for logs. To exit press CTRL+C') |     channel.queue_bind( | ||||||
|  |         exchange="pubsub", queue=queue_name, routing_key="opensuse.obs.package.commit" | ||||||
|  |     ) | ||||||
|  |  | ||||||
| def callback(ch, method, properties, body): |     print(" [*] Waiting for logs. To exit press CTRL+C") | ||||||
|  |  | ||||||
|  |     def callback(ch, method, properties, body): | ||||||
|         if method.routing_key not in ("opensuse.obs.package.commit",): |         if method.routing_key not in ("opensuse.obs.package.commit",): | ||||||
|             return |             return | ||||||
|         body = json.loads(body) |         body = json.loads(body) | ||||||
|     if 'project' in body and 'package' in body and body['project'] == 'openSUSE:Factory': |         if ( | ||||||
|         if '/' in body['package']: |             "project" in body | ||||||
|  |             and "package" in body | ||||||
|  |             and body["project"] == "openSUSE:Factory" | ||||||
|  |         ): | ||||||
|  |             if "/" in body["package"]: | ||||||
|                 return |                 return | ||||||
|  |  | ||||||
|         (MY_TASKS_DIR / body['package']).touch() |             (MY_TASKS_DIR / body["package"]).touch() | ||||||
|         print(" [x] %r:%r" % (method.routing_key, body['package'])) |             print(" [x] %r:%r" % (method.routing_key, body["package"])) | ||||||
|  |  | ||||||
| channel.basic_consume(queue_name, |     channel.basic_consume(queue_name, callback, auto_ack=True) | ||||||
|                       callback, |  | ||||||
|                       auto_ack=True) |  | ||||||
|  |  | ||||||
| channel.start_consuming() |     channel.start_consuming() | ||||||
|  |  | ||||||
|  |  | ||||||
|  | def main(): | ||||||
|  |     while True: | ||||||
|  |         try: | ||||||
|  |             listen_events() | ||||||
|  |         except (pika.exceptions.ConnectionClosed, pika.exceptions.AMQPHeartbeatTimeout): | ||||||
|  |             time.sleep(random.randint(10, 100)) | ||||||
|  |  | ||||||
|  |  | ||||||
|  | if __name__ == "__main__": | ||||||
|  |     main() | ||||||
|   | |||||||
							
								
								
									
										19
									
								
								update-tasks.sh
									
									
									
									
									
										Executable file
									
								
							
							
						
						
									
										19
									
								
								update-tasks.sh
									
									
									
									
									
										Executable file
									
								
							| @@ -0,0 +1,19 @@ | |||||||
|  | #!/bin/bash | ||||||
|  | # | ||||||
|  | cd /space/dmueller/git-importer | ||||||
|  |  | ||||||
|  | source credentials.sh | ||||||
|  |  | ||||||
|  | while true; do | ||||||
|  |    for i in $PWD/tasks/*; do | ||||||
|  |        if test -f "$i"; then | ||||||
|  |             echo "$(date): Importing $(basename $i)" | ||||||
|  |             if ! python3 ./git-importer.py -c repos/.cache $(basename $i); then | ||||||
|  |                 mkdir -p $PWD/failed-tasks | ||||||
|  |                 mv -f $i $PWD/failed-tasks | ||||||
|  |             fi | ||||||
|  |             rm -f $i | ||||||
|  |         fi | ||||||
|  |    done | ||||||
|  |    inotifywait -q -e create $PWD/tasks | ||||||
|  | done | ||||||
		Reference in New Issue
	
	Block a user