2023-02-03 20:28:55 +00:00
|
|
|
import subprocess
|
2023-02-08 16:28:05 +00:00
|
|
|
import json
|
2023-04-03 16:29:06 +00:00
|
|
|
import datetime
|
2023-02-03 20:28:55 +00:00
|
|
|
|
2023-02-13 11:16:35 +00:00
|
|
|
from typing import List
|
2023-04-14 11:58:39 +00:00
|
|
|
from collections.abc import Iterable
|
2023-06-07 15:55:38 +00:00
|
|
|
from json.decoder import JSONDecodeError
|
2023-02-13 11:16:35 +00:00
|
|
|
|
2023-06-16 15:48:58 +00:00
|
|
|
from selfprivacy_api.backup.backuppers import AbstractBackuper
|
2023-02-13 11:16:35 +00:00
|
|
|
from selfprivacy_api.models.backup.snapshot import Snapshot
|
2023-05-17 20:09:29 +00:00
|
|
|
from selfprivacy_api.backup.jobs import get_backup_job
|
|
|
|
from selfprivacy_api.services import get_service_by_id
|
|
|
|
from selfprivacy_api.jobs import Jobs, JobStatus
|
2023-01-23 13:43:18 +00:00
|
|
|
|
2023-02-17 15:55:19 +00:00
|
|
|
from selfprivacy_api.backup.local_secret import LocalBackupSecret
|
|
|
|
|
2023-01-23 13:43:18 +00:00
|
|
|
|
|
|
|
class ResticBackuper(AbstractBackuper):
    """Backuper that shells out to the ``restic`` CLI.

    The repository is addressed as ``rclone:<type><repo>`` and restic is told
    (via ``-o rclone.args=...``) how to launch rclone, so the storage
    credentials are passed to rclone as command-line flags.
    """

    def __init__(self, login_flag: str, key_flag: str, type: str):
        """Remember the rclone flag names and the rclone backend prefix.

        login_flag: rclone flag that precedes the account value.
        key_flag: rclone flag that precedes the key value.
        type: prefix placed between ``rclone:`` and the repo name.
        """
        self.login_flag = login_flag
        self.key_flag = key_flag
        self.type = type
        # Credentials stay empty until set_creds() is called.
        self.account = ""
        self.key = ""
        self.repo = ""

    def set_creds(self, account: str, key: str, repo: str):
        """Store the account, key and repository name used for later commands."""
        self.account = account
        self.key = key
        self.repo = repo

    def restic_repo(self) -> str:
        """Return the value passed to restic's ``-r`` option."""
        # https://restic.readthedocs.io/en/latest/030_preparing_a_new_repo.html#other-services-via-rclone
        # https://forum.rclone.org/t/can-rclone-be-run-solely-with-command-line-options-no-config-no-env-vars/6314/5
        return f"rclone:{self.type}{self.repo}"

    def rclone_args(self):
        """Return the ``rclone.args=...`` value passed to restic's ``-o`` option."""
        base = "rclone.args=serve restic --stdio"
        backend_args = self.backend_rclone_args().strip()
        if not backend_args:
            return base
        # The separator matters: without it the first backend flag is glued
        # onto "--stdio" and rclone sees one malformed argument.
        return f"{base} {backend_args}"

    def backend_rclone_args(self) -> str:
        """Return the account/key flags for rclone as one string.

        A flag is emitted only when the corresponding credential is non-empty.
        The two parts are always joined by a single space, so the result may
        carry leading or trailing whitespace.
        """
        acc_arg = f"{self.login_flag} {self.account}" if self.account != "" else ""
        key_arg = f"{self.key_flag} {self.key}" if self.key != "" else ""
        return f"{acc_arg} {key_arg}"

    def _password_command(self):
        """Return the command string handed to restic's ``--password-command``."""
        # NOTE(review): the secret is embedded in the argument list of the
        # restic process built by restic_command(); consider whether a
        # password file or environment variable would be safer.
        return f"echo {LocalBackupSecret.get()}"

    def restic_command(self, *args, tag: str = ""):
        """Build the argv list for a restic invocation.

        args: subcommand and its arguments; nested iterables are flattened,
            strings are kept whole.
        tag: when non-empty, ``--tag <tag>`` is added before ``args``.
        """
        command = [
            "restic",
            "-o",
            self.rclone_args(),
            "-r",
            self.restic_repo(),
            "--password-command",
            self._password_command(),
        ]
        if tag != "":
            command.extend(["--tag", tag])
        if args:
            command.extend(ResticBackuper.__flatten_list(args))
        return command

    @staticmethod
    def __flatten_list(list):
        """string-aware list flattener"""
        result = []
        for item in list:
            # Strings are iterable too, but must stay single arguments.
            if isinstance(item, Iterable) and not isinstance(item, str):
                result.extend(ResticBackuper.__flatten_list(item))
                continue
            result.append(item)
        return result

    @staticmethod
    def output_yielder(command):
        """Run ``command`` and yield its output line by line.

        stderr is merged into stdout. Lines containing ``NOTICE:`` are
        dropped.
        """
        with subprocess.Popen(
            command,
            shell=False,
            stdout=subprocess.PIPE,
            stderr=subprocess.STDOUT,
            universal_newlines=True,
        ) as handle:
            for line in iter(handle.stdout.readline, ""):
                if "NOTICE:" not in line:
                    yield line

    def start_backup(self, folders: List[str], tag: str):
        """
        Start backup with restic

        folders: paths to back up; must not be a bare string.
        tag: restic tag for the snapshot; it is also used as the service id
            to look up the backup job and as the snapshot's service name.

        Returns the Snapshot built from restic's summary message.
        Raises ValueError if the output cannot be parsed or has no summary.
        """
        # but maybe it is ok to accept a union of a string and an array of strings
        assert not isinstance(folders, str)

        backup_command = self.restic_command(
            "backup",
            "--json",
            folders,
            tag=tag,
        )

        messages = []
        job = get_backup_job(get_service_by_id(tag))
        try:
            for raw_message in ResticBackuper.output_yielder(backup_command):
                message = self.parse_message(raw_message, job)
                messages.append(message)
            return ResticBackuper._snapshot_from_backup_messages(messages, tag)
        except ValueError as e:
            raise ValueError("could not create a snapshot: ", messages) from e

    @staticmethod
    def _snapshot_from_backup_messages(messages, repo_name) -> Snapshot:
        """Build a Snapshot from the first ``summary`` message.

        Raises ValueError if no message has ``message_type == "summary"``.
        """
        for message in messages:
            if message["message_type"] == "summary":
                return ResticBackuper._snapshot_from_fresh_summary(message, repo_name)
        raise ValueError("no summary message in restic json output")

    def parse_message(self, raw_message, job=None) -> object:
        """Parse one line of restic JSON output and report progress.

        For ``status`` messages, the given job (if any) is updated to RUNNING
        with the current progress. Returns the parsed message.
        Raises ValueError if ``raw_message`` contains no JSON.
        """
        message = ResticBackuper.parse_json_output(raw_message)
        if message["message_type"] == "status":
            if job is not None:  # only update status if we run under some job
                Jobs.update(
                    job,
                    JobStatus.RUNNING,
                    # restic reports percent_done as a 0..1 fraction, so a
                    # bare int() would stay at 0 until the very end.
                    # Presumably the job progress is a 0-100 percentage;
                    # verify against Jobs.update.
                    progress=int(message["percent_done"] * 100),
                )
        return message

    @staticmethod
    def _snapshot_from_fresh_summary(message: object, repo_name) -> Snapshot:
        """Build a Snapshot from a summary message, stamped with the current UTC time."""
        return Snapshot(
            id=message["snapshot_id"],
            created_at=datetime.datetime.now(datetime.timezone.utc),
            service_name=repo_name,
        )

    def init(self):
        """Run ``restic init``.

        Raises ValueError if the output lacks "created restic repository".
        """
        init_command = self.restic_command(
            "init",
        )
        with subprocess.Popen(
            init_command,
            shell=False,
            stdout=subprocess.PIPE,
            stderr=subprocess.STDOUT,
        ) as process_handle:
            output = process_handle.communicate()[0].decode("utf-8")
            if "created restic repository" not in output:
                raise ValueError("cannot init a repo: " + output)

    def is_initted(self) -> bool:
        """Return True if ``restic check --json`` prints anything that looks like JSON."""
        command = self.restic_command(
            "check",
            "--json",
        )

        with subprocess.Popen(command, stdout=subprocess.PIPE, shell=False) as handle:
            output = handle.communicate()[0].decode("utf-8")
            return ResticBackuper.has_json(output)

    def restored_size(self, snapshot_id: str) -> int:
        """
        Size of a snapshot

        Returns the ``total_size`` field of ``restic stats <snapshot_id> --json``.
        Raises ValueError if the output contains no parseable JSON.
        """
        command = self.restic_command(
            "stats",
            snapshot_id,
            "--json",
        )

        with subprocess.Popen(
            command,
            stdout=subprocess.PIPE,
            shell=False,
        ) as handle:
            output = handle.communicate()[0].decode("utf-8")
            try:
                parsed_output = ResticBackuper.parse_json_output(output)
                return parsed_output["total_size"]
            except ValueError as e:
                raise ValueError("cannot get the size of a snapshot: " + output) from e

    def restore_from_backup(self, snapshot_id, folders):
        """
        Restore from backup with restic

        The snapshot is restored with ``--target /``. ``folders`` is currently
        unused. Raises ValueError if the output lacks the word "restoring".
        """
        # snapshots save the path of the folder in the file system
        # I do not alter the signature yet because maybe this can be
        # changed with flags
        restore_command = self.restic_command(
            "restore",
            snapshot_id,
            "--target",
            "/",
        )

        with subprocess.Popen(
            restore_command, stdout=subprocess.PIPE, shell=False
        ) as handle:

            # for some reason restore does not support nice reporting of progress via json
            output = handle.communicate()[0].decode("utf-8")
            if "restoring" not in output:
                raise ValueError("cannot restore a snapshot: " + output)

    def _load_snapshots(self) -> object:
        """
        Load list of snapshots from repository

        Returns the parsed output of ``restic snapshots --json``.
        Raises ValueError if the repo does not exist or the output has no
        parseable JSON.
        """
        listing_command = self.restic_command(
            "snapshots",
            "--json",
        )

        with subprocess.Popen(
            listing_command,
            shell=False,
            stdout=subprocess.PIPE,
            stderr=subprocess.STDOUT,
        ) as backup_listing_process_descriptor:
            output = backup_listing_process_descriptor.communicate()[0].decode("utf-8")

        if "Is there a repository at the following location?" in output:
            raise ValueError("No repository! : " + output)
        try:
            return ResticBackuper.parse_json_output(output)
        except ValueError as e:
            # Include the raw output so the failure can be diagnosed.
            raise ValueError("Cannot load snapshots: " + output) from e

    def get_snapshots(self) -> List[Snapshot]:
        """Get all snapshots from the repo"""
        return [
            Snapshot(
                id=restic_snapshot["short_id"],
                created_at=restic_snapshot["time"],
                # The first tag is used as the service name.
                service_name=restic_snapshot["tags"][0],
            )
            for restic_snapshot in self._load_snapshots()
        ]

    @staticmethod
    def parse_json_output(output: str) -> object:
        """Parse the JSON part of restic output.

        Everything before the first ``[`` or ``{`` is discarded. If the rest
        is a single line it is parsed as one JSON document; otherwise each
        line is parsed separately and a list of the results is returned.

        Raises ValueError if there is no JSON or it cannot be decoded.
        """
        starting_index = ResticBackuper.json_start(output)
        if starting_index == -1:
            raise ValueError("There is no json in the restic output : " + output)

        truncated_output = output[starting_index:]
        json_messages = truncated_output.splitlines()
        try:
            if len(json_messages) == 1:
                return json.loads(truncated_output)
            return [json.loads(message) for message in json_messages]
        except JSONDecodeError as e:
            raise ValueError(
                "There is no json in the restic output : " + output
            ) from e

    @staticmethod
    def json_start(output: str) -> int:
        """Return the index of the first ``[`` or ``{`` in ``output``, or -1 if neither occurs."""
        indices = [
            index for index in (output.find("["), output.find("{")) if index != -1
        ]
        return min(indices, default=-1)

    @staticmethod
    def has_json(output: str) -> bool:
        """Return True if ``output`` contains a ``[`` or ``{``."""
        return ResticBackuper.json_start(output) != -1
|