1 | # s3-bsync Copyright (c) 2022 Joshua Stockin |
2 | # <https://joshstock.in> |
3 | # <https://git.joshstock.in/s3-bsync> |
4 | # |
5 | # This software is licensed and distributed under the terms of the MIT License. |
6 | # See the MIT License in the LICENSE file of this project's root folder. |
7 | # |
8 | # This comment block and its contents, including this disclaimer, MUST be |
9 | # preserved in all copies or distributions of this software's source. |
10 |
|
11 | import os |
12 |
|
13 | import logging |
14 |
|
15 | import s3_bsync.classes |
16 |
|
# Module-level logger, named after this module via __name__.
logger = logging.getLogger(__name__)

# Public API for star imports: only the syncfile class is exported, so
# CorruptSyncfileException has to be imported by name.
__all__ = ["syncfile"]
20 |
|
21 |
|
# Marker bytes of the s3sync state-file format, looked up by name.
#
# Keys are plain strings: the deserializer indexes this table as
# CONTROL_BYTES["SIGNATURE"], and a list literal used as a dict key is
# unhashable (it raises TypeError as soon as the module is imported).
#
# SIGNATURE is the 4-byte magic compared against the first four bytes of the
# file; every other entry is a single byte.  Only SIGNATURE, METADATA_BEGIN,
# METADATA_END and BUCKET_BEGIN are referenced by the deserializer in this
# module; the remaining markers are declared here but not used yet.
CONTROL_BYTES = {
    "SIGNATURE": b"\x9D\x9F\x53\x33",
    "BUCKET_BEGIN": b"\x90",
    "BUCKET_END": b"\x91",
    "DIRECTORY_BEGIN": b"\x92",
    "DIRECTORY_END": b"\x93",
    "OBJECT_BEGIN": b"\x94",
    "OBJECT_END": b"\x95",
    "ETAG_MD5": b"\x96",
    "ETAG_OTHER": b"\x97",
    "METADATA_BEGIN": b"\x9A",
    "METADATA_END": b"\x9B",
}

# Highest state-file format version this module accepts (valid range starts
# at 1, per the deserializer's version check).
CURRENT_VERSION = 1
# Byte order passed to int.from_bytes when decoding integers from the file.
ENDIANNESS = "little"
38 |
|
39 |
|
class CorruptSyncfileException(Exception):
    """Signal that a supplied s3sync state file could not be deserialized.

    Raised by the syncfile class when the bytes it reads do not match the
    layout it expects.
    """
42 |
|
43 |
|
class syncfile:
    """Handle on an s3sync binary state file.

    Creating an instance opens the file at ``state_file`` for binary
    read/write; ``deserialize`` then parses it into the instance attributes.

    Layout consumed by ``deserialize``, as far as this code reads it: a
    4-byte signature, a 1-byte format version, a metadata block delimited by
    METADATA_BEGIN / METADATA_END that holds an 8-byte last-synced time, then
    zero or more records that each start with BUCKET_BEGIN followed by a
    NUL-terminated bucket name.
    """

    # Class-level defaults, kept so the attributes still exist on the class
    # itself; __init__ and deserialize overwrite them per instance.
    file_path = None
    file = None
    file_version = 0
    last_synced_time = 0
    tracked_buckets = {}

    def __init__(self, state_file: str):
        """Open the state file, creating it when it does not exist yet.

        Args:
            state_file: Path of the s3sync state file.

        Raises:
            OSError: If the file can be neither opened nor created.
        """
        self.file_path = state_file
        # Give each instance its own dict; the class-level default would
        # otherwise be shared (and mutated) across every syncfile object.
        self.tracked_buckets = {}
        # "wb+" truncates an existing file, which would wipe the very state
        # deserialize() is meant to read.  Open existing files with "rb+" and
        # fall back to "wb+" only to create a missing one.
        try:
            self.file = open(state_file, "rb+")
        except FileNotFoundError:
            self.file = open(state_file, "wb+")
        logger.debug(f"Opened s3sync state file at {state_file}")

    def close(self):
        """Close the underlying file handle if it is still open."""
        if self.file is not None and not self.file.closed:
            self.file.close()

    def __enter__(self):
        """Return the instance so it can be used in a ``with`` statement."""
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        """Close the file on leaving the ``with`` block; never swallow errors."""
        self.close()
        return False

    def deserialize(self):
        """Parse the opened state file into this instance's attributes.

        Sets ``file_version`` and ``last_synced_time`` from the file header
        and metadata block, then walks the bucket records that follow.

        Raises:
            CorruptSyncfileException: If the signature, version, a control
                byte or a string does not match the expected layout, or the
                file ends early.
        """
        f = self.file
        logger.debug(f"Deserializing file {f}")
        f.seek(0)

        def get_string():
            """Read bytes up to (and consuming) the next NUL; return them as str."""
            raw = bytearray()
            while (char := f.read(1)) != b"\x00":
                if not char:
                    # read() returns b"" forever at EOF; bail out instead of
                    # looping endlessly on a truncated file.
                    raise CorruptSyncfileException(
                        "Unexpected end of file while reading string (corrupt file)"
                    )
                raw += char
            try:
                # NOTE(review): the text encoding is not established by the
                # visible code; UTF-8 is assumed — confirm against the writer.
                return raw.decode("utf-8")
            except UnicodeDecodeError as err:
                raise CorruptSyncfileException(
                    "String is not valid UTF-8 (corrupt file)"
                ) from err

        # Bytes objects must be compared by value; `is` tests object identity
        # and is never true for freshly read data.
        if f.read(4) != CONTROL_BYTES["SIGNATURE"]:
            raise CorruptSyncfileException(
                "Inputted file signature bytes do not match expected s3state file signature (file corrupted or not an s3sync file format)"
            )

        # The version is one raw byte, not ASCII digits; an empty read at EOF
        # decodes to 0 and is rejected by the range check below.
        self.file_version = int.from_bytes(f.read(1), byteorder=ENDIANNESS)
        if not 1 <= self.file_version <= CURRENT_VERSION:
            raise CorruptSyncfileException(
                f"File version outside expected range (1..{CURRENT_VERSION}) (corrupt file)"
            )

        if f.read(1) != CONTROL_BYTES["METADATA_BEGIN"]:
            raise CorruptSyncfileException(
                "Expected metadata block begin byte not found (corrupt file)"
            )
        if self.file_version <= 1:
            timestamp = f.read(8)
            if len(timestamp) != 8:
                raise CorruptSyncfileException(
                    "Unexpected end of file inside metadata block (corrupt file)"
                )
            self.last_synced_time = int.from_bytes(timestamp, byteorder=ENDIANNESS)
            logger.debug(f"Last synced time reported as {self.last_synced_time}")

        if f.read(1) != CONTROL_BYTES["METADATA_END"]:
            raise CorruptSyncfileException(
                "Expected metadata block end byte not found (corrupt file)"
            )

        # Everything after the metadata block is a sequence of bucket records;
        # read(1) returns b"" at EOF, which ends the loop.
        while b := f.read(1):
            if b != CONTROL_BYTES["BUCKET_BEGIN"]:
                raise CorruptSyncfileException(
                    f"Unexpected control byte {b} detected (corrupt file)"
                )
            bucket_name = get_string()
            # The module is imported as `s3_bsync.classes`, so the bare name
            # `classes` is undefined here; use the fully qualified path.
            # NOTE(review): the bucket object is built but neither stored in
            # self.tracked_buckets nor populated, and no BUCKET_END /
            # directory / object records are consumed — parsing of the bucket
            # body appears unfinished; confirm against the serializer.
            bucket = s3_bsync.classes.bucket(bucket_name)
98 |
|