From 7a0b96e80587909786007c524516813ba0948695 Mon Sep 17 00:00:00 2001 From: cleontay Date: Tue, 30 May 2023 22:19:02 +0800 Subject: [PATCH] docx depreciated --- Application/lib/steganography/docx_steg.py | 155 --------------------- 1 file changed, 155 deletions(-) delete mode 100644 Application/lib/steganography/docx_steg.py diff --git a/Application/lib/steganography/docx_steg.py b/Application/lib/steganography/docx_steg.py deleted file mode 100644 index e2cda72..0000000 --- a/Application/lib/steganography/docx_steg.py +++ /dev/null @@ -1,155 +0,0 @@ -import numpy as np - -################################################## -# Duplicate of file_steg.py, to remove # -################################################## -class docx_steg: - def __init__(self, docx_file: str = "testfile.docx", bits_to_hide: list[int] = None) -> None: - """ - Initialize the class - :param docx_file: PathName of the docx file to encode or decode - :type docx_file: str - :param bits_to_hide: Bit to hide the data in (1 - LSB to 8 - MSB) - :type bits_to_hide: list[int] - """ - raise NotImplementedError("Duplicate of file_steg.py, to remove") - self.docx_file = docx_file - self.bits_to_hide = [8 - bit_pos for bit_pos in bits_to_hide] if bits_to_hide else [1] # Default is LSB - self.delimiter = "=====" # Delimiter to indicate the end of the secret data - - def encode(self, secret_data: str = "Hello World") -> bytes: - """ - Encode the secret data into the docx file - - :param secret_data: String of data to hide - - :return: Encoded docx file as bytes - :rtype: bytes - """ - - with open(self.docx_file, "rb") as f: - data = f.read() - - # Max Bytes to encode - n_bytes = len(data) // 8 - - # Check if secret data can be encoded into docx file - # print(f"Secret data length: {len(secret_data)}, Max data length: {n_bytes}") - if len(secret_data) > n_bytes: - raise ValueError( - f"[-] Error: Binary Secret data length {len(secret_data)} is greater than data length {n_bytes}") - - # Convert secret data to binary - binary_secret_data = self.to_bin(secret_data) - - # Add delimiter - binary_secret_data += self.to_bin(self.delimiter) - - data_index = 0 - encoded_data = bytearray() - - print(f"[+] Starting encoding...") - # Encode data into docx - for byte in data: - if data_index >= len(binary_secret_data): - encoded_data.append(byte) - else: - for bit_pos in self.bits_to_hide: - if data_index < len(binary_secret_data): - byte = list(format(byte, "08b")) - byte = list(byte) - byte[bit_pos] = binary_secret_data[data_index] - data_index += 1 - # Convert byte back to int - byte = int("".join(byte), 2) - encoded_data.append(byte) - - print(f"[+] Encoding completed successfully.") - return bytes(encoded_data) - - def decode(self) -> str: - """ - Decode the secret data from the docx file - :return: Decoded secret data - :rtype: str - """ - with open(self.docx_file, "rb") as f: - data = f.read() - - binary_data = "" - print(f"[+] Starting decoding...") - for byte in data: - # Add byte to binary data - # Convert byte from int to binary string - byte = format(byte, "08b") - # Pad byte with 0's to make sure it has 8 bits - byte = "0" * (8 - len(byte)) + byte - for bit_pos in self.bits_to_hide: - binary_data += byte[bit_pos] - - all_bytes = [binary_data[i: i + 8] for i in range(0, len(binary_data), 8)] - - decoded_data = "" - for byte in all_bytes: - decoded_data += chr(int(byte, 2)) - if decoded_data[-len(self.delimiter):] == self.delimiter: - break - - print(f"[+] Decoding completed successfully.") - # Return the decoded data - return decoded_data[:-len(self.delimiter)] - - def to_bin(self, data: str) -> str | list[str]: - """ - Convert text file data to binary format as string - :param data: String - :type data: str - :return: Binary Data: String | List[String] - """ - - if isinstance(data, str): - return ''.join([format(ord(i), "08b") for i in data]) - elif isinstance(data, bytes) or isinstance(data, np.ndarray): - return [format(i, "08b") for i in data] - elif isinstance(data, int) or isinstance(data, np.unit8): - return format(data, "08b") - else: - raise TypeError("Type not supported") - - def from_bin(self, data: str) -> str: - """ - Convert binary `data` back to the original format - :param data: String - :type data: str - :return: Original Data: String - """ - - return ''.join([chr(int(data[i:i + 8], 2)) for i in range(0, len(data), 8)]) - - -if __name__ == "__main__": - with open("secret_data.txt", "r") as f: - secret_data = f.read() - - bits_to_hide = np.random.choice(range(1, 9), np.random.randint(1, 9), replace=False) - bits_to_hide = list(bits_to_hide) - bits_to_hide.sort() - # bits_to_hide = [1] - print(f"Bits to hide: {bits_to_hide}") - - docx_file = "testfile.docx" - output_encoded_docx = "encoded_document.docx" - - - # Encode data, get as bytes - encoded_data = docx_steg(docx_file=docx_file, bits_to_hide=bits_to_hide).encode(secret_data=secret_data) - - # Write encoded data to file - with open(output_encoded_docx, "wb") as f: - f.write(encoded_data) - - # Decode data from encoded docx file - decoded_data = docx_steg(docx_file=output_encoded_docx, bits_to_hide=bits_to_hide).decode() - - # Print the decoded data - print("[+] Decoded data:", decoded_data)