194 lines
6.4 KiB
Python
194 lines
6.4 KiB
Python
import wave
|
|
import numpy as np
|
|
|
|
|
|
class wav_steg:
|
|
|
|
def __init__(self, wav_file: str = "sample.wav", bits_to_hide: list[int] = None) -> None:
|
|
"""
|
|
Initialize the class
|
|
:param wav_file: PathName of the wav file to encode or decode
|
|
:type wav_file: str
|
|
:param bits_to_hide: Bit to hide the data in (1 - LSB to 8 - MSB)
|
|
:type bits_to_hide: list[int]
|
|
"""
|
|
self.wav_file = wav_file
|
|
self.bits_to_hide = [
|
|
8 - bit_pos for bit_pos in bits_to_hide] if bits_to_hide else [7] # Default is LSB (index = 7)
|
|
self.delimiter = "=====" # Delimiter to indicate the end of the secret data
|
|
print(self.bits_to_hide)
|
|
|
|
def encode(self, secret_data: str = "Hello World") -> dict:
|
|
"""
|
|
Encode the secret data into the wav file
|
|
|
|
:param secret_data: String of data to hide
|
|
|
|
:return: Encoded wav file parameters
|
|
:rtype: dict
|
|
"""
|
|
|
|
# Read wav file
|
|
try:
|
|
wav_file = wave.open(self.wav_file, 'rb')
|
|
except:
|
|
raise FileNotFoundError("File not found")
|
|
|
|
# Get the audio file's parameters
|
|
num_channels = wav_file.getnchannels()
|
|
sample_width = wav_file.getsampwidth()
|
|
frame_rate = wav_file.getframerate()
|
|
num_frames = wav_file.getnframes()
|
|
|
|
# Read all the audio frames
|
|
data = wav_file.readframes(num_frames)
|
|
|
|
#Add delimiter
|
|
secret_data+=self.delimiter
|
|
|
|
# Max Bits to encode
|
|
n_bits = (len(data) // 8) * len(self.bits_to_hide)
|
|
|
|
# Check if secret data can be encoded into wav file
|
|
# print(f"Secret data length: {len(secret_data)}, Max data length: {n_bytes}")
|
|
if len(secret_data)*8 > n_bits:
|
|
raise ValueError(
|
|
f"[-] Error: Binary Secret data length {len(secret_data)*8} is greater than data length {n_bits}")
|
|
|
|
# Convert secret data to binary
|
|
binary_secret_data = self.to_bin(secret_data)
|
|
|
|
data_index = 0
|
|
encoded_data = bytearray()
|
|
|
|
print(f"[+] Starting encoding...")
|
|
# Encode data into wav
|
|
for byte in data:
|
|
if data_index >= len(binary_secret_data):
|
|
encoded_data.append(byte)
|
|
else:
|
|
for bit_pos in self.bits_to_hide:
|
|
if data_index < len(binary_secret_data):
|
|
byte = list(format(byte, "08b"))
|
|
byte = list(byte)
|
|
byte[bit_pos] = binary_secret_data[data_index]
|
|
data_index += 1
|
|
# Convert byte back to int
|
|
byte = int("".join(byte), 2)
|
|
encoded_data.append(byte)
|
|
|
|
print(f"[+] Encoding completed successfully.")
|
|
|
|
new_wav_dict = {
|
|
"num_channels": num_channels,
|
|
"sample_width": sample_width,
|
|
"frame_rate": frame_rate,
|
|
"num_frames": bytes(encoded_data)
|
|
}
|
|
return new_wav_dict
|
|
|
|
def decode(self) -> str:
|
|
"""
|
|
Decode the secret data from the wav file
|
|
:return: Decoded secret data
|
|
:rtype: str
|
|
"""
|
|
# Read wav file
|
|
try:
|
|
modified_wav_file = wave.open(self.wav_file, 'rb')
|
|
except:
|
|
raise FileNotFoundError("File not found")
|
|
|
|
# Get the audio parameters
|
|
num_frames = modified_wav_file.getnframes()
|
|
|
|
# Read the audio samples
|
|
data = modified_wav_file.readframes(num_frames)
|
|
|
|
binary_data = ""
|
|
print(f"[+] Starting decoding...")
|
|
for byte in data:
|
|
# Add byte to binary data
|
|
# Convert byte from int to binary string
|
|
byte = format(byte, "08b")
|
|
# Pad byte with 0's to make sure it has 8 bits
|
|
byte = "0" * (8 - len(byte)) + byte
|
|
for bit_pos in self.bits_to_hide:
|
|
binary_data += byte[bit_pos]
|
|
|
|
all_bytes = [binary_data[i: i + 8]
|
|
for i in range(0, len(binary_data), 8)]
|
|
|
|
decoded_data = ""
|
|
for byte in all_bytes:
|
|
decoded_data += chr(int(byte, 2))
|
|
if decoded_data[-len(self.delimiter):] == self.delimiter:
|
|
break
|
|
|
|
print(f"[+] Decoding completed successfully.")
|
|
# Return the decoded data
|
|
return decoded_data[:-len(self.delimiter)]
|
|
|
|
def to_bin(self, data: str) -> str | list[str]:
|
|
"""
|
|
Convert text file data to binary format as string
|
|
:param data: String
|
|
:type data: str
|
|
:return: Binary Data: String | List[String]
|
|
"""
|
|
|
|
if isinstance(data, str):
|
|
return ''.join([format(ord(i), "08b") for i in data])
|
|
elif isinstance(data, bytes) or isinstance(data, np.ndarray):
|
|
return [format(i, "08b") for i in data]
|
|
elif isinstance(data, int) or isinstance(data, np.unit8):
|
|
return format(data, "08b")
|
|
else:
|
|
raise TypeError("Type not supported")
|
|
|
|
def from_bin(self, data: str) -> str:
|
|
"""
|
|
Convert binary `data` back to the original format
|
|
:param data: String
|
|
:type data: str
|
|
:return: Original Data: String
|
|
"""
|
|
|
|
return ''.join([chr(int(data[i:i + 8], 2)) for i in range(0, len(data), 8)])
|
|
|
|
|
|
if __name__ == "__main__":
|
|
wav_file = "sample.wav"
|
|
output_file_wav = "encoded.wav"
|
|
secret_txt = "payload.txt"
|
|
|
|
with open(secret_txt, "r") as f:
|
|
secret_data = f.read()
|
|
|
|
bits_to_hide = np.random.choice(
|
|
range(1, 9), np.random.randint(1, 9), replace=False)
|
|
bits_to_hide = list(bits_to_hide)
|
|
bits_to_hide.sort()
|
|
bits_to_hide = [1, 2, 3, 4, 5]
|
|
print(f"Bits to hide: {bits_to_hide}")
|
|
|
|
# Encode data, get as bytes
|
|
encoded_data = wav_steg(wav_file=wav_file, bits_to_hide=bits_to_hide).encode(
|
|
secret_data=secret_data)
|
|
|
|
# Write encoded data to file
|
|
new_wav_file = wave.open(output_file_wav, "wb")
|
|
new_wav_file.setnchannels(encoded_data["num_channels"])
|
|
new_wav_file.setsampwidth(encoded_data["sample_width"])
|
|
new_wav_file.setframerate(encoded_data["frame_rate"])
|
|
new_wav_file.writeframes(encoded_data["num_frames"])
|
|
# Close the New WAV file
|
|
new_wav_file.close()
|
|
|
|
# Decode data from wav file
|
|
decoded_data = wav_steg(wav_file=output_file_wav,
|
|
bits_to_hide=bits_to_hide).decode()
|
|
|
|
# Print the decoded data
|
|
# print("[+] Decoded data:", decoded_data)
|