main.py 6.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298
import argparse
import os
import os.path
import queue
import shlex
import sys
import tempfile
import threading
import time

import cv2
import requests
from Crypto.Hash import BLAKE2b
from loguru import logger

try:
    import rdrand
except ImportError:
    logger.warning("RdRand is not available.")
  17. class TemporaryFile:
  18. def __init__(self, name, io, delete):
  19. self.name = name
  20. self.__io = io
  21. self.__delete = delete
  22. def __getattr__(self, k):
  23. return getattr(self.__io, k)
  24. def __del__(self):
  25. if self.__delete:
  26. try:
  27. os.unlink(self.name)
  28. except FileNotFoundError:
  29. pass
  30. def NamedTemporaryFile(
  31. mode="w+b", bufsize=-1, suffix="", prefix="tmp", dir=None, delete=True
  32. ):
  33. if not dir:
  34. dir = tempfile.gettempdir()
  35. name = os.path.join(dir, prefix + os.urandom(32).hex() + suffix)
  36. if mode is None:
  37. return TemporaryFile(name, None, delete)
  38. fh = open(name, "w+b", bufsize)
  39. if mode != "w+b":
  40. fh.close()
  41. fh = open(name, mode)
  42. return TemporaryFile(name, fh, delete)
  43. def chunks(lst, n):
  44. for i in range(0, len(lst), n):
  45. yield lst[i : i + n]
  46. def run_check(cmd):
  47. logger.info(f"Executing '{cmd}'.")
  48. if os.system(cmd) != 0:
  49. raise ValueError("Exit code != 0.")
  50. def extract_image(path):
  51. logger.info(f"Extract image '{path}'.")
  52. im = cv2.imread(path)
  53. data = []
  54. rows, cols, _ = im.shape
  55. for i in range(rows):
  56. for j in range(cols):
  57. r, g, b = im[i, j]
  58. data.append(((r << 16) + (g << 8) + b) & 255)
  59. return bytes(data)
  60. def extract_wav(path):
  61. logger.info(f"Extract audio: '{path}'.")
  62. data = []
  63. with open(path, "rb") as f:
  64. for sample in chunks(f.read()[44:], 2):
  65. data.append(sample[0])
  66. return bytes(data)
  67. def extract_video(path):
  68. logger.info(f"Extract video: '{path}'.")
  69. with tempfile.TemporaryDirectory() as tmpd:
  70. run_check(
  71. f"ffmpeg -hide_banner -loglevel error -y -i {path} -vf mpdecimate -r 1/1 {tmpd}/%d.bmp"
  72. )
  73. data = b""
  74. for filename in os.listdir(tmpd):
  75. data += extract_image(os.path.join(tmpd, filename))
  76. return data
  77. def extract_lsbs(data):
  78. logger.info("Extract LSBs.")
  79. buffer = []
  80. if len(data) % 2 != 0:
  81. data = data[:-1]
  82. for chunk in chunks(data, 2):
  83. tmp_byte = 0
  84. for byte in chunk:
  85. for n in range(4):
  86. tmp_byte = (tmp_byte << 1) | ((byte >> n) & 1)
  87. buffer.append(tmp_byte & 255)
  88. return bytes(buffer)
  89. def whiten(data):
  90. logger.info("Whitening.")
  91. buffer = b""
  92. for chunk in chunks(data, 128):
  93. buffer += BLAKE2b.new(data=chunk, digest_bits=256).digest()
  94. return buffer
  95. def read_video(source, duration=60):
  96. tmpf = NamedTemporaryFile(suffix=".mkv", mode=None)
  97. run_check(
  98. f"ffmpeg -hide_banner -loglevel error -y -i {source} -t {duration} -acodec copy -vcodec copy {tmpf.name}"
  99. )
  100. return extract_video(tmpf.name)
  101. def read_audio(source, duration=60):
  102. tmpf = NamedTemporaryFile(suffix=".wav", mode=None)
  103. run_check(
  104. f"ffmpeg -f alsa -i {source} -t {duration} -ar 48000 -f s16le -acodec pcm_s16le {tmpf.name}"
  105. )
  106. return extract_wav(tmpf.name)
  107. def read_audio_video(source, duration=60):
  108. tmpf = NamedTemporaryFile(suffix=".mkv", mode=None)
  109. run_check(
  110. f"ffmpeg -hide_banner -loglevel error -y -i {source} -t {duration} -acodec copy -vcodec copy {tmpf.name}"
  111. )
  112. data_a = extract_video(tmpf.name)
  113. tmpf2 = NamedTemporaryFile(suffix=".wav", mode=None)
  114. run_check(
  115. f"ffmpeg -hide_banner -loglevel error -y -i {tmpf.name} -vn -ar 48000 -f s16le -acodec pcm_s16le {tmpf2.name}"
  116. )
  117. data_b = extract_wav(tmpf2.name)
  118. return bytes(a ^ b for a, b in zip(data_a, data_b))
  119. def read_rdseed(_, amount=16):
  120. data = rdrand.rdseed_get_bytes(amount)
  121. if len(data) != amount or data.count(0) == amount:
  122. raise ValueError("bad data")
  123. return data
  124. def sample(source, source_type, multiplier=1):
  125. match source_type:
  126. case "video":
  127. sampler = read_video
  128. multiplier *= 60
  129. case "audio":
  130. sampler = read_audio
  131. multiplier *= 60
  132. case "video+audio":
  133. sampler = read_audio_video
  134. multiplier *= 60
  135. case "rdseed":
  136. sampler = read_rdseed
  137. case _:
  138. raise ValueError(source_type)
  139. multiplier = int(multiplier)
  140. if multiplier < 1:
  141. raise ValueError(multiplier)
  142. logger.info("Sampling...")
  143. data = sampler(source, multiplier)
  144. logger.info(f"Sample ready: {len(data)}b.")
  145. if source_type != "rdseed":
  146. data = extract_lsbs(data)
  147. data = whiten(data)
  148. return data
  149. def push(pool_url, data, secret):
  150. logger.info(f"Pushing {len(data)}b.")
  151. resp = requests.post(
  152. f"{pool_url}/api/pool", data=data, headers={"X-Secret": secret}
  153. )
  154. (logger.success if resp.status_code == 200 else logger.error)(
  155. f"{resp.status_code}: {resp.text}"
  156. )
  157. def puller(queue, source, source_type, multiplier):
  158. while True:
  159. try:
  160. data = sample(source, source_type, multiplier)
  161. except KeyboardInterrupt:
  162. logger.info("Interrupted by user.")
  163. sys.exit(0)
  164. except Exception as e:
  165. logger.error(f"Pull exception: {e}")
  166. continue
  167. for piece in chunks(data, 1024 * 500):
  168. queue.put(piece)
  169. def pusher(queue, pool_url, secret, cooldown=0):
  170. while True:
  171. piece = queue.get()
  172. try:
  173. push(pool_url, piece, secret)
  174. except KeyboardInterrupt:
  175. logger.info("Interrupted by user.")
  176. sys.exit(0)
  177. except Exception as e:
  178. logger.error(f"Push exception: {e}")
  179. if cooldown:
  180. time.sleep(cooldown)
  181. if __name__ == "__main__":
  182. parser = argparse.ArgumentParser()
  183. parser.add_argument("--source", type=str, required=True)
  184. parser.add_argument("--source-type", type=str, default="video+audio")
  185. parser.add_argument("--multiplier", type=float, default=1)
  186. parser.add_argument("--secret-file", type=str, default="./.secret")
  187. parser.add_argument("--cooldown", type=int, default=0)
  188. parser.add_argument("--pool-url", type=str, default="https://trng.iike.ru")
  189. args = parser.parse_args()
  190. with open(args.secret_file, "r") as f:
  191. lines = f.read().strip().split("\n")
  192. ident = lines[0].strip()
  193. secret = lines[1].strip()
  194. secret = f"{ident} {secret}"
  195. q = queue.Queue()
  196. threading.Thread(
  197. target=puller, args=(q, args.source, args.source_type, args.multiplier)
  198. ).start()
  199. pusher_th = threading.Thread(
  200. target=pusher, args=(q, args.pool_url, secret, args.cooldown)
  201. )
  202. pusher_th.start()
  203. pusher_th.join()