Não pode escolher mais do que 25 tópicos Os tópicos devem começar com uma letra ou um número, podem incluir traços ('-') e podem ter até 35 caracteres.

producers.py 6.7 KiB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176
  1. """Classes for producing videos"""
  2. from abc import ABC
  3. import json
  4. import logging
  5. import os
  6. import subprocess
  7. import tempfile
  8. # for visualisations:
  9. import matplotlib.pyplot as plt
  10. # for encoding as JSON
  11. from pipeline.utils import Feature
  12. class Producer(ABC):
  13. """Generic producer interface."""
  14. def __init__(self, features):
  15. """All producers should take a list of features as input"""
  16. def produce(self):
  17. """All Producers should produce something!"""
  18. class VideoProducer(Producer):
  19. """Video producer interface."""
  20. class FfmpegVideoProducer(VideoProducer):
  21. """Produce videos using ffmpeg"""
  22. # TODO: consider output filename options
  23. _CONFIG_COMPILE_CLIPS = True
  24. def __init__(self, features, compile_clips=_CONFIG_COMPILE_CLIPS) -> None:
  25. if not features:
  26. raise ValueError("No features provided")
  27. # TODO: consider if we want to permit empty features (producing no video)
  28. self.features = features
  29. self._compile_clips = compile_clips
  30. def _run_no_output(self, cmd: list, cwd:str=".") -> None:
  31. """Run a command and return the output as a string
  32. Defined to be mocked out in tests via unittest.mock.patch
  33. """
  34. subprocess.run(cmd, stdout=None, stderr=None, cwd=cwd)
  35. def _ffmpeg_feature_to_clip(self, feature=None, output_filepath=None):
  36. """use ffmpeg to produve a video clip from a feature"""
  37. OVERWRITE = True # TODO: consider making this a config option
  38. if not feature or not feature.interval:
  39. raise ValueError("No feature provided")
  40. if not output_filepath:
  41. raise ValueError("No output filepath provided")
  42. ffmpeg_prefix = ["ffmpeg", "-y"] if OVERWRITE else ["ffmpeg"]
  43. ffmpeg_suffix = ["-r", "60", "-c:v", "libx264", "-crf", "26", "-c:a", "aac", "-preset", "ultrafast"]
  44. # TODO: match framerate of input video
  45. # TODO: adjustable encoding options
  46. seek = ["-ss", str(feature.interval.start)]
  47. duration = ["-t", str(feature.interval.duration)]
  48. ffmpeg_args = ffmpeg_prefix + seek + ["-i"] + [feature.source.path] +\
  49. duration + ffmpeg_suffix + [output_filepath]
  50. logging.info(f"ffmpeg_args: {ffmpeg_args}")
  51. self._run_no_output(ffmpeg_args)
  52. def _ffmpeg_concat_clips(self, clips=None, output_filepath=None):
  53. """use ffmpeg to concatenate clips into a single video"""
  54. OVERWRITE = True
  55. ffmpeg_prefix = ["ffmpeg"]
  56. ffmpeg_prefix += ["-y"] if OVERWRITE else []
  57. ffmpeg_prefix += ["-f", "concat", "-safe", "0", "-i"]
  58. # there is a method to do this via process substitution, but it's not portable
  59. # so we'll use the input file list method
  60. if not clips:
  61. raise ValueError("No clips provided")
  62. if not output_filepath:
  63. raise ValueError("No output filepath provided")
  64. # generate a temporary file with the list of clips
  65. join_file = tempfile.NamedTemporaryFile(mode="w")
  66. for clip in clips:
  67. join_file.write(f"file '{clip}'\n")
  68. join_file.flush()
  69. ffmpeg_args = ffmpeg_prefix + [join_file.name] + ["-c", "copy", output_filepath]
  70. logging.info(f"ffmpeg_args: {ffmpeg_args}")
  71. self._run_no_output(ffmpeg_args)
  72. join_file.close()
  73. def produce(self):
  74. OUTPUT_DIR = "/tmp/" # TODO: make this a config option
  75. clips = []
  76. for num, feature in enumerate(self.features):
  77. output_filepath = f"{OUTPUT_DIR}/highlight_{num}.mp4"
  78. self._ffmpeg_feature_to_clip(feature, output_filepath)
  79. clips.append(output_filepath)
  80. # concatenate the clips
  81. if self._compile_clips:
  82. output_filepath = f"{OUTPUT_DIR}/highlights.mp4"
  83. self._ffmpeg_concat_clips(clips, output_filepath)
  84. logging.info(f"Produced video: {output_filepath}")
  85. class VisualisationProducer(Producer):
  86. """Visualisation producer -- illustrate the features we have extracted"""
  87. def __init__(self, features):
  88. if not features:
  89. raise ValueError("No features provided")
  90. self.features = features
  91. def produce(self):
  92. """Produce visualisation"""
  93. # basic idea: use matplotlib to plot:
  94. # - a wide line segment representing the source video[s]
  95. # - shorter line segments representing the features extracted where:
  96. # + width represents duration
  97. # + colour represents feature type
  98. # + position represents time
  99. # - save as image
  100. plotted_source_videos = []
  101. bar_labels = []
  102. fig, ax = plt.subplots()
  103. for feature in self.features:
  104. # plot source video line if not done already
  105. if feature.source not in plotted_source_videos:
  106. # use video duration as width
  107. # ax.plot([0, feature.source.duration()], [0, 0], color='black', linewidth=10)
  108. ax.broken_barh([(0, feature.source.duration())], (0, 5), facecolors='grey')
  109. plotted_source_videos.append(feature.source)
  110. bar_labels.append(os.path.basename(feature.source.path))
  111. # annotate the source video
  112. ax.text(0.25, 0.25, os.path.basename(feature.source.path), ha='left', va='bottom',
  113. fontsize=16)
  114. # plot feature line
  115. # ax.plot([feature.interval.start, feature.interval.end], [1, 1], color='red', linewidth=5)
  116. ax.broken_barh([(feature.interval.start, feature.interval.duration)], (10, 5), facecolors='red')
  117. if feature.feature_extractor not in bar_labels:
  118. bar_labels.append(feature.feature_extractor)
  119. # label bar with feature extractor
  120. ax.text(0, 8, feature.feature_extractor, ha='left', va='bottom',
  121. fontsize=16)
  122. # label the plot's axes
  123. ax.set_xlabel('Time')
  124. # ax.set_yticks([], labels=bar_labels)
  125. ax.set_yticks([])
  126. # ax.tick_params(axis='y', labelrotation=90, ha='right')
  127. # save the plot
  128. plt.savefig("/tmp/visualisation.png")
  129. plt.close()
  130. class PipelineJSONEncoder(json.JSONEncoder):
  131. def default(self, obj):
  132. if hasattr(obj, 'to_json'):
  133. return obj.to_json()
  134. else:
  135. return json.JSONEncoder.default(self, obj)
  136. class JSONProducer(Producer):
  137. """Produce JSON output"""
  138. def __init__(self, features):
  139. if not features:
  140. raise ValueError("No features provided")
  141. self.features = features
  142. def produce(self):
  143. # FIXME: config option for output path
  144. with open("/tmp/features.json", "w") as jsonfile:
  145. jsonfile.write(json.dumps(self.features, cls=PipelineJSONEncoder, indent=4))