# pyaudviz/core.py

import sys, io, os
from PySide2 import QtCore, QtGui
from PySide2.QtGui import QPainter, QColor
from os.path import expanduser
import subprocess as sp
import numpy
from PIL import Image, ImageDraw, ImageFont
from PIL.ImageQt import ImageQt
import tempfile
from shutil import rmtree
import atexit

class Core():

  def __init__(self):
    self.lastBackgroundImage = ""
    self._image = None

    self.FFMPEG_BIN = self.findFfmpeg()
    self.tempDir = None
    atexit.register(self.deleteTempDir)

  def findFfmpeg(self):
    if sys.platform == "win32":
      return "ffmpeg.exe"
    else:
      try:
        with open(os.devnull, "w") as f:
          sp.check_call(['ffmpeg', '-version'], stdout=f, stderr=f)
        return "ffmpeg"
      except:
        return "avconv"

  def parseBaseImage(self, backgroundImage, preview=False):
      ''' determines if the base image is a single frame or list of frames '''
      if backgroundImage == "":
         return []
      else:
         _, bgExt = os.path.splitext(backgroundImage)
         if not bgExt == '.mp4':
            return [backgroundImage]
         else:
            return self.getVideoFrames(backgroundImage, preview)

  def drawBaseImage(self, backgroundFile, titleText, titleFont, fontSize, alignment,\
                     xOffset, yOffset, textColor, visColor):
    ''' Draw the title text over the background and return a PIL image.

    backgroundFile   -- path of the background picture; '' selects a plain
                        black 1280x720 canvas
    titleText        -- text to draw
    titleFont        -- font used for the text; NOTE its pixel size is set
                        to fontSize on the object that was passed in
    fontSize         -- font size in pixels
    alignment        -- 0: text starts at xOffset, 1: text is centred on
                        xOffset, 2: text ends at xOffset; any other value
                        is handled like 0
    xOffset, yOffset -- anchor position handed to QPainter.drawText
    textColor        -- sequence unpacked into QColor()
    visColor         -- unused here; kept so existing callers keep working

    The Qt version of the (resized) background is cached on the instance
    and only rebuilt when backgroundFile differs from the previous call. '''
    if self._image is None or self.lastBackgroundImage != backgroundFile:
      # the file is only opened when the cached background is stale, so
      # repeated calls with the same file do not reopen it needlessly
      if backgroundFile == '':
        im = Image.new("RGB", (1280, 720), "black")
      else:
        im = Image.open(backgroundFile)

      # resize if necessary
      if im.size != (1280, 720):
        # LANCZOS is the filter the deprecated ANTIALIAS name referred to
        im = im.resize((1280, 720), Image.LANCZOS)

      self._image = ImageQt(im)
      # remember the file only once the cache really holds its image
      self.lastBackgroundImage = backgroundFile

    # paint on a separate QImage so the cached background stays text-free
    self._image1 = QtGui.QImage(self._image)
    painter = QPainter(self._image1)
    font = titleFont
    font.setPixelSize(fontSize)
    painter.setFont(font)
    painter.setPen(QColor(*textColor))

    textWidth = QtGui.QFontMetrics(font).width(titleText)
    if alignment == 1:      # Middle
      xPosition = xOffset - textWidth / 2
    elif alignment == 2:    # Right
      xPosition = xOffset - textWidth
    else:                   # Left, also the fallback for unknown values
      xPosition = xOffset
    # the (x, y, text) overload takes integer pixel coordinates
    painter.drawText(int(xPosition), int(yOffset), titleText)
    painter.end()

    # round-trip through an in-memory PNG to get back to a PIL image
    buffer = QtCore.QBuffer()
    buffer.open(QtCore.QIODevice.ReadWrite)
    self._image1.save(buffer, "PNG")

    strio = io.BytesIO()
    strio.write(buffer.data())
    buffer.close()
    strio.seek(0)
    return Image.open(strio)

  def drawBars(self, spectrum, image, color):
    ''' Paint the spectrum as 63 vertical bars on top of image.

    spectrum -- indexable sequence of bar heights; every fourth value
                (indices 0, 4, ... 248) is drawn
    image    -- PIL image pasted at the top-left of the output frame
    color    -- (r, g, b) tuple used for the bars; a wider bar with the
                same colour and alpha 50 is drawn behind each one

    Returns a new 1280x720 RGB image: the bars are drawn in the upper
    half and a vertically flipped copy of them fills the lower half. '''
    imTop = Image.new("RGBA", (1280, 360))
    draw = ImageDraw.Draw(imTop)
    r, g, b = color
    color2 = (r, g, b, 50)
    for j in range(63):
      height = spectrum[j * 4]
      left = 10 + j * 20
      # order the corners explicitly: newer Pillow versions raise
      # ValueError when y1 < y0 instead of swapping the two values
      haloTop, haloBottom = sorted((325, 325 - height - 10))
      draw.rectangle((left, haloTop, left + 20, haloBottom), fill=color2)
      barTop, barBottom = sorted((320, 320 - height))
      draw.rectangle((left + 5, barTop, left + 15, barBottom), fill=color)

    imBottom = imTop.transpose(Image.FLIP_TOP_BOTTOM)

    im = Image.new("RGB", (1280, 720), "black")
    im.paste(image, (0, 0))
    # the bar layers double as their own alpha mask
    im.paste(imTop, (0, 0), mask=imTop)
    im.paste(imBottom, (0, 360), mask=imBottom)

    return im

  def readAudioFile(self, filename):
    command = [ self.FFMPEG_BIN,
          '-i', filename,
          '-f', 's16le',
          '-acodec', 'pcm_s16le',
          '-ar', '44100', # ouput will have 44100 Hz
          '-ac', '1', # mono (set to '2' for stereo)
          '-']
    in_pipe = sp.Popen(command, stdout=sp.PIPE, stderr=sp.DEVNULL, bufsize=10**8)
    
    completeAudioArray = numpy.empty(0, dtype="int16")

    while True:
      # read 2 seconds of audio
      raw_audio = in_pipe.stdout.read(88200*4)
      if len(raw_audio) == 0:
        break
      audio_array = numpy.fromstring(raw_audio, dtype="int16")
      completeAudioArray = numpy.append(completeAudioArray, audio_array)
      # print(audio_array)

    in_pipe.kill()
    in_pipe.wait()

    # add 0s the end
    completeAudioArrayCopy = numpy.zeros(len(completeAudioArray) + 44100, dtype="int16")
    completeAudioArrayCopy[:len(completeAudioArray)] = completeAudioArray
    completeAudioArray = completeAudioArrayCopy

    return completeAudioArray

  def transformData(self, i, completeAudioArray, sampleSize, smoothConstantDown, smoothConstantUp, lastSpectrum):
    if len(completeAudioArray) < (i + sampleSize):
      sampleSize = len(completeAudioArray) - i

    window = numpy.hanning(sampleSize)
    data = completeAudioArray[i:i+sampleSize][::1] * window
    paddedSampleSize = 2048
    paddedData = numpy.pad(data, (0, paddedSampleSize - sampleSize), 'constant')
    spectrum = numpy.fft.fft(paddedData)
    sample_rate = 44100
    frequencies = numpy.fft.fftfreq(len(spectrum), 1./sample_rate)

    y = abs(spectrum[0:int(paddedSampleSize/2) - 1])

    # filter the noise away
    # y[y<80] = 0

    y = 20 * numpy.log10(y)
    y[numpy.isinf(y)] = 0

    if lastSpectrum is not None:
      lastSpectrum[y < lastSpectrum] = y[y < lastSpectrum] * smoothConstantDown + lastSpectrum[y < lastSpectrum] * (1 - smoothConstantDown)
      lastSpectrum[y >= lastSpectrum] = y[y >= lastSpectrum] * smoothConstantUp + lastSpectrum[y >= lastSpectrum] * (1 - smoothConstantUp)
    else:
      lastSpectrum = y

    x = frequencies[0:int(paddedSampleSize/2) - 1]

    return lastSpectrum

  def deleteTempDir(self):
     if self.tempDir and os.path.exists(self.tempDir):
         rmtree(self.tempDir)


  def getVideoFrames(self, videoPath, firstOnly=False):
      self.tempDir = os.path.join(tempfile.gettempdir(), 'audio-visualizer-python-data')
      # recreate the temporary directory so it is empty
      self.deleteTempDir()
      os.mkdir(self.tempDir)
      if firstOnly:
         filename = 'preview%s.jpg' % os.path.basename(videoPath).split('.', 1)[0]
         options = '-ss 10 -vframes 1'
      else:
         filename = '$frame%05d.jpg'
         options = ''
      sp.call( \
         '%s -i "%s" -y %s "%s"' % ( \
            self.FFMPEG_BIN,
            videoPath,
            options,
            os.path.join(self.tempDir, filename)
         ),
         shell=True
      )
      return sorted([os.path.join(self.tempDir, f) for f in os.listdir(self.tempDir)])

  @staticmethod
  def RGBFromString(string):
   ''' turns an RGB string like "255, 255, 255" into a tuple '''
   try:
     tup = tuple([int(i) for i in string.split(',')])
     if len(tup) != 3:
        raise ValueError
     for i in tup:
        if i > 255 or i < 0:
           raise ValueError
     return tup
   except:
     return (255, 255, 255)
add setup.py, automatic discovery for avconv/ffmpeg, add installation help to readme 2015-03-05 09:58:45 -05:00			`import sys, io, os`
Resolves #1 Update to use PySide2 & Qt5 2019-12-05 12:08:07 -05:00			`from PySide2 import QtCore, QtGui`
			`from PySide2.QtGui import QPainter, QColor`
first commit 2015-03-02 16:47:52 -05:00			`from os.path import expanduser`
			`import subprocess as sp`
			`import numpy`
			`from PIL import Image, ImageDraw, ImageFont`
			`from PIL.ImageQt import ImageQt`
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00			`import tempfile`
			`from shutil import rmtree`
			`import atexit`
first commit 2015-03-02 16:47:52 -05:00
			`class Core():`

			`def __init__(self):`
			`self.lastBackgroundImage = ""`
			`self._image = None`

add setup.py, automatic discovery for avconv/ffmpeg, add installation help to readme 2015-03-05 09:58:45 -05:00			`self.FFMPEG_BIN = self.findFfmpeg()`
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00			`self.tempDir = None`
			`atexit.register(self.deleteTempDir)`
add setup.py, automatic discovery for avconv/ffmpeg, add installation help to readme 2015-03-05 09:58:45 -05:00
			`def findFfmpeg(self):`
first commit 2015-03-02 16:47:52 -05:00			`if sys.platform == "win32":`
add setup.py, automatic discovery for avconv/ffmpeg, add installation help to readme 2015-03-05 09:58:45 -05:00			`return "ffmpeg.exe"`
first commit 2015-03-02 16:47:52 -05:00			`else:`
add setup.py, automatic discovery for avconv/ffmpeg, add installation help to readme 2015-03-05 09:58:45 -05:00			`try:`
			`with open(os.devnull, "w") as f:`
			`sp.check_call(['ffmpeg', '-version'], stdout=f, stderr=f)`
			`return "ffmpeg"`
			`except:`
			`return "avconv"`
first commit 2015-03-02 16:47:52 -05:00
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00			`def parseBaseImage(self, backgroundImage, preview=False):`
			`''' determines if the base image is a single frame or list of frames '''`
first commit 2015-03-02 16:47:52 -05:00			`if backgroundImage == "":`
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00			`return []`
first commit 2015-03-02 16:47:52 -05:00			`else:`
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00			`_, bgExt = os.path.splitext(backgroundImage)`
			`if not bgExt == '.mp4':`
			`return [backgroundImage]`
			`else:`
			`return self.getVideoFrames(backgroundImage, preview)`

text and visualization colour can be changed using commandline 2017-05-22 19:42:32 -04:00			`def drawBaseImage(self, backgroundFile, titleText, titleFont, fontSize, alignment,\`
			`xOffset, yOffset, textColor, visColor):`
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00			`if backgroundFile == '':`
			`im = Image.new("RGB", (1280, 720), "black")`
			`else:`
			`im = Image.open(backgroundFile)`

			`if self._image == None or not self.lastBackgroundImage == backgroundFile:`
			`self.lastBackgroundImage = backgroundFile`
first commit 2015-03-02 16:47:52 -05:00
			`# resize if necessary`
			`if not im.size == (1280, 720):`
			`im = im.resize((1280, 720), Image.ANTIALIAS)`

			`self._image = ImageQt(im)`
added back in spaces deleted by my editor 2017-05-18 19:54:48 -04:00
first commit 2015-03-02 16:47:52 -05:00			`self._image1 = QtGui.QImage(self._image)`
			`painter = QPainter(self._image1)`
			`font = titleFont`
try fixing problems with high dpi screens, font size for video in pixels 2017-05-23 15:24:58 -04:00			`font.setPixelSize(fontSize)`
first commit 2015-03-02 16:47:52 -05:00			`painter.setFont(font)`
text and visualization colour can be changed using commandline 2017-05-22 19:42:32 -04:00			`painter.setPen(QColor(*textColor))`
first commit 2015-03-02 16:47:52 -05:00
added font size of text in preview 2017-04-20 13:01:19 -04:00			`yPosition = yOffset`
added x/y offset of text in preview 2017-04-20 12:47:14 -04:00
Added text alignment option 2017-04-18 07:35:29 -04:00			`fm = QtGui.QFontMetrics(font)`
changed differentiater of text alignment from string to int 2017-04-20 19:00:17 -04:00			`if alignment == 0: #Left`
added font size of text in preview 2017-04-20 13:01:19 -04:00			`xPosition = xOffset`
changed differentiater of text alignment from string to int 2017-04-20 19:00:17 -04:00			`if alignment == 1: #Middle`
added font size of text in preview 2017-04-20 13:01:19 -04:00			`xPosition = xOffset - fm.width(titleText)/2`
changed differentiater of text alignment from string to int 2017-04-20 19:00:17 -04:00			`if alignment == 2: #Right`
added font size of text in preview 2017-04-20 13:01:19 -04:00			`xPosition = xOffset - fm.width(titleText)`
added x/y offset of text in preview 2017-04-20 12:47:14 -04:00			`painter.drawText(xPosition, yPosition, titleText)`
first commit 2015-03-02 16:47:52 -05:00			`painter.end()`

			`buffer = QtCore.QBuffer()`
			`buffer.open(QtCore.QIODevice.ReadWrite)`
			`self._image1.save(buffer, "PNG")`

			`strio = io.BytesIO()`
			`strio.write(buffer.data())`
			`buffer.close()`
			`strio.seek(0)`
			`return Image.open(strio)`

text and visualization colour can be changed using commandline 2017-05-22 19:42:32 -04:00			`def drawBars(self, spectrum, image, color):`
first commit 2015-03-02 16:47:52 -05:00
			`imTop = Image.new("RGBA", (1280, 360))`
			`draw = ImageDraw.Draw(imTop)`
text and visualization colour can be changed using commandline 2017-05-22 19:42:32 -04:00			`r, g, b = color`
			`color2 = (r, g, b, 50)`
first commit 2015-03-02 16:47:52 -05:00			`for j in range(0, 63):`
text and visualization colour can be changed using commandline 2017-05-22 19:42:32 -04:00			`draw.rectangle((10 + j * 20, 325, 10 + j * 20 + 20, 325 - spectrum[j * 4] * 1 - 10), fill=color2)`
			`draw.rectangle((15 + j * 20, 320, 15 + j * 20 + 10, 320 - spectrum[j * 4] * 1), fill=color)`
first commit 2015-03-02 16:47:52 -05:00

			`imBottom = imTop.transpose(Image.FLIP_TOP_BOTTOM)`
added back in spaces deleted by my editor 2017-05-18 19:54:48 -04:00
first commit 2015-03-02 16:47:52 -05:00			`im = Image.new("RGB", (1280, 720), "black")`
			`im.paste(image, (0, 0))`
			`im.paste(imTop, (0, 0), mask=imTop)`
			`im.paste(imBottom, (0, 360), mask=imBottom)`

			`return im`

			`def readAudioFile(self, filename):`
			`command = [ self.FFMPEG_BIN,`
			`'-i', filename,`
			`'-f', 's16le',`
			`'-acodec', 'pcm_s16le',`
			`'-ar', '44100', # ouput will have 44100 Hz`
			`'-ac', '1', # mono (set to '2' for stereo)`
			`'-']`
			`in_pipe = sp.Popen(command, stdout=sp.PIPE, stderr=sp.DEVNULL, bufsize=10**8)`
added back in spaces deleted by my editor 2017-05-18 19:54:48 -04:00
first commit 2015-03-02 16:47:52 -05:00			`completeAudioArray = numpy.empty(0, dtype="int16")`

			`while True:`
			`# read 2 seconds of audio`
			`raw_audio = in_pipe.stdout.read(88200*4)`
			`if len(raw_audio) == 0:`
			`break`
			`audio_array = numpy.fromstring(raw_audio, dtype="int16")`
			`completeAudioArray = numpy.append(completeAudioArray, audio_array)`
			`# print(audio_array)`

			`in_pipe.kill()`
			`in_pipe.wait()`

			`# add 0s the end`
			`completeAudioArrayCopy = numpy.zeros(len(completeAudioArray) + 44100, dtype="int16")`
			`completeAudioArrayCopy[:len(completeAudioArray)] = completeAudioArray`
			`completeAudioArray = completeAudioArrayCopy`

			`return completeAudioArray`

			`def transformData(self, i, completeAudioArray, sampleSize, smoothConstantDown, smoothConstantUp, lastSpectrum):`
			`if len(completeAudioArray) < (i + sampleSize):`
			`sampleSize = len(completeAudioArray) - i`

			`window = numpy.hanning(sampleSize)`
			`data = completeAudioArray[i:i+sampleSize][::1] * window`
			`paddedSampleSize = 2048`
			`paddedData = numpy.pad(data, (0, paddedSampleSize - sampleSize), 'constant')`
			`spectrum = numpy.fft.fft(paddedData)`
			`sample_rate = 44100`
			`frequencies = numpy.fft.fftfreq(len(spectrum), 1./sample_rate)`

cast slice indices to integer 2017-04-17 06:55:58 -04:00			`y = abs(spectrum[0:int(paddedSampleSize/2) - 1])`
first commit 2015-03-02 16:47:52 -05:00
			`# filter the noise away`
			`# y[y<80] = 0`

			`y = 20 * numpy.log10(y)`
			`y[numpy.isinf(y)] = 0`

			`if lastSpectrum is not None:`
			`lastSpectrum[y < lastSpectrum] = y[y < lastSpectrum] * smoothConstantDown + lastSpectrum[y < lastSpectrum] * (1 - smoothConstantDown)`
			`lastSpectrum[y >= lastSpectrum] = y[y >= lastSpectrum] * smoothConstantUp + lastSpectrum[y >= lastSpectrum] * (1 - smoothConstantUp)`
			`else:`
			`lastSpectrum = y`

cast slice indices to integer 2017-04-17 06:55:58 -04:00			`x = frequencies[0:int(paddedSampleSize/2) - 1]`
first commit 2015-03-02 16:47:52 -05:00
cast slice indices to integer 2017-04-17 06:55:58 -04:00			`return lastSpectrum`
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00
			`def deleteTempDir(self):`
			`if self.tempDir and os.path.exists(self.tempDir):`
			`rmtree(self.tempDir)`


			`def getVideoFrames(self, videoPath, firstOnly=False):`
			`self.tempDir = os.path.join(tempfile.gettempdir(), 'audio-visualizer-python-data')`
			`# recreate the temporary directory so it is empty`
			`self.deleteTempDir()`
			`os.mkdir(self.tempDir)`
			`if firstOnly:`
fixed preview not updating when changing between two videos making the filename of preview.jpg different each time seems to work 2017-05-21 20:07:07 -04:00			`filename = 'preview%s.jpg' % os.path.basename(videoPath).split('.', 1)[0]`
added ability to use an mp4 as the background might not be the best way to do this (dumping all the video frames to a temp location), but it works for clips of a few minutes or less 2017-05-18 19:14:27 -04:00			`options = '-ss 10 -vframes 1'`
			`else:`
			`filename = '$frame%05d.jpg'`
			`options = ''`
			`sp.call( \`
			`'%s -i "%s" -y %s "%s"' % ( \`
			`self.FFMPEG_BIN,`
			`videoPath,`
			`options,`
			`os.path.join(self.tempDir, filename)`
			`),`
			`shell=True`
			`)`
			`return sorted([os.path.join(self.tempDir, f) for f in os.listdir(self.tempDir)])`
colors are configurable in the GUI any invalid RGB tuple entered will result in white 2017-05-22 22:25:38 -04:00
			`@staticmethod`
			`def RGBFromString(string):`
			`''' turns an RGB string like "255, 255, 255" into a tuple '''`
			`try:`
			`tup = tuple([int(i) for i in string.split(',')])`
			`if len(tup) != 3:`
			`raise ValueError`
			`for i in tup:`
			`if i > 255 or i < 0:`
			`raise ValueError`
			`return tup`
			`except:`
			`return (255, 255, 255)`