示例#1
0
文件: multigram.py 项目: cutun/kazoo
def file_test(small_exponent=9, large_exponent=12):
  """Render a multigram of 'test.wav' and save it as 'test.png'.

  Builds a K.Multigram from the two exponents, runs transform_fwd on the
  sound one row at a time, converts the result with
  util.energy_to_loudness and writes it out through formats.write_image.

  Args:
    small_exponent: first argument handed to K.Multigram.
    large_exponent: second argument handed to K.Multigram.
  """
  s = K.Multigram(small_exponent, large_exponent)
  size_in = s.size_in
  large_size = s.size_out
  # Number of rows to process; the value itself is arbitrary.  Floor
  # division keeps it an int on Python 3 too, which range() and the
  # size arguments below require.
  length = s.size_out // 2

  # Single-argument print(...) prints the same text on Python 2 and 3.
  print("reading sound file")
  # presumably (path, total samples, samples per row) -- confirm against
  # formats.read_wav
  sound = formats.read_wav('test.wav', size_in*length, size_in)
  image = K.Reals(length, large_size)

  print("transforming data")
  for i in range(length):
    # Row i of the sound is transformed into row i of the image.
    s.transform_fwd(sound[i,:], image[i,:])
  # The raw audio is no longer needed once every row is transformed.
  del sound

  print("saving image")
  # The small offset presumably keeps exact zeros out of the loudness
  # conversion -- TODO confirm.
  image = util.energy_to_loudness(image + 1e-5)
  formats.write_image(image, 'test.png')
示例#2
0
文件: supergram.py 项目: cutun/kazoo
def show_file(size_exponent=10, time_exponent=2, freq_exponent=3):
  """Show the supergram of 'test.wav' and save it as 'test.png'.

  Builds a K.Supergram from the three exponents, runs transform_fwd on
  the sound one row at a time, converts the result with
  K.util.energy_to_loudness, writes it through formats.write_image and
  calls .show() on the value that write_image returns.

  Args:
    size_exponent: first argument handed to K.Supergram.
    time_exponent: second argument handed to K.Supergram.
    freq_exponent: third argument handed to K.Supergram.
  """
  s = K.Supergram(size_exponent, time_exponent, freq_exponent)
  small_size = s.small_size
  large_size = s.super_size
  # Number of rows to process; the value itself is arbitrary.
  length = s.super_size

  # Single-argument print(...) prints the same text on Python 2 and 3.
  print("reading sound file")
  # presumably (path, total samples, samples per row) -- confirm against
  # formats.read_wav
  sound = formats.read_wav('test.wav', small_size*length, small_size)
  image = K.transforms.Reals(length, large_size)

  print("transforming data")
  for i in range(length):
    # Row i of the sound is transformed into row i of the image.
    s.transform_fwd(sound[i,:], image[i,:])

  print("saving image")
  # The small offset presumably keeps exact zeros out of the loudness
  # conversion -- TODO confirm.
  image = K.util.energy_to_loudness(image + 1e-5)
  formats.write_image(image, 'test.png').show()
示例#3
0
文件: pitchgram.py 项目: fritzo/kazoo
def show_file(bank_size=512, block_size=K.DEFAULT_FRAMES_PER_BUFFER):
    """Show the pitchgram of 'test.wav' and save it as 'test.png'.

    Builds a K.Pitchgram(block_size, bank_size), runs transform on the
    sound one row at a time, converts the result with
    K.util.energy_to_loudness, writes it through formats.write_image and
    calls .show() on the value that write_image returns.

    Args:
        bank_size: output size handed to K.Pitchgram; also the width of
            the image.
        block_size: input size handed to K.Pitchgram; also the width of
            each row read from the sound file.
    """
    size_in = block_size
    size_out = bank_size
    # Number of rows to process; the 16/9 factor is arbitrary.  Floor
    # division keeps the count an int on Python 3 too, which range() and
    # the size arguments below require.
    length = size_out * 16 // 9

    pitchgram = K.Pitchgram(size_in, size_out)

    # Single-argument print(...) prints the same text on Python 2 and 3.
    print("reading sound file")
    # presumably (path, total samples, samples per row) -- confirm
    # against formats.read_wav
    sound = formats.read_wav("test.wav", size_in * length, size_in)
    image = K.transforms.Reals(length, size_out)

    print("transforming data")
    for i in range(length):
        # Row i of the sound is transformed into row i of the image.
        pitchgram.transform(sound[i, :], image[i, :])

    print("saving image")
    # The small offset presumably keeps exact zeros out of the loudness
    # conversion -- TODO confirm.
    image = K.util.energy_to_loudness(image + 1e-5)
    formats.write_image(image, "test.png").show()
示例#4
0
文件: read_wav.py 项目: cutun/kazoo
def read_spectrogram(exponent=10, wavname='test.wav'):
  """
  Read a sound file, compute its spectrogram and write it to 'test.png'.

  The sound is read as `width` rows of `width` samples each, where
  width = 1 << exponent.  Every row is passed through
  K.Spectrogram(exponent).transform_fwd into a row of width // 2 values,
  and the result is converted with formats.energy_to_loudness before
  being written through formats.write_image.

  Args:
    exponent: log2 of the row width; also handed to K.Spectrogram.
    wavname: path of the sound file handed to formats.read_wav.
  """

  width = 1 << exponent
  height = width
  size = height * width

  # Single-argument print(...) prints the same text on Python 2 and 3.
  print("reading sound file")
  # presumably (path, total samples, samples per row) -- confirm against
  # formats.read_wav
  sound = formats.read_wav(wavname, size, width)
  # Floor division keeps the column count an int on Python 3 as well.
  image = K.Reals(height, width // 2)

  print("transforming data")
  s = K.Spectrogram(exponent)
  for i in range(height):
    # Row i of the sound is transformed into row i of the image.
    s.transform_fwd(sound[i,:],image[i,:])

  print("saving image")
  # NOTE(review): energy_to_loudness is looked up on `formats` here --
  # confirm that module actually exports it.
  image = formats.energy_to_loudness(image)
  formats.write_image(image, 'test.png')