shithub: aubio

ref: 197571a68720b9cceafb22353d2bb6a654ed2a4a
dir: /python/aubiopitch/

View raw version
#!/usr/bin/python

""" this file was written by Paul Brossier 
  it is released under the GNU/GPL license.
"""

import sys
from aubio.tasks import *

# one-line usage banner: handed to OptionParser and printed when no input file is given
usage = "usage: %s [options] -i soundfile" % (sys.argv[0],)


def parse_args():
        """ parse the command line and return the tuple (options, args)

        Options left unset on the command line are completed here:
          - bufsize defaults to the largest buffer size preferred by the
            selected pitch detection mode(s), or 2048 when no selected mode
            has a preferred size;
          - hopsize defaults to half of bufsize.

        Prints the usage string and exits with status 1 when no input file
        was given with -i.
        """
        from optparse import OptionParser
        parser = OptionParser(usage=usage)
        parser.add_option("-i","--input",
                          action="store", dest="filename", 
                          help="input sound file")
        parser.add_option("-m","--mode", action="callback", 
                          callback=check_pitch_mode, dest="mode", 
                          default=[aubio_pitch_mcomb],
                          help="pitch detection mode [default=mcomb] \
                          mcomb|yin|fcomb|schmitt")
        parser.add_option("-u","--units", action="callback", 
                          callback=check_pitchm_mode, dest="omode",
                          default=aubio_pitchm_freq,
                          help="output pitch in units [default=Hz] \
                          freq|midi|cent|bin")
        parser.add_option("-B","--bufsize",
                          action="store", dest="bufsize", default=None, 
                          help="buffer size [default depends on mode: "
                               "yin=1024, schmitt=2048, mcomb|fcomb=4096]")
        parser.add_option("-H","--hopsize",
                          action="store", dest="hopsize", default=None, 
                          help="overlap size [default=bufsize/2]")
        parser.add_option("-t","--threshold",
                          action="store", dest="threshold", default=0.1, 
                          help="pitch threshold (for yin) [default=0.1]")
        parser.add_option("-s","--silence",
                          action="store", dest="silence", default=-70, 
                          help="silence threshold [default=-70]")
        parser.add_option("-D","--delay",
                          action="store", dest="delay",  
                          help="number of seconds to take back [default=system]\
                          default system delay is 2*hopsize/samplerate")
        parser.add_option("-L","--localmin",
                          action="store_true", dest="localmin", default=False, 
                          help="use local minima after peak detection")
        parser.add_option("-c","--cut",
                          action="store_true", dest="cut", default=False,
                          help="cut input sound file at detected labels \
                          best used with option -L")
        # to be implemented
        parser.add_option("-n","--note",
                          action="store_true", dest="note", default=False,
                          help="NOT IMPLEMENTED output notes")
        # plotting functions
        parser.add_option("-p","--plot",
                          action="store_true", dest="plot", default=False, 
                          help="NOT IMPLEMENTED draw plot")
        parser.add_option("-O","--outplot",
                          action="store", dest="outplot", default=None, 
                          help="NOT IMPLEMENTED save plot to output.{ps,png}")
        # NOTE(review): the help text calls verbose the default, yet both -v
        # and -q use default=False, so -q is currently a no-op -- confirm
        # which of the two is intended before changing it.
        parser.add_option("-v","--verbose",
                          action="store_true", dest="verbose", default=False,
                          help="make lots of noise [default]")
        parser.add_option("-q","--quiet",
                          action="store_false", dest="verbose", default=False, 
                          help="be quiet")
        (options, args) = parser.parse_args()
        if not options.bufsize:
                # options.mode holds a sequence of modes (its default is a
                # one-element list), so it is matched element by element; a
                # bare single mode is tolerated as well.
                modes = options.mode
                if not isinstance(modes, (list, tuple)):
                        modes = [modes]
                preferred = (
                        (aubio_pitch_yin,     1024),
                        (aubio_pitch_schmitt, 2048),
                        (aubio_pitch_mcomb,   4096),
                        (aubio_pitch_fcomb,   4096),
                )
                sizes = []
                for selected in modes:
                        for known, size in preferred:
                                if selected == known:
                                        sizes.append(size)
                # a single buffer size is shared by every selected mode, so
                # take the largest preferred one; 2048 is the fallback
                options.bufsize = max(sizes or [2048])
        if not options.hopsize:
                options.hopsize = float(options.bufsize) / 2
        if not options.filename: 
                # single-argument form prints the same text on python 2 and 3
                print("no file name given\n" + usage)
                sys.exit(1)
        return options, args

options, args = parse_args()

#print options.bufsize, options.hopsize

# convert the parsed options to the numeric types used below
filename   = options.filename
samplerate = float(sndfile(filename).samplerate())
hopsize    = int(options.hopsize)
bufsize    = int(options.bufsize)
# samplerate / hopsize; frame index j is printed as j/step below
step       = float(samplerate)/float(hopsize)
threshold  = float(options.threshold)
silence    = float(options.silence)
mode       = options.mode
#mintol     = float(options.mintol)*step
# default take back system delay
if options.delay: delay = float(options.delay)
else:             delay = 2./step

if options.note:
        # sys.exit instead of the exit() builtin, which is injected by the
        # site module and therefore missing under `python -S`
        sys.exit("not implemented yet")

# run getpitch once per requested mode; pitch collects one track per mode
pitch = []
for detector in mode:
        track = getpitch(filename, #threshold,
                mode=detector,
                omode=options.omode,
                bufsize=bufsize,hopsize=hopsize,
                silence=silence)
        # zero every value above 1500 or below 40, in place
        # NOTE(review): these bounds are applied whatever unit was selected
        # with -u -- confirm they are meant for non-Hz output as well.
        for j, value in enumerate(track):
                if value > 1500 or value < 40:
                        track[j] = 0.
        pitch.append(track)

## take back system delay
#if delay != 0:
#        for i in range(len(onsets)):
#                onsets[i] -= delay*step
#
## prune doubled 
#if mintol > 0:
#        last = -2*mintol
#        newonsets = []
#        for new in onsets:
#                if (new - last > mintol): 
#                        newonsets.append(new)
#                last = new
#        onsets = newonsets

# print times in second
# one line per frame: the time, then one value per mode, each followed by a
# tab; the `pitch` guard avoids an IndexError when no mode was selected
if options.verbose and pitch:
        for j in range(len(pitch[0])):
                fields = ["%f\t" % (j/step)]
                for track in pitch:
                        fields.append("%f\t" % track[j])
                sys.stdout.write("".join(fields) + "\n")

if options.plot:
        from aubio.gnuplot import plot_pitch
        plot_pitch(filename, pitch, 
                samplerate=samplerate, hopsize=hopsize, outplot=options.outplot)