python/scripts/aubiocut: add -b option
[aubio.git] / python / scripts / aubiocut
1 #! /usr/bin/env python
2
3 """ this file was written by Paul Brossier
4   it is released under the GNU/GPL license.
5 """
6
7 import sys
8 #from aubio.task import *
9
# usage banner: given to OptionParser and shown when no input file is passed
usage = ("usage: %s [options] -i soundfile"
         "\n help: %s -h") % (sys.argv[0], sys.argv[0])
12
def parse_args():
    """ parse the command line options

    Returns the (options, args) pair built by optparse.

    When no input file is given with -i, an error message followed by the
    usage banner is written to stderr and the script exits with status 1.
    """
    from optparse import OptionParser
    parser = OptionParser(usage=usage)
    parser.add_option("-i", "--input", action = "store", dest = "source_file",
            help="input sound file to analyse", metavar = "<source_file>")
    # adjacent literals are used instead of a backslash inside the string, so
    # that the source indentation does not end up in the displayed help
    parser.add_option("-m","--method",
            action="store", dest="onset_method", default='default',
            metavar = "<onset_method>",
            help="onset detection method [default=default] "
                 "complexdomain|hfc|phase|specdiff|energy|kl|mkl")
    # cutting methods
    parser.add_option("-b","--beat",
            action="store_true", dest="beat", default=False,
            help="use beat locations")
    # the options in the string below are disabled: the bare string literal is
    # evaluated and discarded, none of them is registered with the parser
    """
    parser.add_option("-S","--silencecut",
            action="store_true", dest="silencecut", default=False,
            help="use silence locations")
    parser.add_option("-s","--silence",
            metavar = "<value>",
            action="store", dest="silence", default=-70,
            help="silence threshold [default=-70]")
            """
    # algorithm parameters
    parser.add_option("--samplerate",
            metavar = "<freq>", type='int',
            action="store", dest="samplerate", default=0,
            help="samplerate at which the file should be represented")
    parser.add_option("-B","--bufsize",
            action="store", dest="bufsize", default=512,
            metavar = "<size>", type='int',
            help="buffer size [default=512]")
    parser.add_option("-H","--hopsize",
            metavar = "<size>", type='int',
            action="store", dest="hopsize", default=256,
            help="overlap size [default=256]")
    parser.add_option("-t","--threshold",
            metavar = "<value>", type="float",
            action="store", dest="threshold", default=0.3,
            help="onset peak picking threshold [default=0.3]")
    # the help no longer recommends -L, which is one of the disabled options
    parser.add_option("-c","--cut",
            action="store_true", dest="cut", default=False,
            help="cut input sound file at detected labels")
    # disabled options, see the note above
    """
    parser.add_option("-D","--delay",
            action = "store", dest = "delay", type = "float",
            metavar = "<seconds>", default=0,
            help="number of seconds to take back [default=system]\
                    default system delay is 3*hopsize/samplerate")
    parser.add_option("-C","--dcthreshold",
            metavar = "<value>",
            action="store", dest="dcthreshold", default=1.,
            help="onset peak picking DC component [default=1.]")
    parser.add_option("-M","--mintol",
            metavar = "<value>",
            action="store", dest="mintol", default=0.048,
            help="minimum inter onset interval [default=0.048]")
    parser.add_option("-L","--localmin",
            action="store_true", dest="localmin", default=False,
            help="use local minima after peak detection")
    parser.add_option("-d","--derivate",
            action="store_true", dest="derivate", default=False,
            help="derivate onset detection function")
    parser.add_option("-z","--zerocross",
            metavar = "<value>",
            action="store", dest="zerothres", default=0.008,
            help="zero-crossing threshold for slicing [default=0.00008]")
            """
    # plotting functions (disabled as well)
    """
    parser.add_option("-p","--plot",
            action="store_true", dest="plot", default=False,
            help="draw plot")
    parser.add_option("-x","--xsize",
            metavar = "<size>",
            action="store", dest="xsize", default=1.,
            type='float', help="define xsize for plot")
    parser.add_option("-y","--ysize",
            metavar = "<size>",
            action="store", dest="ysize", default=1.,
            type='float', help="define ysize for plot")
    parser.add_option("-f","--function",
            action="store_true", dest="func", default=False,
            help="print detection function")
    parser.add_option("-n","--no-onsets",
            action="store_true", dest="nplot", default=False,
            help="do not plot detected onsets")
    parser.add_option("-O","--outplot",
            metavar = "<output_image>",
            action="store", dest="outplot", default=None,
            help="save plot to output.{ps,png}")
    parser.add_option("-F","--spectrogram",
            action="store_true", dest="spectro", default=False,
            help="add spectrogram to the plot")
    """
    # -v and -q share the same destination; verbose is on unless -q is given
    parser.add_option("-v","--verbose",
            action="store_true", dest="verbose", default=True,
            help="make lots of noise [default]")
    parser.add_option("-q","--quiet",
            action="store_false", dest="verbose", default=True,
            help="be quiet")
    (options, args) = parser.parse_args()
    if not options.source_file:
        # report on stderr, like the other messages of this script, so that
        # stdout only ever carries the detected timestamps
        sys.stderr.write("no file name given\n%s\n" % usage)
        sys.exit(1)
    return options, args
120
if __name__ == '__main__':
    # entry point: find onsets (or beats with -b) in the input file, print
    # them, and with -c write one .wav file per region between timestamps
    options, args = parse_args()

    hopsize = options.hopsize
    bufsize = options.bufsize
    samplerate = options.samplerate
    source_file = options.source_file

    from aubio import onset, tempo, source, sink

    s = source(source_file, samplerate, hopsize)
    # 0 is the default of --samplerate: use the rate reported by the source
    if samplerate == 0: samplerate = s.get_samplerate()

    if options.beat:
        o = tempo(options.onset_method, bufsize, hopsize)
    else:
        o = onset(options.onset_method, bufsize, hopsize)
    o.set_threshold(options.threshold)

    timestamps = []
    total_frames = 0
    # analyze pass
    while True:
        samples, read = s()
        if o(samples):
            # positions are stored as returned by get_last() and used as
            # sample indices in the cutting pass; seconds are only printed
            timestamps.append(o.get_last())
            if options.verbose:
                sys.stdout.write("%.4f\n" % o.get_last_s())
        total_frames += read
        # a short read marks the end of the file
        if read < hopsize: break
    del s
    # print some info
    nstamps = len(timestamps)
    duration = float(total_frames) / float(samplerate)
    info = 'found %d timestamps in %s' % (nstamps, source_file)
    info += ' (total %.2fs at %dHz)\n' % (duration, samplerate)
    sys.stderr.write(info)

    # cutting pass
    if options.cut and nstamps > 0:
        # generate output filenames
        import os
        source_base_name = os.path.splitext(os.path.basename(source_file))[0]
        def new_sink_name(source_base_name, timestamp):
            return source_base_name + '_%02.3f' % (timestamp) + '.wav'
        # reopen source file; samplerate was already resolved in the first pass
        s = source(source_file, samplerate, hopsize)
        # create first sink at 0
        g = sink(new_sink_name(source_base_name, 0.), samplerate)
        total_frames = 0
        # index of the next timestamp that has not been cut yet
        stamp_idx = 0
        while True:
            vec, read = s()
            # number of samples of this block already sent to a sink
            written = 0
            # handle every timestamp that falls inside (or before) this block,
            # not only the first one, so that the offset is never negative
            while stamp_idx < nstamps:
                next_onset = int(timestamps[stamp_idx])
                if next_onset - total_frames > read:
                    break
                # clamp so that a timestamp lying before the samples already
                # written cannot produce a negative or backward slice
                cut = max(next_onset - total_frames, written)
                # write remaining samples from current region
                # NOTE(review): empty writes are skipped; whether sink accepts
                # a zero-length vector is not visible from this file
                if cut > written:
                    g(vec[written:cut], cut - written)
                # close this file
                del g
                # create a new file for the new region
                g = sink(new_sink_name(source_base_name, next_onset / float(samplerate)), samplerate)
                written = cut
                stamp_idx += 1
            # whatever is left of the block belongs to the current region
            if read > written:
                g(vec[written:read], read - written)
            total_frames += read
            if read < hopsize: break
        # release the last sink and the source, as done for the other sinks
        del g
        del s

        # print some info
        duration = float(total_frames) / float(samplerate)
        info = 'created %d slices from %s' % (nstamps, source_file)
        info += ' (total %.2fs at %dHz)\n' % (duration, samplerate)
        sys.stderr.write(info)