source: python/scripts/aubiocut @ 8b884ef

feature/autosink feature/cnn feature/cnn_org feature/constantq feature/crepe feature/crepe_org feature/pitchshift feature/pydocstrings feature/timestretch fix/ffmpeg5 pitchshift sampler timestretch yinfft+
Last change on this file since 8b884ef was dee4164, checked in by Paul Brossier <piem@piem.org>, 12 years ago

python/scripts/aubiocut: add slicing

  • Property mode set to 100755
File size: 7.9 KB
Line 
1#! /usr/bin/env python
2
3""" this file was written by Paul Brossier
4  it is released under the GNU/GPL license.
5"""
6
7import sys
8#from aubio.task import *
9
usage = "usage: %s [options] -i soundfile" % sys.argv[0]
usage += "\nhelp: %s -h" % sys.argv[0]


def parse_args():
    """Parse the command line arguments of the script.

    Registers the input file, onset detection and cutting options on an
    ``optparse.OptionParser`` and parses ``sys.argv``.

    Returns:
        The ``(options, args)`` tuple produced by
        ``OptionParser.parse_args()``. ``options.bufsize``,
        ``options.hopsize`` and ``options.samplerate`` are integers and
        ``options.threshold`` is a float.

    Raises:
        SystemExit: with status 1, after printing the usage message, when
            no input file was given with ``-i``/``--input``.
    """
    from optparse import OptionParser
    parser = OptionParser(usage=usage)
    parser.add_option("-i", "--input", action="store", dest="source_file",
            help="input sound file to analyse", metavar="<source_file>")
    parser.add_option("-m", "--method",
            action="store", dest="onset_method", default='default',
            metavar="<onset_method>",
            help="onset detection method [default=default] "
                 "complexdomain|hfc|phase|specdiff|energy|kl|mkl")

    # cutting methods
    # (disabled: the options below are currently not registered)
    # parser.add_option("-b","--beat",
    #         action="store_true", dest="beat", default=False,
    #         help="use beat locations")
    # parser.add_option("-S","--silencecut",
    #         action="store_true", dest="silencecut", default=False,
    #         help="use silence locations")
    # parser.add_option("-s","--silence",
    #         metavar = "<value>",
    #         action="store", dest="silence", default=-70,
    #         help="silence threshold [default=-70]")

    # algorithm parameters
    parser.add_option("--samplerate",
            metavar="<freq>", type='int',
            action="store", dest="samplerate", default=0,
            help="samplerate at which the file should be represented")
    # The sizes must be declared as integers: without a type, optparse
    # returns values given on the command line as strings.
    parser.add_option("-B", "--bufsize",
            action="store", dest="bufsize", default=512,
            metavar="<size>", type='int',
            help="buffer size [default=512]")
    parser.add_option("-H", "--hopsize",
            metavar="<size>", type='int',
            action="store", dest="hopsize", default=256,
            help="overlap size [default=256]")
    parser.add_option("-t", "--threshold",
            metavar="<value>", type="float",
            action="store", dest="threshold", default=0.3,
            help="onset peak picking threshold [default=0.3]")
    # NOTE: the help text mentions -L, which is among the disabled options
    # listed below.
    parser.add_option("-c", "--cut",
            action="store_true", dest="cut", default=False,
            help="cut input sound file at detected labels "
                 "best used with option -L")

    # (disabled: the options below are currently not registered)
    # parser.add_option("-D","--delay",
    #         action = "store", dest = "delay", type = "float",
    #         metavar = "<seconds>", default=0,
    #         help="number of seconds to take back [default=system]\
    #                 default system delay is 3*hopsize/samplerate")
    # parser.add_option("-C","--dcthreshold",
    #         metavar = "<value>",
    #         action="store", dest="dcthreshold", default=1.,
    #         help="onset peak picking DC component [default=1.]")
    # parser.add_option("-M","--mintol",
    #         metavar = "<value>",
    #         action="store", dest="mintol", default=0.048,
    #         help="minimum inter onset interval [default=0.048]")
    # parser.add_option("-L","--localmin",
    #         action="store_true", dest="localmin", default=False,
    #         help="use local minima after peak detection")
    # parser.add_option("-d","--derivate",
    #         action="store_true", dest="derivate", default=False,
    #         help="derivate onset detection function")
    # parser.add_option("-z","--zerocross",
    #         metavar = "<value>",
    #         action="store", dest="zerothres", default=0.008,
    #         help="zero-crossing threshold for slicing [default=0.00008]")

    # plotting functions
    # (disabled: the options below are currently not registered)
    # parser.add_option("-p","--plot",
    #         action="store_true", dest="plot", default=False,
    #         help="draw plot")
    # parser.add_option("-x","--xsize",
    #         metavar = "<size>",
    #         action="store", dest="xsize", default=1.,
    #         type='float', help="define xsize for plot")
    # parser.add_option("-y","--ysize",
    #         metavar = "<size>",
    #         action="store", dest="ysize", default=1.,
    #         type='float', help="define ysize for plot")
    # parser.add_option("-f","--function",
    #         action="store_true", dest="func", default=False,
    #         help="print detection function")
    # parser.add_option("-n","--no-onsets",
    #         action="store_true", dest="nplot", default=False,
    #         help="do not plot detected onsets")
    # parser.add_option("-O","--outplot",
    #         metavar = "<output_image>",
    #         action="store", dest="outplot", default=None,
    #         help="save plot to output.{ps,png}")
    # parser.add_option("-F","--spectrogram",
    #         action="store_true", dest="spectro", default=False,
    #         help="add spectrogram to the plot")

    # -v and -q share the same destination; verbose is on by default
    parser.add_option("-v", "--verbose",
            action="store_true", dest="verbose", default=True,
            help="make lots of noise [default]")
    parser.add_option("-q", "--quiet",
            action="store_false", dest="verbose", default=True,
            help="be quiet")
    (options, args) = parser.parse_args()
    if not options.source_file:
        # single-argument call form: same output on Python 2 and Python 3
        print("no file name given\n" + usage)
        sys.exit(1)
    return options, args
120
if __name__ == '__main__':
    # Script entry point: detect onsets in the input file, report them, and
    # optionally (option --cut) write one sound file per detected region.
    options, args = parse_args()

    # optparse returns strings for options declared without a type; make
    # sure the sizes are integers before comparing them with frame counts
    hopsize = int(options.hopsize)
    bufsize = int(options.bufsize)
    samplerate = options.samplerate
    source_file = options.source_file

    from aubio import onset, source, sink

    s = source(source_file, samplerate, hopsize)
    # no samplerate requested (0): use the one reported by the source
    if samplerate == 0:
        samplerate = s.get_samplerate()

    o = onset(options.onset_method, bufsize, hopsize)
    o.set_threshold(options.threshold)

    timestamps = []
    total_frames = 0
    # analyze pass: read the file hop by hop and collect the onsets
    while True:
        samples, read = s()
        if o(samples):
            # kept for the cutting pass, which compares it to frame counts
            this_onset = o.get_last_onset()
            if options.verbose:
                # single-argument call form works on Python 2 and Python 3
                print("%.4f" % o.get_last_onset_s())
            timestamps.append(this_onset)
        total_frames += read
        # a short read marks the last hop of the file
        if read < hopsize:
            break

    # print some info
    nstamps = len(timestamps)
    duration = float(total_frames) / float(samplerate)
    info = 'found %(nstamps)d timestamps in %(source_file)s' % locals()
    info += ' (total %(duration).2fs at %(samplerate)dHz)\n' % locals()
    sys.stderr.write(info)

    # cutting pass
    if options.cut and nstamps > 0:
        # generate output filenames
        import os
        source_base_name = os.path.splitext(os.path.basename(source_file))[0]

        def new_sink_name(source_base_name, timestamp):
            """Return the output file name of the slice starting at timestamp."""
            return source_base_name + '_%02.3f' % (timestamp) + '.wav'

        # reopen source file
        del s
        s = source(source_file, samplerate, hopsize)
        # create first sink at 0
        g = sink(new_sink_name(source_base_name, 0.), samplerate)
        total_frames = 0
        # get next region; nstamps > 0 guarantees a first onset exists
        pending = iter(timestamps)
        next_onset = int(next(pending))
        while True:
            vec, read = s()
            # number of samples of this hop already written to a sink
            written = 0
            # handle every onset falling in this hop, not just the first
            # one, so that a later onset is never left behind the read
            # position (which would give a negative slice length)
            while next_onset is not None and next_onset - total_frames <= read:
                cut = max(next_onset - total_frames, written)
                # write remaining samples from current region
                g(vec[written:cut], cut - written)
                # close this file
                del g
                # create a new file for the new region
                g = sink(new_sink_name(source_base_name,
                                       next_onset / float(samplerate)),
                         samplerate)
                written = cut
                following = next(pending, None)
                next_onset = None if following is None else int(following)
            # write what is left of this hop to the current region
            g(vec[written:read], read - written)
            total_frames += read
            if read < hopsize:
                break

        # print some info
        duration = float(total_frames) / float(samplerate)
        info = 'created %(nstamps)d slices from %(source_file)s' % locals()
        info += ' (total %(duration).2fs at %(samplerate)dHz)\n' % locals()
        sys.stderr.write(info)
Note: See TracBrowser for help on using the repository browser.