source: python/scripts/aubiocut @ e97d0b3

feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5, pitchshift, sampler, timestretch, yinfft+
Last change on this file since e97d0b3 was 7fc5ba2, checked in by Paul Brossier <piem@piem.org>, 11 years ago

python/scripts/aubiocut: add -b option

  • Property mode set to 100755
File size: 8.0 KB
Line 
1#! /usr/bin/env python
2
3""" this file was written by Paul Brossier
4  it is released under the GNU/GPL license.
5"""
6
7import sys
8#from aubio.task import *
9
# Two-line usage banner: handed to optparse and printed when no input file
# is given. Both lines embed the name the script was invoked with.
usage = (
    "usage: %s [options] -i soundfile"
    "\n help: %s -h"
) % (sys.argv[0], sys.argv[0])
12
def parse_args():
    """Parse the command line of the script.

    Reads ``sys.argv`` through ``optparse`` and uses the module-level
    ``usage`` string as the parser's usage banner.

    Returns:
        An ``(options, args)`` tuple as produced by
        ``OptionParser.parse_args()``.

    Exits:
        With status 1, after writing a message and the usage banner to
        stderr, when no input file was given with ``-i``/``--input``.
    """
    from optparse import OptionParser
    parser = OptionParser(usage=usage)
    parser.add_option("-i", "--input", action="store", dest="source_file",
            help="input sound file to analyse", metavar="<source_file>")
    # Help strings are built with implicit concatenation: a backslash
    # continuation inside the literal would embed the indentation of the
    # following source line into the help text.
    parser.add_option("-m", "--method",
            action="store", dest="onset_method", default='default',
            metavar="<onset_method>",
            help="onset detection method [default=default] "
                 "complexdomain|hfc|phase|specdiff|energy|kl|mkl")
    # cutting methods
    parser.add_option("-b", "--beat",
            action="store_true", dest="beat", default=False,
            help="use beat locations")
    # Disabled options, kept for reference:
    # parser.add_option("-S","--silencecut",
    #         action="store_true", dest="silencecut", default=False,
    #         help="use silence locations")
    # parser.add_option("-s","--silence",
    #         metavar = "<value>",
    #         action="store", dest="silence", default=-70,
    #         help="silence threshold [default=-70]")
    # algorithm parameters
    parser.add_option("--samplerate",
            metavar="<freq>", type='int',
            action="store", dest="samplerate", default=0,
            help="samplerate at which the file should be represented")
    parser.add_option("-B", "--bufsize",
            action="store", dest="bufsize", default=512,
            metavar="<size>", type='int',
            help="buffer size [default=512]")
    parser.add_option("-H", "--hopsize",
            metavar="<size>", type='int',
            action="store", dest="hopsize", default=256,
            help="overlap size [default=256]")
    parser.add_option("-t", "--threshold",
            metavar="<value>", type="float",
            action="store", dest="threshold", default=0.3,
            help="onset peak picking threshold [default=0.3]")
    parser.add_option("-c", "--cut",
            action="store_true", dest="cut", default=False,
            help="cut input sound file at detected labels "
                 "best used with option -L")
    # Disabled options, kept for reference:
    # parser.add_option("-D","--delay",
    #         action = "store", dest = "delay", type = "float",
    #         metavar = "<seconds>", default=0,
    #         help="number of seconds to take back [default=system]\
    #                 default system delay is 3*hopsize/samplerate")
    # parser.add_option("-C","--dcthreshold",
    #         metavar = "<value>",
    #         action="store", dest="dcthreshold", default=1.,
    #         help="onset peak picking DC component [default=1.]")
    # parser.add_option("-M","--mintol",
    #         metavar = "<value>",
    #         action="store", dest="mintol", default=0.048,
    #         help="minimum inter onset interval [default=0.048]")
    # parser.add_option("-L","--localmin",
    #         action="store_true", dest="localmin", default=False,
    #         help="use local minima after peak detection")
    # parser.add_option("-d","--derivate",
    #         action="store_true", dest="derivate", default=False,
    #         help="derivate onset detection function")
    # parser.add_option("-z","--zerocross",
    #         metavar = "<value>",
    #         action="store", dest="zerothres", default=0.008,
    #         help="zero-crossing threshold for slicing [default=0.00008]")
    # plotting functions
    # Disabled options, kept for reference:
    # parser.add_option("-p","--plot",
    #         action="store_true", dest="plot", default=False,
    #         help="draw plot")
    # parser.add_option("-x","--xsize",
    #         metavar = "<size>",
    #         action="store", dest="xsize", default=1.,
    #         type='float', help="define xsize for plot")
    # parser.add_option("-y","--ysize",
    #         metavar = "<size>",
    #         action="store", dest="ysize", default=1.,
    #         type='float', help="define ysize for plot")
    # parser.add_option("-f","--function",
    #         action="store_true", dest="func", default=False,
    #         help="print detection function")
    # parser.add_option("-n","--no-onsets",
    #         action="store_true", dest="nplot", default=False,
    #         help="do not plot detected onsets")
    # parser.add_option("-O","--outplot",
    #         metavar = "<output_image>",
    #         action="store", dest="outplot", default=None,
    #         help="save plot to output.{ps,png}")
    # parser.add_option("-F","--spectrogram",
    #         action="store_true", dest="spectro", default=False,
    #         help="add spectrogram to the plot")
    # -v and -q share the same destination; verbose output is the default
    parser.add_option("-v", "--verbose",
            action="store_true", dest="verbose", default=True,
            help="make lots of noise [default]")
    parser.add_option("-q", "--quiet",
            action="store_false", dest="verbose", default=True,
            help="be quiet")
    (options, args) = parser.parse_args()
    if not options.source_file:
        # written with sys.stderr.write so it runs on Python 2 and 3 alike,
        # and so the error does not mix with timestamps printed on stdout
        sys.stderr.write("no file name given\n" + usage + "\n")
        sys.exit(1)
    return options, args
120
if __name__ == '__main__':
    # Script entry point: run an analysis pass that collects onset (or beat,
    # with -b) timestamps from the input file, report them, and, with -c,
    # run a second pass that writes one .wav slice per detected region.
    options, args = parse_args()

    hopsize = options.hopsize
    bufsize = options.bufsize
    samplerate = options.samplerate
    source_file = options.source_file

    # imported after argument parsing
    from aubio import onset, tempo, source, sink

    s = source(source_file, samplerate, hopsize)
    # a samplerate of 0 means "use whatever the source reports"
    if samplerate == 0:
        samplerate = s.get_samplerate()

    if options.beat:
        o = tempo(options.onset_method, bufsize, hopsize)
    else:
        o = onset(options.onset_method, bufsize, hopsize)
    o.set_threshold(options.threshold)

    timestamps = []
    total_frames = 0
    # analyze pass
    while True:
        samples, read = s()
        if o(samples):
            timestamps.append(o.get_last())
            if options.verbose:
                # single-argument call form prints the same on Python 2 and 3
                print("%.4f" % o.get_last_s())
        total_frames += read
        # a short read marks the end of the file
        if read < hopsize:
            break
    del s
    # print some info
    nstamps = len(timestamps)
    duration = float(total_frames) / float(samplerate)
    info = 'found %d timestamps in %s' % (nstamps, source_file)
    info += ' (total %.2fs at %dHz)\n' % (duration, samplerate)
    sys.stderr.write(info)

    # cutting pass
    if options.cut and nstamps > 0:
        # generate output filenames
        import os
        source_base_name, source_ext = os.path.splitext(os.path.basename(source_file))

        def new_sink_name(source_base_name, timestamp):
            """Return the slice file name for a region starting at `timestamp` seconds."""
            return source_base_name + '_%02.3f' % (timestamp) + '.wav'

        # reopen source file; samplerate was already resolved by the first pass
        s = source(source_file, samplerate, hopsize)
        # create first sink at 0
        g = sink(new_sink_name(source_base_name, 0.), samplerate)
        # count the sinks actually opened so the summary reports real slices
        nslices = 1
        total_frames = 0
        # get next region; None once every timestamp has been consumed
        pending = iter(timestamps)
        next_onset = int(next(pending))
        while True:
            vec, read = s()
            if next_onset is not None and next_onset - total_frames <= read:
                # A timestamp located before the start of this hop would give
                # a negative length; clamp so the new slice starts at the
                # beginning of the current hop instead.
                remaining = max(0, next_onset - total_frames)
                # write remaining samples from current region
                g(vec[0:remaining], remaining)
                # close this file
                del g
                # create a new file for the new region
                g = sink(new_sink_name(source_base_name, next_onset / float(samplerate)), samplerate)
                nslices += 1
                # write the remaining samples in the new file
                g(vec[remaining:read], read - remaining)
                stamp = next(pending, None)
                next_onset = None if stamp is None else int(stamp)
            else:
                g(vec[0:read], read)
            total_frames += read
            if read < hopsize:
                break
        # release the last slice and the source, as done for the other sinks
        del g
        del s

        # print some info
        duration = float(total_frames) / float(samplerate)
        info = 'created %d slices from %s' % (nslices, source_file)
        info += ' (total %.2fs at %dHz)\n' % (duration, samplerate)
        sys.stderr.write(info)
Note: See TracBrowser for help on using the repository browser.