source: python/scripts/aubiocut @ ca45e58

Branches: feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5, pitchshift, sampler, timestretch, yinfft+
Last change on this file since ca45e58 was 1e1a2c9, checked in by Paul Brossier <piem@piem.org>, 11 years ago

python/scripts/aubiocut: make -i optional

  • Property mode set to 100755
File size: 8.1 KB
Rev | Line
[9582713]1#! /usr/bin/env python
2
3""" this file was written by Paul Brossier
4  it is released under the GNU/GPL license.
5"""
6
7import sys
8#from aubio.task import *
9
usage = "usage: %s [options] -i soundfile" % sys.argv[0]
usage += "\n help: %s -h" % sys.argv[0]


def parse_args():
    """Parse the command line of the script.

    The sound file to analyse is taken from -i/--input or, when that
    option is absent, from a single positional argument.

    Returns:
        A tuple (options, args): the optparse values object and the list
        of remaining positional arguments. options.source_file is always
        set when this function returns.

    Exits:
        With status 1, after writing a message and the usage string to
        stderr, when no file name can be determined (no -i option and
        not exactly one positional argument).
    """
    from optparse import OptionParser
    parser = OptionParser(usage=usage)
    parser.add_option("-i", "--input", action="store", dest="source_file",
            help="input sound file to analyse", metavar="<source_file>")
    # Help texts are built with adjacent string literals: a backslash
    # continuation inside a literal would embed the next line's
    # indentation in the text shown to the user.
    parser.add_option("-m", "--method",
            action="store", dest="onset_method", default='default',
            metavar="<onset_method>",
            help="onset detection method [default=default] "
                 "complexdomain|hfc|phase|specdiff|energy|kl|mkl")
    # cutting methods
    parser.add_option("-b", "--beat",
            action="store_true", dest="beat", default=False,
            help="use beat locations")
    # algorithm parameters
    parser.add_option("--samplerate",
            metavar="<freq>", type='int',
            action="store", dest="samplerate", default=0,
            help="samplerate at which the file should be represented")
    parser.add_option("-B", "--bufsize",
            action="store", dest="bufsize", default=512,
            metavar="<size>", type='int',
            help="buffer size [default=512]")
    parser.add_option("-H", "--hopsize",
            metavar="<size>", type='int',
            action="store", dest="hopsize", default=256,
            help="overlap size [default=256]")
    parser.add_option("-t", "--threshold",
            metavar="<value>", type="float",
            action="store", dest="threshold", default=0.3,
            help="onset peak picking threshold [default=0.3]")
    # The help used to recommend option -L, which this parser does not
    # define, so the recommendation was dropped.
    parser.add_option("-c", "--cut",
            action="store_true", dest="cut", default=False,
            help="cut input sound file at detected labels")
    # NOTE: the following options were present only as disabled code and
    # are not accepted: -S/--silencecut, -s/--silence, -D/--delay,
    # -C/--dcthreshold, -M/--mintol, -L/--localmin, -d/--derivate,
    # -z/--zerocross, and the plotting options -p, -x, -y, -f, -n, -O, -F.
    parser.add_option("-v", "--verbose",
            action="store_true", dest="verbose", default=True,
            help="make lots of noise [default]")
    parser.add_option("-q", "--quiet",
            action="store_false", dest="verbose", default=True,
            help="be quiet")
    (options, args) = parser.parse_args()
    if not options.source_file:
        if len(args) == 1:
            # -i is optional: accept the file as the only positional argument
            options.source_file = args[0]
        else:
            # Diagnostics go to stderr so that stdout only ever carries
            # the detected timestamps.
            sys.stderr.write("no file name given\n%s\n" % usage)
            sys.exit(1)
    return options, args
124
125if __name__ == '__main__':
126    options, args = parse_args()
127
128    hopsize = options.hopsize
129    bufsize = options.bufsize
130    samplerate = options.samplerate
131    source_file = options.source_file
132
[7fc5ba2]133    from aubio import onset, tempo, source, sink
[9582713]134
135    s = source(source_file, samplerate, hopsize)
136    if samplerate == 0: samplerate = s.get_samplerate()
137
[7fc5ba2]138    if options.beat:
139        o = tempo(options.onset_method, bufsize, hopsize)
140    else:
141        o = onset(options.onset_method, bufsize, hopsize)
[9582713]142    o.set_threshold(options.threshold)
143
144    timestamps = []
[dee4164]145    total_frames = 0
146    # analyze pass
[9582713]147    while True:
148        samples, read = s()
[dee4164]149        if o(samples):
[7fc5ba2]150            timestamps.append (o.get_last())
151            if options.verbose: print "%.4f" % o.get_last_s()
[dee4164]152        total_frames += read
[9582713]153        if read < hopsize: break
[7fc5ba2]154    del s
[9582713]155    # print some info
156    nstamps = len(timestamps)
[dee4164]157    duration = float (total_frames) / float(samplerate)
[9582713]158    info = 'found %(nstamps)d timestamps in %(source_file)s' % locals()
[dee4164]159    info += ' (total %(duration).2fs at %(samplerate)dHz)\n' % locals()
[9582713]160    sys.stderr.write(info)
[dee4164]161
162    # cutting pass
163    if options.cut and nstamps > 0:
164        # generate output filenames
165        import os
166        source_base_name, source_ext = os.path.splitext(os.path.basename(source_file))
167        def new_sink_name(source_base_name, timestamp):
168            return source_base_name + '_%02.3f' % (timestamp) + '.wav'
169        # reopen source file
170        s = source(source_file, samplerate, hopsize)
[7fc5ba2]171        if samplerate == 0: samplerate = s.get_samplerate()
[dee4164]172        # create first sink at 0
173        g = sink(new_sink_name(source_base_name, 0.), samplerate)
174        total_frames = 0
175        # get next region
176        next_onset = int(timestamps.pop(0))
177        while True:
178            vec, read = s()
179            remaining = next_onset - total_frames
180            if remaining <= read:
181                # write remaining samples from current region
182                g(vec[0:remaining], remaining)
183                # close this file
184                del g
185                # create a new file for the new region
186                g = sink(new_sink_name(source_base_name, next_onset / float(samplerate)), samplerate)
187                # write the remaining samples in the new file
188                g(vec[remaining:read], read - remaining)
189                #print "new slice", total_frames_written, "+", remaining, "=", start_of_next_region
190                if len(timestamps):
191                    next_onset = int(timestamps.pop(0))
192                else:
193                    next_onset = 1e120
194            else:
195                g(vec[0:read], read)
196            total_frames += read
197            if read < hopsize: break
198
199        # print some info
200        duration = float (total_frames) / float(samplerate)
201        info = 'created %(nstamps)d slices from %(source_file)s' % locals()
202        info += ' (total %(duration).2fs at %(samplerate)dHz)\n' % locals()
203        sys.stderr.write(info)
Note: See TracBrowser for help on using the repository browser.