
Source Code for Module lib.fv200909opt

  1  #!/usr/bin/env python 
  2   
  3  """Feature vectors for optimized DTW alignment. 
  4  Exemplar project with Ladan Baghai-Ravary. 
  5  """ 
  6   
  7  import math 
  8  import numpy 
  9  from gmisclib import die 
 10  from gmisclib import erb_scale 
 11  # from gpk_voicing import percep_spec as PS 
 12  from gpk_voicing import cached_ps as PS 
 13  from gpk_voicing import fv_misc as M 
 14  from gpk_voicing import zero as Z 
 15  SillyWidthException = M.SillyWidthException 
 16   
 17  DB = 0.85 
 18   
 19  Opt_text="""# Trigger="run_to_bottom finished" 
 20  # Trigger match 
 21  # len(currentlist)= 198 tail= 0.0 nsamp= 198 
 22  # max(log_adv,,-fv200909opt_0.av) = 43.27 
 23  #  samples used = 198 filename= log_adv,,-fv200909opt_0.av 
 24  43.27 logp 
 25  # n= 44 
 26  1.73693 dist,alpha 
 27  2.13363 dist,beta 
 28  1.08861 len_exp 
 29  1.55219 lf,elf 
 30  0.154333 lf,lf 
 31  0.140556 nsv 
 32  3.53085 scale,fricative%Sedge:.*:13.0-18.8 
 33   2.8547 scale,fricative%Sedge:.*:18.8-23.0 
 34  3.30231 scale,fricative%Sedge:.*:2.5-13.0 
 35  -3.87654 scale,fricative%Sedge:.*:23.0-27.1 
 36  -0.0238129 scale,fricative%Sedge:.*:27.1-30.7 
 37  -2.76415 scale,haspitch1:.* 
 38  -3.13785 scale,peakalign1:.* 
 39  -2.65753 scale,vowel:.*:10.4 
 40  2.32077 scale,vowel:.*:11.3 
 41  -1.12553 scale,vowel:.*:12.1 
 42  0.0529135 scale,vowel:.*:13.0 
 43  -0.568936 scale,vowel:.*:13.8 
 44  0.622019 scale,vowel:.*:14.7 
 45  0.18557 scale,vowel:.*:15.5 
 46  1.24299 scale,vowel:.*:16.4 
 47  -3.96151 scale,vowel:.*:17.2 
 48  0.793534 scale,vowel:.*:18.1 
 49  0.0448047 scale,vowel:.*:18.9 
 50  1.33993 scale,vowel:.*:19.8 
 51  2.00955 scale,vowel:.*:20.6 
 52  -0.858686 scale,vowel:.*:21.5 
 53  3.48095 scale,vowel:.*:22.3 
 54  -3.47638 scale,vowel:.*:23.2 
 55  -0.966758 scale,vowel:.*:24.0 
 56  -1.98064 scale,vowel:.*:24.9 
 57  2.39958 scale,vowel:.*:25.7 
 58  0.406809 scale,vowel:.*:26.6 
 59  2.68029 scale,vowel:.*:27.4 
 60  -2.71892 scale,vowel:.*:28.3 
 61  0.715675 scale,vowel:.*:29.1 
 62   1.1363 scale,vowel:.*:30.0 
 63  -3.78759 scale,vowel:.*:4.5 
 64  1.14752 scale,vowel:.*:5.3 
 65  -0.108174 scale,vowel:.*:6.2 
 66  -1.18802 scale,vowel:.*:7.0 
 67  -0.0958434 scale,vowel:.*:7.9 
 68  0.643672 scale,vowel:.*:8.7 
 69  2.52746 scale,vowel:.*:9.6 
 70  """ 
 71  Scale = M.scale_xform(Opt_text, 
 72                          name="299010 optimization in /proj/exemplar/ItakuraSaitoDistance/IS-DTW/log_adv,,-fv200909opt_0.av" 
 73                          ) 
 74   
 75  def _irx(a): 
 76      return max(1, int(round(a))) 
 77   
 78   
 79  def feature_vec(data, dt, DT, 
 80                  LF=1.0, Nsv=M.NSV, ELF=1.0, 
 81                  do_voicing=1, do_dissonance=False, 
 82                  PlompBouman=False, do_pdur=False, 
 83                  zerosub=0.0, do_irx=True, cachename=None): 
 84      assert not do_pdur and not do_dissonance 
 85      FORMANT_LOW = erb_scale.f_to_erb(120.0) 
 86      FORMANT_HIGH = erb_scale.f_to_erb(6000.0) 
 87      assert float(DT)>0.0 
 88      assert float(LF)>0.0 
 89      bmin = erb_scale.f_to_erb(80.0) 
 90      bmax = erb_scale.f_to_erb(6000.0) 
 91      ectrs, neural, t0 = PS.perceptual_spec(data, dt, DT, 
 92                                             bmin, bmax, DB, 
 93                                             do_mod=do_voicing, 
 94                                             do_dissonance=do_dissonance, 
 95                                             do_peakalign=True, 
 96                                             PlompBouman=PlompBouman, 
 97                                             cachename=cachename 
 98                                             ) 
 99   
100      assert 1 < neural.shape[0] < 200 
101      band_indices = [i for (i,ec) in enumerate(ectrs) if ec['type']=='band'] 
102      neural_b = neural.take(band_indices, axis=0) 
103      assert neural_b.shape[1]==neural.shape[1] 
104      if zerosub != 0.0: 
105          neural_b = neural_b.copy() 
106          try: 
107              z = Z.PS(neural_b) 
108          except Z.ZeroProblem: 
109              die.warn("Bad utterance: zero does not converge.") 
110              z = numpy.zeros((neural_b.shape[0],)) 
111          assert neural_b.shape[0]==z.shape[0] 
112          numpy.subtract(neural_b, z[:,numpy.newaxis], neural_b) 
113          assert neural_b.shape[1]==neural.shape[1] 
114      assert neural_b.shape[0]<=neural.shape[0] 
115   
116      neural_now = numpy.average(neural_b, axis=0)    # Average over frequency. 
117      assert neural_now.shape[0] == neural.shape[1] 
118      neural_avg = numpy.sum(neural_now**2)/numpy.sum(neural_now)    # Average over time. 
119      # neural_avg is a scalar, grand average. 
120      numpy.divide(neural, neural_avg, neural) 
121      # Now, we've normalized by an over-all average loudness. 
122      numpy.divide(neural_now, neural_avg, neural_now) 
123      # Now, we've normalized by an over-all average loudness. 
124   
125      for (i,e) in enumerate(ectrs): 
126          if e['type'] == 'haspitch': 
127              numpy.divide(neural[i,:], neural_avg, neural[i,:]) 
128          if e['type'] == 'dissonance': 
129              numpy.divide(neural[i,:], neural_avg, neural[i,:]) 
130          if e['type'] == 'peakalign': 
131              numpy.divide(neural[i,:], neural_avg**2, neural[i,:]) 
132   
133      if do_irx: 
134          irx = _irx 
135      else: 
136          irx = lambda x: x 
137   
138   
139      o = [] 
140      descr = [] 
141      w = irx(0.04*LF/DT) 
142      tmpo, tmpd = M.vowel(w, ectrs, neural, neural_now, Nsv, 
143                           formant_low=FORMANT_LOW, 
144                           formant_high=FORMANT_HIGH 
145                           ) 
146      o.extend(tmpo) 
147      descr.extend(tmpd) 
148      assert len(descr)==len(o), "Descriptor mismatch" 
149   
150      w = irx(0.04*ELF/DT) 
151      tmpo, tmpd = M.fricative_edge(w, ectrs, neural, neural_now, Nsv, 
152                                    do_abs=False 
153                                    ) 
154      o.extend(tmpo) 
155      descr.extend(tmpd) 
156      assert len(descr)==len(o), "Descriptor mismatch" 
157   
158      if do_voicing: 
159          w = irx(0.02*math.sqrt(LF)/DT) 
160          tmpo, tmpd = M.haspitch(w, ectrs, neural, neural_now, Nsv) 
161          o.extend(tmpo) 
162          descr.extend(tmpd) 
163          assert len(descr)==len(o), "Descriptor mismatch" 
164   
165      w = irx(0.03*ELF/DT) 
166      tmpo, tmpd = M.peakiness(w, ectrs, neural, neural_now, Nsv) 
167      o.extend(tmpo) 
168      descr.extend(tmpd) 
169      assert len(descr)==len(o), "Descriptor mismatch" 
170   
171      N = neural[0].shape[0] 
172      for (i, (tmp, dsc)) in enumerate(zip(o, descr)): 
173          assert tmp.shape == (N,), "Wrong size: %d, %s = %d vs. %d" % (i, str(dsc), tmp.shape[0], N) 
174   
175      return (o, descr, DT, t0) 
176   
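
For orientation, the sketch below shows how feature_vec() might be called. It is not part of the module: the import path, the 16 kHz sampling rate, the 10 ms frame step, and the white-noise stand-in for real audio are all assumptions made for illustration. Only the argument order (data, dt, DT) and the (o, descr, DT, t0) return value are taken from the source above.

import numpy

# Import path is an assumption; it depends on how the package is installed
# (the page above names the module lib.fv200909opt).
from gpk_voicing import fv200909opt

FS = 16000.0                                           # assumed sampling rate, Hz
dt = 1.0 / FS                                          # input sample period, s
DT = 0.01                                              # assumed output frame period, s
signal = numpy.random.normal(0.0, 1.0, int(2 * FS))    # 2 s of noise as dummy audio

# o is a list of 1-D feature arrays, one per channel, all the same length;
# descr is the matching list of feature descriptors; t0 is the time of the
# first output frame.
o, descr, DT_out, t0 = fv200909opt.feature_vec(signal, dt, DT)
print(len(o), "feature channels,", o[0].shape[0], "frames, t0 =", t0)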