@@ -42,7 +42,7 @@ def load_audio(file, sr, **kwargs):
4242 except Exception as e :
4343 raise RuntimeError (f"Failed to load audio: { e } " )
4444
45- return np .frombuffer (out , np .float32 ).flatten (), sr
45+ return remix_audio (( np .frombuffer (out , np .float32 ).flatten (), sr ), ** kwargs )
4646
4747def remix_audio (input_audio ,target_sr = None ,norm = False ,to_int16 = False ,resample = False ,axis = 0 ,** kwargs ):
4848 audio = np .array (input_audio [0 ],dtype = "float32" )
@@ -65,10 +65,10 @@ def remix_audio(input_audio,target_sr=None,norm=False,to_int16=False,resample=Fa
6565
6666def load_input_audio (fname ,sr = None ,** kwargs ):
6767 if sr is None : sr = 44100
68- sound = load_audio (fname , sr , ** kwargs )
68+ audio , sr = load_audio (fname , sr , ** kwargs )
6969 # sound = librosa.load(fname,sr=sr,**kwargs)
70- print (f"loading sound { fname } { sound [ 0 ]. shape } { sound [ 1 ] } { sound [ 0 ]. dtype } " )
71- return sound
70+ print (f"loading sound { fname = } { audio . ndim = } { audio . max () = } { audio . min () = } { audio . dtype = } { sr = } " )
71+ return audio , sr
7272
7373def save_input_audio (fname ,input_audio ,sr = None ,to_int16 = False ,to_stereo = False ):
7474 print (f"saving sound to { fname } " )
0 commit comments