123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162 |
- #!/usr/bin/env python
- # -*- coding: utf-8 -*-
- # Beat tracking example
- # Appunti: buono per un video u po' psichedelico ci va:
- # <lora:bb3l15:1> an abstract circuit board design with orange yellow green and purple squares over red background in the style of bb3l15
- # su modello colorful_v30 (https://civitai.com/images/3024879?modelVersionId=188803&prioritizedUserIds=913950&period=AllTime&sort=Most+Reactions&limit=20 )
- # <lora:Ink_scenery:1> black background, sketch jungle scenery, path, dense su sd 1.5
- # Wilson <lora:Ink_scenery:1> black background, sketch jungle setting
- import os
- import numpy as np
- import librosa
- import random
- import math
- from scipy.interpolate import interp1d
- import matplotlib.pyplot as plt
- def plotting_stuffs():
- plt.figure(figsize=(15, 17))
- t = librosa.frames_to_time(range(rms.size), hop_length=flength)
- ax = plt.subplot(3, 1, 1)
- librosa.display.waveshow(wave, alpha=0.5)
- plt.plot(t, rms[0], color="r")
- plt.plot(t, trms, color="b")
- plt.ylim((-1, 1))
- plt.title("Wave&Featurres")
- plt.show()
- x = np.linspace(0,1,100)
- y = sig(x)
- plt.plot(x, y)
- plt.show()
- plt.hist(rms[0], color = 'red', edgecolor = 'black', bins = 10)
- plt.show()
- plt.hist(cent[0], color = 'blue', edgecolor = 'black', bins = int(cent.max()/100))
- plt.show()
- plt.hist(zcr[0], color = 'green', edgecolor = 'black', bins = 10)
- plt.show()
- plt.figure(figsize=(150, 17))
- t = librosa.frames_to_time(range(zcr.size), hop_length=flength)
- ax = plt.subplot(3, 1, 1)
- plt.xticks(np.arange(0, 12103, step=1))
- plt.plot(t, zcr[0], color="r")
- plt.ylim((zcr.min(), zcr.max()))
- plt.title("ZCR")
- plt.show()
- def f(t):
- return 1.0025+0.002*np.sin(1.25*3.14*t/30)
- #return x ** 2
- def sig(x):
- return 1/(1 + np.exp(-12*(x-0.431)))
- def transformXYrandom(x):
- return random.random()*10*x-5;
- strength_min = 0.4
- strength_max = 0.73
- # Assuming that into "generated" directoruy U've already create "project_name" subfolder
- #audio_input_file = '/home/lalo/data/studio_suono/ardourprojects/space/export/star_r1_sessione_20240310_msub07.wav'
- audio_input_file = "/home/luca-conte/Musica/ardour_projects/end_titles/export/end_titles_draft_r1_sessione.wav"
- #audio_input_file = '/home/lalo/data/studio_grafica/deforum/wilson_r1_mm_sample2.wav'
- #audio_input_file = '/home/lalo/data/studio_suono/spx/231104_001_m01.wav'
- #audio_input_file = '/home/lalo/data/studio_grafica/deforum/eucrasy_r1_sample.wav'
- #audio_input_file = '/home/lalo/data/studio_grafica/deforum/eucrasy_r1.wav'
- #audio_input_file = '/home/lalo/data/studio_grafica/deforum/eucrasy_short_r1.wav'
- #audio_input_file = '/home/lalo/data/studio_suono/231014_002_mastered_r2_clip.WAV'
- #audio_input_file = 'C:/Users/LucaConte/Music/lc_music/wilson_r1_mm.wav'
- # Store the sampling rate as `sr`
- fps = 24
- flength = 22050//fps
- #audio frame size is 22050/30=735
- wave, sr = librosa.load(audio_input_file)
- rms = librosa.feature.rms(y=wave, frame_length=flength, hop_length=flength)
- zcr = librosa.feature.zero_crossing_rate(y=wave,frame_length=flength,hop_length=flength)
- #rms = librosa.feature.rms(y=wave, frame_length=735, hop_length=735)
- cent = librosa.feature.spectral_centroid(y=wave, sr=sr,n_fft=flength, hop_length=flength)
- duration = int(math.ceil(librosa.get_duration(y=wave, sr=sr)))
- frames = duration * fps
- print("RMS SIZE: " + str(len(rms[0])))
- print("Rms min/max: " + str(rms.min()) + "/" + str(rms.max()))
- print("CEN SIZE: " + str(len(cent[0])))
- print("Cent min/max: " + str(cent.min()) + "/" + str(cent.max()))
- print("TOTAL FRAMES: " + str(frames))
- print("Audio duration in secs: " + str(duration))
- #
- # sr.len /22050 = duration
- # rms.len * 30 = duration
- # rms[i] mi da la potenza media del frame iesimo
- trms= rms[0]
- m = interp1d([min(trms), max(trms)], [strength_min, strength_max])
- c = interp1d([cent.min(), cent.max()], [-0.5, 0.5])
- # Creating the sctipt file (the real unique aoutput of this script)
- try:
- print("")
- print("------RMS---------")
- print("")
- for frame in range(len(rms[0])):
- print(str(frame) + ":(" + str(trms[frame]) + "),", end="")
- print("")
- print("-------CENTROIDS--------")
- print("")
- for frame in range(cent.size):
- print(str(frame) + ":(" + str(cent[0][frame]) + "),", end="")
- print("")
- print("-----TRANSFORM----------")
- print("")
- for frame in range(cent.size):
- print(str(frame) + ":(" + str(transformXYrandom(1)) + "),", end="")
- print("")
- print("-----ZERO CROSSING RATE----------")
- print("")
- for frame in range(zcr.size):
- print(str(frame) + ":(" + str(zcr[0][frame]) + "),", end="")
- print("RMS SIZE: " + str(len(rms[0])))
- print("Rms min/max: " + str(rms.min()) + "/" + str(rms.max()))
- print("Rms mean: " + str(np.mean(rms[0])))
- print("CEN SIZE: " + str(len(cent[0])))
- print("Cent min/max: " + str(cent.min()) + "/" + str(cent.max()))
- print("TOTAL FRAMES: " + str(frames))
- print("Audio duration in secs: " + str(duration))
- except:
- print(exception)
- plotting_stuffs()
|