notebook.community

Edit and run



In [40]:

    
import numpy as np
import pandas as pd
import sys

sys.path.append('../../tools/music-processing-experiments')

from time_intervals import block_labels



In [2]:

    
# Load the reference ("true") segment annotations from a tab-separated file.
true_segments_df = pd.read_csv('../../data/beatles/_inbox/segmentation/01_09_true_segments.tsv', sep='\t')



In [6]:

    
# Keep only the timing and label columns, in this order.
# The same name is rebound, so the full frame is no longer reachable afterwards.
true_segments_df = true_segments_df[['start', 'end', 'label']]



In [95]:

    
# Report the number of annotated segments, then preview the first rows.
# The preview has to be the last expression of the cell to be rendered;
# as a non-final bare expression its value was silently discarded.
print(len(true_segments_df))
true_segments_df.head()



In [12]:

    
# Total duration is taken as the end time of the last annotated row
# (presumably seconds; assumes the rows are in temporal order -- TODO confirm).
duration = true_segments_df['end'].iloc[-1]
duration









    Out[12]:





125.753469



In [31]:

    
def block_segments(duration, fs=44100.0, hop_size=2048):
    """
    Build a table of regularly spaced, back-to-back time blocks.

    Block starts are laid out every ``hop_size / fs`` from 0 up to (but not
    including) ``duration``. Each block is exactly one hop long, so a block
    ends where the next one starts; the last block may end after ``duration``.

    Parameters
    ----------
    duration : float
        Upper bound (exclusive) for the block start times.
    fs : float
        Sampling rate used to convert ``hop_size`` to a time step.
    hop_size : int
        Distance between consecutive block starts, in samples.

    Returns
    -------
    pandas.DataFrame
        Columns ``'start'`` and ``'end'``, one row per block.
    """
    hop_seconds = hop_size / fs
    starts = np.arange(0, duration, hop_seconds)
    blocks = pd.DataFrame({'start': starts}, columns=['start'])
    blocks['end'] = starts + hop_seconds
    return blocks

# Build the block grid for the annotated duration (default fs and hop size),
# then show its shape and the first five rows.
block_times = block_segments(duration)
print(block_times.shape)
print(block_times[:5])









    



(2708, 2)
     start      end
0  0.00000  0.04644
1  0.04644  0.09288
2  0.09288  0.13932
3  0.13932  0.18576
4  0.18576  0.23220



In [62]:

    
# Inputs for labelling the blocks.
# NOTE: `chords` is an alias of true_segments_df, not a copy -- any in-place
# change to `chords` (such as adding columns) also changes true_segments_df.
chords = true_segments_df
# NOTE(review): x_times and block_size are referenced only by commented-out
# lines in this cell, and label_cols by no visible code at all.
x_times = block_times['start']
block_size = 4096
hop_size = 2048
label_cols = ['label']

def time_to_samples(time, fs=44100.0):
    """
    Convert a time value to a sample position at sampling rate ``fs``.

    The product ``time * fs`` is rounded with ``np.round``; the result keeps
    its floating-point type (no cast to integer is performed here).
    """
    sample_position = time * fs
    return np.round(sample_position)

# Disabled sample-based variant (kept for reference): it expressed segment
# and block boundaries as sample positions before labelling.
# chords['start_sample'] = time_to_samples(chords['start'])
# chords['end_sample'] = time_to_samples(chords['end'])
# df_blocks = pd.DataFrame({'start': time_to_samples(x_times).astype(np.int64)})
# df_blocks['end'] = df_blocks['start'] + block_size
# Active variant: use the time-based blocks as they are (same object, no copy).
df_blocks = block_times

# df_labels = chords[['start_sample', 'end_sample', 'label']].copy()
# df_labels.rename(columns={'start_sample': 'start', 'end_sample': 'end'}, inplace=True)

# df_labelled_blocks = block_labels(df_blocks, df_labels)
# block_labels comes from the project's time_intervals module; presumably it
# attaches to each block the label of the matching segment -- verify there.
df_labelled_blocks = block_labels(df_blocks, chords)



In [63]:

    
# Display the labelled blocks; the recorded output is a truncated rendering
# of the 2708-row frame (df_labelled_blocks.head() would be a lighter preview).
df_labelled_blocks









    Out[63]:






  
    
      
      start
      end
      label
    
  
  
    
      0
      0.000000
      0.046440
      N
    
    
      1
      0.046440
      0.092880
      N
    
    
      2
      0.092880
      0.139320
      N
    
    
      3
      0.139320
      0.185760
      N
    
    
      4
      0.185760
      0.232200
      N
    
    
      5
      0.232200
      0.278639
      N
    
    
      6
      0.278639
      0.325079
      N
    
    
      7
      0.325079
      0.371519
      N
    
    
      8
      0.371519
      0.417959
      N
    
    
      9
      0.417959
      0.464399
      N
    
    
      10
      0.464399
      0.510839
      G
    
    
      11
      0.510839
      0.557279
      G
    
    
      12
      0.557279
      0.603719
      G
    
    
      13
      0.603719
      0.650159
      G
    
    
      14
      0.650159
      0.696599
      G
    
    
      15
      0.696599
      0.743039
      G
    
    
      16
      0.743039
      0.789478
      G
    
    
      17
      0.789478
      0.835918
      G
    
    
      18
      0.835918
      0.882358
      G
    
    
      19
      0.882358
      0.928798
      G
    
    
      20
      0.928798
      0.975238
      G
    
    
      21
      0.975238
      1.021678
      G
    
    
      22
      1.021678
      1.068118
      G
    
    
      23
      1.068118
      1.114558
      G
    
    
      24
      1.114558
      1.160998
      G
    
    
      25
      1.160998
      1.207438
      G
    
    
      26
      1.207438
      1.253878
      G
    
    
      27
      1.253878
      1.300317
      G
    
    
      28
      1.300317
      1.346757
      G
    
    
      29
      1.346757
      1.393197
      G
    
    
      ...
      ...
      ...
      ...
    
    
      2678
      124.366077
      124.412517
      N
    
    
      2679
      124.412517
      124.458957
      N
    
    
      2680
      124.458957
      124.505397
      N
    
    
      2681
      124.505397
      124.551837
      N
    
    
      2682
      124.551837
      124.598277
      N
    
    
      2683
      124.598277
      124.644717
      N
    
    
      2684
      124.644717
      124.691156
      N
    
    
      2685
      124.691156
      124.737596
      N
    
    
      2686
      124.737596
      124.784036
      N
    
    
      2687
      124.784036
      124.830476
      N
    
    
      2688
      124.830476
      124.876916
      N
    
    
      2689
      124.876916
      124.923356
      N
    
    
      2690
      124.923356
      124.969796
      N
    
    
      2691
      124.969796
      125.016236
      N
    
    
      2692
      125.016236
      125.062676
      N
    
    
      2693
      125.062676
      125.109116
      N
    
    
      2694
      125.109116
      125.155556
      N
    
    
      2695
      125.155556
      125.201995
      N
    
    
      2696
      125.201995
      125.248435
      N
    
    
      2697
      125.248435
      125.294875
      N
    
    
      2698
      125.294875
      125.341315
      N
    
    
      2699
      125.341315
      125.387755
      N
    
    
      2700
      125.387755
      125.434195
      N
    
    
      2701
      125.434195
      125.480635
      N
    
    
      2702
      125.480635
      125.527075
      N
    
    
      2703
      125.527075
      125.573515
      N
    
    
      2704
      125.573515
      125.619955
      N
    
    
      2705
      125.619955
      125.666395
      N
    
    
      2706
      125.666395
      125.712834
      N
    
    
      2707
      125.712834
      125.759274
      N
    
  

2708 rows × 3 columns



In [66]:

    
# Persist the labelled blocks as tab-separated text with floats written to
# six decimals; index=None is falsy, so no index column is emitted.
df_labelled_blocks.to_csv('../../data/beatles/_inbox/segmentation/01_09_ref_frames_4096_2048_timed_2.tsv',
                          sep='\t', index=None, float_format='%.6f')



In [52]:

    
# Sanity check: the labels computed here equal, row for row, the 'label'
# column of an existing reference frames file (True when all rows agree).
(pd.read_csv('../../data/beatles/_inbox/segmentation/01_09_ref_frames_4096_2048.tsv', sep='\t')['label'] == df_labelled_blocks['label']).all()









    Out[52]:





True



In [53]:

    
# Scratch calculation: a sample count divided by 44100.
# NOTE(review): 5548032 (= 2709 * 2048) is presumably the audio length in
# samples -- confirm its origin or replace it with a named value.
5548032/44100.









    Out[53]:





125.80571428571429



In [55]:

    
# Inspect the last annotated segment.
# NOTE(review): the recorded output lists start_sample/end_sample columns,
# which only exist if the now commented-out sample-conversion lines were run
# earlier in this kernel -- a fresh Restart & Run All will not show them.
true_segments_df.iloc[-1]









    Out[55]:





start           121.7597
end             125.7535
label                  N
start_sample     5369601
end_sample       5545728
Name: 77, dtype: object



In [97]:

    
# Work on a copy so the labelled blocks themselves stay untouched, then preview it.
df_frames = df_labelled_blocks.copy()
df_frames.head()



In [104]:

    
def frames_to_segments(df_frames, total_duration=None):
    """
    Collapse runs of consecutive frames that share a label into segments.

    Parameters
    ----------
    df_frames : pandas.DataFrame
        Frames with 'start', 'end' and 'label' columns. Rows are processed in
        their given order, so they are expected to be sorted by time.
    total_duration : float, optional
        End time assigned to the last segment. When None (the default), the
        'end' value of the last frame is used instead.

    Returns
    -------
    pandas.DataFrame
        A new frame (the input is not modified) with one row per segment:
        the first frame of each run, keeping its original index, with 'end'
        replaced by the start of the following segment. An empty input yields
        an empty copy of the input.
    """
    df = df_frames.copy()
    # Nothing to merge; this also avoids indexing the last row of an empty frame.
    if len(df) == 0:
        return df
    labels = df['label']
    # A segment starts wherever the label differs from the previous frame's
    # (the first frame is compared with the missing value shifted in).
    segment_start = labels != labels.shift(1)
    df_segments = df[segment_start].copy()
    # Compare with None explicitly so that a caller-supplied 0 is honoured
    # instead of being mistaken for "not given".
    if total_duration is None:
        end_time = df['end'].iloc[-1]
    else:
        end_time = total_duration
    # Each segment ends where the next one starts; the last one has no
    # successor and is closed with end_time.
    df_segments['end'] = df_segments['start'].shift(-1).fillna(end_time)
    return df_segments



In [109]:

    
# Rebuild segments from the labelled frames; the last segment is closed at the
# annotated duration instead of at the end of the last frame. Show the tail.
df_segments = frames_to_segments(df_frames, total_duration=duration)
df_segments.tail()



In [99]:

    
# Persist the reconstructed segments as tab-separated text with floats written
# to six decimals; index=None is falsy, so no index column is emitted.
df_segments.to_csv('../../data/beatles/_inbox/segmentation/01_09_reconstructed_segments.tsv',
                          sep='\t', index=None, float_format='%.6f')



In [128]:

    
# Read the label file line by line, removing newlines and tabs from each line.
# NOTE(review): read_label_file() in this notebook performs the same stripping;
# `file` also shadows the builtin of that name on Python 2.
with open('../../data/beatles/_inbox/outputs/yesterday_lstm_class.tsv') as file:
    yesterday_labels = [line.replace('\n', '').replace('\t', '') for line in file.readlines()]



In [144]:

    
# Module-level audio parameters; read_labels_as_df() reads both as globals.
fs = 44100.  # sampling rate (presumably Hz)
hop_size = 2048  # frame hop (presumably samples); an earlier cell assigns the same value

# no time, just 12 PCS labels
def read_label_file(file_name):
    """
    Read a text file into a list with one entry per line.

    Every newline and tab character is removed from each line, so
    tab-separated fields on a line are concatenated into a single string.
    """
    cleaned = []
    with open(file_name) as handle:
        for raw_line in handle:
            without_newline = raw_line.replace('\n', '')
            cleaned.append(without_newline.replace('\t', ''))
    return cleaned

def read_labels_as_df(file_name):
    """
    Load per-frame labels and attach a start/end time to every frame.

    Labels are read with read_label_file(). Frame ``i`` starts at
    ``i * hop_size / fs`` and lasts one hop, where ``hop_size`` and ``fs``
    are the module-level globals.

    Returns a DataFrame with columns 'start', 'end' and 'label'.
    """
    frame_labels = read_label_file(file_name)
    # One hop expressed as a time step; frames are laid out one hop apart.
    seconds_per_hop = hop_size / fs
    frame_starts = seconds_per_hop * np.arange(len(frame_labels))
    frame_ends = seconds_per_hop + frame_starts
    table = {'start': frame_starts, 'end': frame_ends, 'label': frame_labels}
    return pd.DataFrame(table, columns=['start', 'end', 'label'])

def save_tsv(df, file_name):
    """
    Write ``df`` to ``file_name`` as tab-separated text.

    Floats are formatted with six decimals. ``index`` is passed as None,
    which is falsy, so no index column is written.
    """
    csv_options = {'sep': '\t', 'index': None, 'float_format': '%.6f'}
    df.to_csv(file_name, **csv_options)



In [159]:

    
# Load the per-frame labels with computed frame times, then merge consecutive
# equal labels into segments (the last segment ends at the last frame's end).
# Note: this rebinds df_frames and df_segments used by earlier cells.
df_frames = read_labels_as_df('../../data/beatles/_inbox/outputs/yesterday_lstm_class.tsv')
df_segments = frames_to_segments(df_frames)



In [160]:

    
# Preview the first segments; the index is the number of each segment's first frame.
df_segments.head()









    Out[160]:






  
    
      
      start
      end
      label
    
  
  
    
      0
      0.000000
      1.857596
      100001000000
    
    
      40
      1.857596
      8.173424
      100001000100
    
    
      176
      8.173424
      8.219864
      000001000100
    
    
      177
      8.219864
      8.452063
      100001000100
    
    
      182
      8.452063
      8.498503
      000001000100



In [161]:

    
def explode_pitch_classes(df):
    """
    Replace the 'label' column with one column per pitch class.

    Each label is indexed character by character: character ``i`` goes to the
    ``i``-th of the columns C, Db, D, Eb, E, F, Gb, G, Ab, A, Bb, B. The
    characters are stored as single-character strings.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame with a 'label' column of strings holding at least 12 characters.

    Returns
    -------
    pandas.DataFrame
        A copy of ``df`` (the input is not modified) without 'label' and with
        the 12 pitch-class columns appended. Works for an empty frame too.
    """
    pcs_cols = ['C','Db','D','Eb','E','F','Gb','G','Ab','A','Bb','B']
    # Read the labels from the argument itself; the previous version read the
    # notebook-level df_segments, ignoring whatever frame was passed in.
    labels = list(df['label'])
    exploded = df.copy()
    del exploded['label']
    # Build each column directly from the labels so that an empty frame just
    # gets empty columns instead of failing on array indexing.
    for i, col in enumerate(pcs_cols):
        exploded[col] = [label[i] for label in labels]
    return exploded



In [164]:

    
# Preview the segments again.
# NOTE(review): execution count 164 comes after the cell below (163), so this was run on the exploded frame.
df_segments.head()



In [163]:

    
# Expand the labels into pitch-class columns and save the result as TSV.
# NOTE(review): this cell is not idempotent -- df_segments is rebound to a
# frame without 'label', so running the cell a second time fails when
# explode_pitch_classes reads df['label'].
df_segments = explode_pitch_classes(df_segments)
save_tsv(df_segments, '../../data/beatles/_inbox/outputs/yesterday_lstm_class_segments.tsv')



In [166]:

    
# Scratch calculation left in the notebook.
# NOTE(review): the meaning of 24, 1000 and 64 is not documented -- name the
# quantities or remove the cell.
24/(1000/64)









    Out[166]:





1.536



In [ ]:

	start	end	label
2474	114.892336	117.585850	D
2532	117.585850	118.050249	Bb
2542	118.050249	118.514649	C
2552	118.514649	121.719002	D
2621	121.719002	125.753469	N

	start	end	label
0	0.000000	0.046440	N
1	0.046440	0.092880	N
2	0.092880	0.139320	N
3	0.139320	0.185760	N
4	0.185760	0.232200	N
5	0.232200	0.278639	N
6	0.278639	0.325079	N
7	0.325079	0.371519	N
8	0.371519	0.417959	N
9	0.417959	0.464399	N
10	0.464399	0.510839	G
11	0.510839	0.557279	G
12	0.557279	0.603719	G
13	0.603719	0.650159	G
14	0.650159	0.696599	G
15	0.696599	0.743039	G
16	0.743039	0.789478	G
17	0.789478	0.835918	G
18	0.835918	0.882358	G
19	0.882358	0.928798	G
20	0.928798	0.975238	G
21	0.975238	1.021678	G
22	1.021678	1.068118	G
23	1.068118	1.114558	G
24	1.114558	1.160998	G
25	1.160998	1.207438	G
26	1.207438	1.253878	G
27	1.253878	1.300317	G
28	1.300317	1.346757	G
29	1.346757	1.393197	G
...	...	...	...
2678	124.366077	124.412517	N
2679	124.412517	124.458957	N
2680	124.458957	124.505397	N
2681	124.505397	124.551837	N
2682	124.551837	124.598277	N
2683	124.598277	124.644717	N
2684	124.644717	124.691156	N
2685	124.691156	124.737596	N
2686	124.737596	124.784036	N
2687	124.784036	124.830476	N
2688	124.830476	124.876916	N
2689	124.876916	124.923356	N
2690	124.923356	124.969796	N
2691	124.969796	125.016236	N
2692	125.016236	125.062676	N
2693	125.062676	125.109116	N
2694	125.109116	125.155556	N
2695	125.155556	125.201995	N
2696	125.201995	125.248435	N
2697	125.248435	125.294875	N
2698	125.294875	125.341315	N
2699	125.341315	125.387755	N
2700	125.387755	125.434195	N
2701	125.434195	125.480635	N
2702	125.480635	125.527075	N
2703	125.527075	125.573515	N
2704	125.573515	125.619955	N
2705	125.619955	125.666395	N
2706	125.666395	125.712834	N
2707	125.712834	125.759274	N

	start	end	label
0	0.00000	0.04644	N
1	0.04644	0.09288	N
2	0.09288	0.13932	N
3	0.13932	0.18576	N
4	0.18576	0.23220	N

	start	end	label
0	0.000000	1.857596	100001000000
40	1.857596	8.173424	100001000100
176	8.173424	8.219864	000001000100
177	8.219864	8.452063	100001000100
182	8.452063	8.498503	000001000100