In [1]:
%matplotlib inline
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from joblib import Parallel, delayed
import re
DATA_PATH = 'merged.pickle'
SUBSYSTEM_LABELS_PATH = 'Quality2010'
The input file contains preselected features from the CMS 2010B open data. The features were generated from the original ROOT files in the following way:
As a result, each lumisection is described by percentiles, means and standard deviations of the distributions of physical features of particles, computed for particular quantiles within a particular channel within a particular stream.
Some additional features were added, such as the total momentum of all particles of a particular channel within an event.
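A minimal sketch of what this kind of aggregation could look like, assuming a hypothetical per-particle table (the column names pt, pt_q25 etc. below are illustrative only, not the actual names in merged.pickle):
import numpy as np
import pandas as pd

### hypothetical per-particle table: one row per particle, tagged by lumisection
particles = pd.DataFrame({
    '_run': [146511] * 6,
    '_luminosityBlock': [1, 1, 1, 2, 2, 2],
    'pt': [0.5, 1.2, 3.4, 0.7, 2.1, 5.0],
})

### summarize the distribution of pt within each lumisection
### by percentiles, mean and std, as described above
stats = particles.groupby(['_run', '_luminosityBlock'])['pt'].apply(
    lambda x: pd.Series({
        'pt_q25': np.percentile(x, 25),
        'pt_q50': np.percentile(x, 50),
        'pt_q75': np.percentile(x, 75),
        'pt_mean': np.mean(x),
        'pt_std': np.std(x),
    })
).unstack()
print(stats)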
In [2]:
import cPickle as pickle
with open(DATA_PATH, 'rb') as f:
    data = pickle.load(f)
labels = np.load('labels.npy')
In [3]:
def load_subsystem_labels(data_dir, name_pattern=r'Cert_13TeV_2010_([a-zA-Z0-9]+)[.]txt'):
    import os
    import re
    import json

    pattern = re.compile(name_pattern)
    labels = dict()

    for p in os.listdir(data_dir):
        name = pattern.findall(p)[0]
        with open(os.path.join(data_dir, p)) as f:
            data = json.load(f)

        ### expand each [first, last] lumisection range into (run, lumisection) pairs
        good_data = set()
        for run in data:
            for a, b in data[run]:
                a = int(a)
                b = int(b)
                for lb in range(a, b + 1):
                    good_data.add((int(run), lb))

        labels[name] = good_data

    return labels
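Each certification file is expected to follow the usual CMS "golden JSON" layout that the function above parses: a mapping from run number (as a string) to a list of inclusive [first, last] lumisection ranges. A small hypothetical example of the same expansion logic:
import json

### hypothetical content of one Cert_13TeV_2010_<subsystem>.txt file
example = '{"146511": [[1, 10], [15, 20]], "146514": [[1, 5]]}'
cert = json.loads(example)

### the same expansion as in load_subsystem_labels
good = set()
for run, ranges in cert.items():
    for a, b in ranges:
        good.update((int(run), lb) for lb in range(int(a), int(b) + 1))

print(len(good))   ### 10 + 6 + 5 = 21 good (run, lumisection) pairs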
In [4]:
subsystem_labels_dict = load_subsystem_labels(SUBSYSTEM_LABELS_PATH)
In [5]:
subsystems = subsystem_labels_dict.keys()
In [6]:
subsystem_labels = np.zeros(shape=(len(data), len(subsystem_labels_dict)), dtype='float32')
indx = data[['_run', '_luminosityBlock']]

for i, sub_name in enumerate(subsystems):
    good_set = subsystem_labels_dict[sub_name]
    for j in xrange(len(data)):
        run, lumiblock = indx.iloc[j]
        subsystem_labels[j, i] = 1.0 if ((run, lumiblock) in good_set) else 0.0
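The per-row .iloc lookup above is correct but slow on large tables; here is a sketch of an equivalent construction that materializes the (run, lumisection) pairs once (it assumes the same indx, subsystems and subsystem_labels_dict defined above):
pairs = list(zip(indx['_run'].astype(int), indx['_luminosityBlock'].astype(int)))
subsystem_labels_fast = np.array(
    [[1.0 if pair in subsystem_labels_dict[sub] else 0.0 for sub in subsystems]
     for pair in pairs],
    dtype='float32'
)
assert np.allclose(subsystem_labels_fast, subsystem_labels)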
In [7]:
subsystem_labels
Out[7]:
In [8]:
### agreement between the AND of per-subsystem flags and the global label
np.mean(np.min(subsystem_labels, axis=1) == labels)
Out[8]:
In [9]:
for i in xrange(subsystem_labels.shape[1]):
    print "%s: %.3f" % (subsystems[i], np.mean(subsystem_labels[:, i] == labels))
In [10]:
for i in xrange(subsystem_labels.shape[1]):
    s = subsystem_labels[:, i]
    print "%s: %.3f" % (subsystems[i], np.mean(labels[s == 0.0]))
In [11]:
lumi = np.maximum(
    np.maximum(data['_instantLumi_minibias'].get_values(), data['_instantLumi_muons'].get_values()),
    data['_instantLumi_photons'].get_values()
)
In [12]:
### technical columns
not_features = [
'_luminosityBlock',
'_run',
'_instantLumi_minibias',
'_instantLumi_muons',
'_instantLumi_photons'
]
### columns that correspond to actual features
features = sorted(set(data.columns) - set(not_features))
In [13]:
np.sum(np.isnan(data.values))
Out[13]:
In [14]:
for f in features + ['_instantLumi_minibias', '_instantLumi_muons', '_instantLumi_photons']:
    xs = data[f].values
    if np.std(xs) > 0.0:
        data[f] = (xs - np.mean(xs)) / np.std(xs)
In [15]:
np.sum(np.isnan(data.values))
Out[15]:
In [16]:
nonempty = np.where(lumi > 0.0)[0]
data = data.iloc[nonempty]
labels = labels[nonempty]
lumi = lumi[nonempty]
subsystem_labels = subsystem_labels[nonempty]
In [17]:
_ = plt.hist(lumi, bins=25)
In [18]:
data
Out[18]:
In [19]:
### utility functions
def insert(keys, d, f):
    key = keys[0]
    if len(keys) == 1:
        d[key] = f
    else:
        if key not in d:
            d[key] = dict()
        return insert(keys[1:], d[key], f)

def levels(features, n_levels=5):
    dicts = [features]
    levels = list()
    for level in range(n_levels):
        levels.append(
            set([ k for d in dicts for k in d ])
        )
        dicts = [ d[k] for d in dicts for k in d ]
    return levels

def get_feature_groups(feature_list, re_exp):
    """
    Returns:
    1. hierarchical dictionary: feature groups -> feature full name
    2. feature levels
    3. unprocessed features
    """
    features = dict()
    rest = list()
    n_levels = set()

    for f in feature_list:
        matches = re.findall(re_exp, f)
        if len(matches) == 1:
            insert(matches[0], features, f)
            n_levels.add(len(matches[0]))
        elif len(matches) == 0:
            rest.append(f)
        else:
            raise Exception('Very suspicious feature: %s -> %s' % (f, matches))

    assert len(n_levels) == 1
    return features, levels(features, n_levels=list(n_levels)[0]), rest
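To make the bookkeeping above concrete, here is a tiny illustration of how get_feature_groups arranges matching names into a nested dictionary (the feature names below are hypothetical):
toy_features = ['muons_muons_pt__q1_p25', 'muons_muons_pt__q1_p50']
toy_re = r'([a-zA-Z]+)[_]([a-zA-Z]+)[_]([a-zA-Z]+)[_]+(q[12345])[_](\w+)'
toy_tree, toy_levels, toy_rest = get_feature_groups(toy_features, toy_re)

### toy_tree['muons']['muons']['pt']['q1']['p25'] == 'muons_muons_pt__q1_p25'
### toy_levels == [{'muons'}, {'muons'}, {'pt'}, {'q1'}, {'p25', 'p50'}]
### toy_rest == []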
In [20]:
def insert_fake_path(d, level, path='general'):
    if level == 0:
        return { path : d }
    else:
        r = dict()
        for k in d:
            r[k] = insert_fake_path(d[k], level - 1, path)
        return r
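Illustration of insert_fake_path: it injects an artificial level into a feature hierarchy so that trees of different depths can later be merged (the names below are hypothetical):
toy = {'minibias': {'PF': {'Pt': 'minibias_PF__Pt'}}}
print(insert_fake_path(toy, level=2, path='allParticles'))
### -> {'minibias': {'PF': {'allParticles': {'Pt': 'minibias_PF__Pt'}}}}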
In [21]:
particle_f_re = re.compile(r'([a-zA-Z]+)[_]([a-zA-Z]+)[_]([a-zA-Z]+)[_]+(q[12345])[_](\w+)')
particle_features, particle_levels, rest = get_feature_groups(features, particle_f_re)
In [22]:
for level in particle_levels:
    print ' '.join(list(level))
In [23]:
particle_type_f_re = re.compile(r'([a-zA-Z]+)[_]([a-zA-Z]+)[_]([a-zA-Z]+)[_]+([a-zA-Z0-9]+)')
particle_type_features, particle_type_levels, rest = get_feature_groups(rest, particle_type_f_re)
In [24]:
for level in particle_type_levels:
    print ' '.join(list(level))
In [25]:
particle_type_features = insert_fake_path(particle_type_features, level=2, path='allParticles')

for level in levels(particle_type_features, n_levels=5):
    print ' '.join(list(level))
The features above are the components of the momentum of particles of a particular type (channel) within an event.
In [26]:
event_f_re = re.compile(r'([a-zA-Z]+)[_]([a-zA-Z]+)[_]+(\w+)')
event_features, event_levels, rest = get_feature_groups(rest, event_f_re)
In [27]:
for level in event_levels:
    print ' '.join(list(level))
In [28]:
f = insert_fake_path(event_features, level=1, path='allChannels')
f = insert_fake_path(f, level=2, path='allParticles')
event_features = f

for level in levels(event_features, n_levels=5):
    print ' '.join(list(level))
These are the instantaneous luminosities for each event.
In [29]:
rest
Out[29]:
In [30]:
stream_f_re = re.compile(r'([a-zA-Z]+)[_]([a-zA-Z]+)')
stream_features, stream_levels, rest = get_feature_groups(rest, stream_f_re)
In [31]:
for level in stream_levels:
    print ' '.join(list(level))
Number of events and fraction of non-zero features per lumisection (all NAs are replaced with zeros).
In [32]:
rest
Out[32]:
In [33]:
from collections import defaultdict
def flatten(a_dict):
    for k in a_dict:
        if hasattr(a_dict[k], 'keys'):
            for path, value in flatten(a_dict[k]):
                yield (k, ) + path, value
        else:
            yield (k, ), a_dict[k]

def merge(dicts):
    result = dict()
    for d in dicts:
        for path, value in flatten(d):
            insert(path, result, value)
    return result

def flatten_dict(d):
    r = dict()
    for paths, v in flatten(d):
        k = '_'.join(paths)
        r[k] = v
    return r

def squeeze(d, depth=5, last=2):
    dc = d.copy()
    if depth - 1 == last:
        for k in d:
            dc[k] = flatten_dict(d[k])
        return dc
    else:
        for k in d:
            dc[k] = squeeze(d[k], depth - 1, last)
        return dc

def group(d, level=2):
    gd = defaultdict(lambda: list())
    for path, k in flatten(d):
        gk = path[:level]
        gd[gk].append(k)
    return gd
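A small, self-contained illustration of flatten and group on a toy hierarchy (names hypothetical):
toy = {'muons': {'muons': {'pt': {'q1': {'p25': 'muons_muons_pt__q1_p25'}}}}}

print(list(flatten(toy)))
### -> [(('muons', 'muons', 'pt', 'q1', 'p25'), 'muons_muons_pt__q1_p25')]

print(dict(group(toy, level=2)))
### -> {('muons', 'muons'): ['muons_muons_pt__q1_p25']}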
In [34]:
feature_hierarchy = merge([
particle_features, particle_type_features, event_features
])
In [35]:
grouped = group(feature_hierarchy, level=2)
In [36]:
len(grouped)
Out[36]:
In [37]:
[ (g, len(fs)) for g, fs in grouped.items() ]
Out[37]:
In [38]:
channels = set([ k[1] for k in grouped ]) - set(['allChannels'])
print channels
In [39]:
for stream, channel in grouped.keys():
    if channel not in channels:
        for c in channels:
            grouped[(stream, c)].extend(grouped[(stream, channel)])
        del grouped[(stream, channel)]
In [40]:
[ (g, len(fs)) for g, fs in grouped.items() ]
Out[40]:
In [41]:
%env THEANO_FLAGS=device=gpu0,floatX=float32
import theano
import theano.tensor as T
from lasagne import *
import crayimage
from crayimage.nn import Expression
In [42]:
class AE(Expression):
    def __init__(self, n_input_features, nums_units=(50, 10)):
        X_batch = T.fmatrix('X')

        self.input = layers.InputLayer(shape=(None, n_input_features), input_var=X_batch)
        ### note: the dropout layer is constructed but not inserted into the chain below
        self.drop = layers.DropoutLayer(self.input, p=0.1)

        net = self.input

        ### encoder
        for n in nums_units:
            net = layers.DenseLayer(net, num_units=n, nonlinearity=nonlinearities.sigmoid)

        code = layers.get_output(net, deterministic=True)
        self.code_layer = net

        ### decoder (mirrors the encoder, linear output layer)
        for n in nums_units[:-1][::-1]:
            net = layers.DenseLayer(net, num_units=n, nonlinearity=nonlinearities.sigmoid)

        net = layers.DenseLayer(net, num_units=n_input_features, nonlinearity=nonlinearities.linear)
        self.net = net

        X_reconstructed = layers.get_output(net)
        X_reconstructed_det = layers.get_output(net, deterministic=True)
        self.X_reconstructed = X_reconstructed

        super(AE, self).__init__(self.input, self.net)

        weights = T.fvector('weights')

        reconstruction_error = T.sum((X_reconstructed - X_batch) ** 2, axis=1)
        reconstruction_error_det = T.sum((X_reconstructed_det - X_batch) ** 2, axis=1)

        ### luminosity-weighted MSE plus l2 regularization
        mse_loss = T.sum(weights * reconstruction_error) / T.sum(weights)
        reg = regularization.regularize_network_params(net, regularization.l2)
        reg_C = T.fscalar('reg_c')
        loss = mse_loss + reg_C * reg

        learning_rate = T.fscalar('learning rate')
        params = layers.get_all_params(net)
        upd = updates.adadelta(loss, params, learning_rate=learning_rate)

        self.train = theano.function([X_batch, weights, reg_C, learning_rate], mse_loss, updates=upd)
        self.get_error = theano.function([X_batch], reconstruction_error_det)
        self.encode = theano.function([X_batch], code)

        given_code = T.fmatrix('given code')
        X_decoded = layers.get_output(net, inputs={self.code_layer : given_code})
        self.decode = theano.function([given_code], X_decoded)

    @staticmethod
    def batch_stream(X, weights, batch_size=32):
        indx = np.random.permutation(X.shape[0])
        n_batches = X.shape[0] // batch_size

        for i in xrange(n_batches):
            batch_indx = indx[(i * batch_size):(i * batch_size + batch_size)]
            yield X[batch_indx], weights[batch_indx]

    def fit(self, X, weights, n_epoches=1, batch_size=32, learning_rate=1.0, regularization_c=1.0e-3):
        n_batches = X.shape[0] // batch_size
        learning_rate = np.float32(learning_rate)
        regularization_c = np.float32(regularization_c)

        losses = np.zeros(shape=(n_epoches, n_batches), dtype='float32')

        for epoch in xrange(n_epoches):
            batch_stream = self.batch_stream(X, weights, batch_size)
            for i, (X_batch, w_batch) in enumerate(batch_stream):
                assert np.sum(w_batch) > 0.0
                losses[epoch, i] = self.train(X_batch, w_batch, regularization_c, learning_rate)

            yield losses[:(epoch + 1)]
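A quick smoke test of the class on synthetic data (purely illustrative: dimensions and hyperparameters are arbitrary, and it assumes the same theano / lasagne / crayimage environment as above):
X_toy = np.random.normal(size=(256, 10)).astype('float32')
w_toy = np.ones(256, dtype='float32')

ae_toy = AE(n_input_features=10, nums_units=(8, 3))
for losses in ae_toy.fit(X_toy, w_toy, n_epoches=2, batch_size=32):
    pass

print(ae_toy.get_error(X_toy).shape)              ### (256,) per-sample reconstruction error
print(ae_toy.encode(X_toy).shape)                 ### (256, 3) bottleneck code
print(ae_toy.decode(ae_toy.encode(X_toy)).shape)  ### (256, 10) reconstruction from a given code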
In [43]:
def plot_hist(xs, ws, n_bins=50,
              labels=tuple(), colors=('green', 'red', 'blue'),
              title='', xlabel='', legend_loc='upper right',
              vline=None):
    plt.figure(figsize=(12, 8))

    ws = [ w / np.sum(w) for w in ws ]

    hs, _, _ = plt.hist(
        xs, bins=n_bins, weights=ws, histtype='step', label=labels, color=colors[:len(xs)]
    )

    plt.title(title, fontsize=24)
    plt.xlabel(xlabel, fontsize=20)

    if vline is not None:
        plt.plot([vline, vline], [0.0, np.max([np.max(h) for h in hs])], '--', label='well reconstruction cut')

    plt.legend(loc=legend_loc)
    plt.show()
In [44]:
from sklearn.svm import OneClassSVM
In [45]:
for g in [('muons', 'muons'), ('photons', 'photons'), ('minibias', 'PF'), ('minibias', 'calo')]:
    if len(g) < 1:
        continue

    X = data[grouped[g]].get_values().astype('float32')
    X_good = X[labels == 1.0]
    X_bad = X[labels == 0.0]
    weights_good = lumi[labels == 1.0].astype('float32')
    weights_bad = lumi[labels == 0.0].astype('float32')

    ae = AE(X.shape[1], nums_units=(150, 20))

    for l in ae.fit(X_good, weights_good, n_epoches=128,
                    batch_size=128, learning_rate=1.0,
                    regularization_c=1.0e-4):
        #print np.mean(l)
        pass

    ### luminosity-weighted error of the constant (weighted-mean) predictor, used as a baseline
    X_mean = np.sum(weights_good[:, None] * X_good, axis=0) / np.sum(weights_good)
    mean_error = np.sum(np.sum((X_good - X_mean) ** 2, axis=1) * weights_good) / np.sum(weights_good)
    AE_error = np.sum(ae.get_error(X_good) * weights_good) / np.sum(weights_good)

    print 'Feature group', g
    print 'Mean field estimation error: %.2e' % mean_error
    print 'AE error: %.2e' % AE_error

    ### reconstruction error relative to the baseline
    log_E_good = np.log(ae.get_error(X_good) / mean_error)
    log_E_bad = np.log(ae.get_error(X_bad) / mean_error)

    cut = np.percentile(log_E_good, q=95)

    plot_hist(
        [log_E_good, log_E_bad], [weights_good, weights_bad],
        labels=['Good lumisections', 'Bad lumisections'],
        xlabel='$\log E_{\mathrm{reconstruction}}$',
        title='Reconstruction error for %s %s' % g,
        vline=cut
    )

    well_approximated_bad = log_E_bad < cut
    badly_approximated_bad = log_E_bad >= cut

    ### one-class SVM on the autoencoder codes of good lumisections
    svm = OneClassSVM(nu=0.1, cache_size=128, gamma=2.0 / X_good.shape[1])
    svm.fit(ae.encode(X_good), sample_weight=weights_good)

    score_good = svm.decision_function(ae.encode(X_good))[:, 0]
    score_bad = svm.decision_function(ae.encode(X_bad[well_approximated_bad]))[:, 0]
    score_badly_bad = svm.decision_function(ae.encode(X_bad[badly_approximated_bad]))[:, 0]

    plot_hist(
        [score_good, score_bad, score_badly_bad],
        [weights_good, weights_bad[well_approximated_bad], weights_bad[badly_approximated_bad]],
        labels=['Good lumisections', 'Well reconstructed bad lumisections', 'Poorly reconstructed bad lumisections'],
        title='Good lumisection support estimation %s %s' % g,
        xlabel="distance to the $\\nu$-SVM's decision function",
        legend_loc='upper left'
    )
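Reading the cell above: the baseline mean_error is the luminosity-weighted scatter of the good lumisections around their luminosity-weighted mean, $E_{\mathrm{mean}} = \sum_i w_i \|x_i - \bar{x}\|^2 / \sum_i w_i$ with $\bar{x} = \sum_i w_i x_i / \sum_i w_i$, and the histograms show $\log(E_{\mathrm{AE}} / E_{\mathrm{mean}})$, so values below zero mean the autoencoder reconstructs a lumisection better than the constant mean predictor. The dashed line marks the 95th percentile of this quantity on good lumisections; bad lumisections above the cut are treated as poorly reconstructed, and the rest are scored by the one-class SVM trained on the codes of good lumisections.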
In [46]:
from sklearn.metrics import roc_curve, auc, roc_auc_score
In [47]:
channels = [('muons', 'muons'), ('photons', 'photons'), ('minibias', 'PF'), ('minibias', 'calo')]
reconstruction_error = np.ndarray(shape=(len(data), len(channels)), dtype='float32')
for i, g in enumerate(channels):
    X = data[grouped[g]].get_values().astype('float32')
    X_good = X[labels == 1.0]
    X_bad = X[labels == 0.0]
    weights_good = lumi[labels == 1.0].astype('float32')
    weights_bad = lumi[labels == 0.0].astype('float32')

    ae = AE(X.shape[1], nums_units=(150, 20))

    for l in ae.fit(X_good, weights_good, n_epoches=256,
                    batch_size=128, learning_rate=1.0,
                    regularization_c=1.0e-4):
        #print np.mean(l)
        pass

    print 'AE for %s is fit' % (g, )

    reconstruction_error[:, i] = ae.get_error(X)
In [48]:
for i, g in enumerate(channels):
    plt.figure(figsize=(10, 10))
    plt.title('ROC AUC of reconstruction error for %s against subsystems.' % (g, ))
    plt.plot([0, 1], [0, 1], '--')
    plt.xlabel('FPR')
    plt.ylabel('TPR')

    for j, sub in enumerate(subsystems):
        fpr, tpr, _ = roc_curve(subsystem_labels[:, j], -reconstruction_error[:, i])
        score = auc(fpr, tpr, reorder=True)
        plt.plot(fpr, tpr, label='against %s: %.2f' % (sub, score))

    plt.legend(loc='lower right')
    plt.show()
In [49]:
aucs = np.ones(shape=(reconstruction_error.shape[1], subsystem_labels.shape[1])) / 2.0

for i in xrange(reconstruction_error.shape[1]):
    for j in xrange(subsystem_labels.shape[1]):
        try:
            aucs[i, j] = roc_auc_score(subsystem_labels[:, j], -reconstruction_error[:, i])
        except ValueError:
            ### only one class present for this subsystem; keep the default 0.5
            pass
In [52]:
plt.figure(figsize=(12, 6))
### fignum=0 makes matshow draw into the current figure instead of opening a new one
plt.matshow(aucs, cmap=plt.cm.viridis, fignum=0)
plt.xticks(np.arange(len(subsystems)), subsystems)
plt.yticks(np.arange(4), [ "%s_%s" % g for g in channels ])
plt.colorbar()
plt.show()
In [ ]: